blob: 39a3baf1a943de5fef99d617928b85df75ea81b3 [file] [log] [blame]
/*
* Copyright (C) 2016-2019 Apple Inc. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#include "config.h"
#include "AirCode.h"
#include "AirGenerate.h"
#include "AirSpecial.h"
#include "AllowMacroScratchRegisterUsage.h"
#include "B3BasicBlockInlines.h"
#include "B3Compilation.h"
#include "B3Procedure.h"
#include "B3PatchpointSpecial.h"
#include "B3PatchpointValue.h"
#include "B3StackmapGenerationParams.h"
#include "CCallHelpers.h"
#include "InitializeThreading.h"
#include "LinkBuffer.h"
#include "ProbeContext.h"
#include "PureNaN.h"
#include <regex>
#include <string>
#include <wtf/DataLog.h>
#include <wtf/Lock.h>
#include <wtf/NumberOfCores.h>
#include <wtf/StdMap.h>
#include <wtf/Threading.h>
#include <wtf/text/StringCommon.h>
// We don't have a NO_RETURN_DUE_TO_EXIT, nor should we. That's ridiculous.
static bool hiddenTruthBecauseNoReturnIsStupid() { return true; }
static void usage()
{
dataLog("Usage: testair [<filter>]\n");
if (hiddenTruthBecauseNoReturnIsStupid())
exit(1);
}
#if ENABLE(B3_JIT)
using namespace JSC;
using namespace JSC::B3::Air;
using JSC::B3::FP;
using JSC::B3::GP;
using JSC::B3::Width;
using JSC::B3::Width8;
using JSC::B3::Width16;
using JSC::B3::Width32;
using JSC::B3::Width64;
namespace {
Lock crashLock;
// Nothing fancy for now; we just use the existing WTF assertion machinery.
#define CHECK(x) do { \
if (!!(x)) \
break; \
crashLock.lock(); \
WTFReportAssertionFailure(__FILE__, __LINE__, WTF_PRETTY_FUNCTION, #x); \
CRASH(); \
} while (false)
std::unique_ptr<B3::Compilation> compile(B3::Procedure& proc)
{
prepareForGeneration(proc.code());
CCallHelpers jit;
generate(proc.code(), jit);
LinkBuffer linkBuffer(jit, nullptr);
return makeUnique<B3::Compilation>(
FINALIZE_CODE(linkBuffer, B3CompilationPtrTag, "testair compilation"), proc.releaseByproducts());
}
template<typename T, typename... Arguments>
T invoke(const B3::Compilation& code, Arguments... arguments)
{
void* executableAddress = untagCFunctionPtr(code.code().executableAddress(), B3CompilationPtrTag);
T (*function)(Arguments...) = bitwise_cast<T(*)(Arguments...)>(executableAddress);
return function(arguments...);
}
template<typename T, typename... Arguments>
T compileAndRun(B3::Procedure& procedure, Arguments... arguments)
{
return invoke<T>(*compile(procedure), arguments...);
}
void testSimple()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(Move, nullptr, Arg::imm(42), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
CHECK(compileAndRun<int>(proc) == 42);
}
// Use this to put a constant into a register without Air being able to see the constant.
template<typename T>
void loadConstantImpl(BasicBlock* block, T value, B3::Air::Opcode move, Tmp tmp, Tmp scratch)
{
static Lock lock;
static StdMap<T, T*>* map; // I'm not messing with HashMap's problems with integers.
LockHolder locker(lock);
if (!map)
map = new StdMap<T, T*>();
if (!map->count(value))
(*map)[value] = new T(value);
T* ptr = (*map)[value];
block->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(ptr)), scratch);
block->append(move, nullptr, Arg::addr(scratch), tmp);
}
template<typename T>
void loadConstant(BasicBlock* block, T value, Tmp tmp)
{
loadConstantImpl(block, value, Move, tmp, tmp);
}
void loadDoubleConstant(BasicBlock* block, double value, Tmp tmp, Tmp scratch)
{
loadConstantImpl<double>(block, value, MoveDouble, tmp, scratch);
}
void testShuffleSimpleSwap()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT2), Arg::widthArg(Width32));
int32_t things[4];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 2);
CHECK(things[2] == 4);
CHECK(things[3] == 3);
}
void testShuffleSimpleShift()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT4), Arg::widthArg(Width32));
int32_t things[5];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 2);
CHECK(things[2] == 3);
CHECK(things[3] == 3);
CHECK(things[4] == 4);
}
void testShuffleLongShift()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
loadConstant(root, 7, Tmp(GPRInfo::regT6));
loadConstant(root, 8, Tmp(GPRInfo::regT7));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT4), Tmp(GPRInfo::regT5), Arg::widthArg(Width32),
Tmp(GPRInfo::regT5), Tmp(GPRInfo::regT6), Arg::widthArg(Width32),
Tmp(GPRInfo::regT6), Tmp(GPRInfo::regT7), Arg::widthArg(Width32));
int32_t things[8];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT6), Arg::addr(base, 6 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT7), Arg::addr(base, 7 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 1);
CHECK(things[2] == 2);
CHECK(things[3] == 3);
CHECK(things[4] == 4);
CHECK(things[5] == 5);
CHECK(things[6] == 6);
CHECK(things[7] == 7);
}
void testShuffleLongShiftBackwards()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
loadConstant(root, 7, Tmp(GPRInfo::regT6));
loadConstant(root, 8, Tmp(GPRInfo::regT7));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT6), Tmp(GPRInfo::regT7), Arg::widthArg(Width32),
Tmp(GPRInfo::regT5), Tmp(GPRInfo::regT6), Arg::widthArg(Width32),
Tmp(GPRInfo::regT4), Tmp(GPRInfo::regT5), Arg::widthArg(Width32),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32));
int32_t things[8];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT6), Arg::addr(base, 6 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT7), Arg::addr(base, 7 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 1);
CHECK(things[2] == 2);
CHECK(things[3] == 3);
CHECK(things[4] == 4);
CHECK(things[5] == 5);
CHECK(things[6] == 6);
CHECK(things[7] == 7);
}
void testShuffleSimpleRotate()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT0), Arg::widthArg(Width32));
int32_t things[4];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 3);
CHECK(things[1] == 1);
CHECK(things[2] == 2);
CHECK(things[3] == 4);
}
void testShuffleSimpleBroadcast()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT3), Arg::widthArg(Width32));
int32_t things[4];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 1);
CHECK(things[2] == 1);
CHECK(things[3] == 1);
}
void testShuffleBroadcastAllRegs()
{
B3::Procedure proc;
Code& code = proc.code();
const Vector<Reg>& regs = code.regsInPriorityOrder(GP);
BasicBlock* root = code.addBlock();
root->append(Move, nullptr, Arg::imm(35), Tmp(GPRInfo::regT0));
unsigned count = 1;
for (Reg reg : regs) {
if (reg != Reg(GPRInfo::regT0))
loadConstant(root, count++, Tmp(reg));
}
Inst& shuffle = root->append(Shuffle, nullptr);
for (Reg reg : regs) {
if (reg != Reg(GPRInfo::regT0))
shuffle.append(Tmp(GPRInfo::regT0), Tmp(reg), Arg::widthArg(Width32));
}
StackSlot* slot = code.addStackSlot(sizeof(int32_t) * regs.size(), StackSlotKind::Locked);
for (unsigned i = 0; i < regs.size(); ++i)
root->append(Move32, nullptr, Tmp(regs[i]), Arg::stack(slot, i * sizeof(int32_t)));
Vector<int32_t> things(regs.size(), 666);
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things[0])), base);
for (unsigned i = 0; i < regs.size(); ++i) {
root->append(Move32, nullptr, Arg::stack(slot, i * sizeof(int32_t)), Tmp(GPRInfo::regT0));
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, i * sizeof(int32_t)));
}
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
CHECK(!compileAndRun<int>(proc));
for (int32_t thing : things)
CHECK(thing == 35);
}
void testShuffleTreeShift()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
loadConstant(root, 7, Tmp(GPRInfo::regT6));
loadConstant(root, 8, Tmp(GPRInfo::regT7));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT5), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT6), Arg::widthArg(Width32),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT7), Arg::widthArg(Width32));
int32_t things[8];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT6), Arg::addr(base, 6 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT7), Arg::addr(base, 7 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 1);
CHECK(things[2] == 1);
CHECK(things[3] == 2);
CHECK(things[4] == 2);
CHECK(things[5] == 3);
CHECK(things[6] == 3);
CHECK(things[7] == 4);
}
void testShuffleTreeShiftBackward()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
loadConstant(root, 7, Tmp(GPRInfo::regT6));
loadConstant(root, 8, Tmp(GPRInfo::regT7));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT7), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT6), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT5), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32));
int32_t things[8];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT6), Arg::addr(base, 6 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT7), Arg::addr(base, 7 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 1);
CHECK(things[2] == 1);
CHECK(things[3] == 2);
CHECK(things[4] == 2);
CHECK(things[5] == 3);
CHECK(things[6] == 3);
CHECK(things[7] == 4);
}
void testShuffleTreeShiftOtherBackward()
{
// NOTE: This test was my original attempt at TreeShiftBackward but mistakes were made. So, this
// ends up being just a weird test. But weird tests are useful, so I kept it.
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
loadConstant(root, 7, Tmp(GPRInfo::regT6));
loadConstant(root, 8, Tmp(GPRInfo::regT7));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT4), Tmp(GPRInfo::regT7), Arg::widthArg(Width32),
Tmp(GPRInfo::regT5), Tmp(GPRInfo::regT6), Arg::widthArg(Width32),
Tmp(GPRInfo::regT5), Tmp(GPRInfo::regT5), Arg::widthArg(Width32),
Tmp(GPRInfo::regT6), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT6), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT7), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT7), Tmp(GPRInfo::regT1), Arg::widthArg(Width32));
int32_t things[8];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT6), Arg::addr(base, 6 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT7), Arg::addr(base, 7 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 8);
CHECK(things[2] == 8);
CHECK(things[3] == 7);
CHECK(things[4] == 7);
CHECK(things[5] == 6);
CHECK(things[6] == 6);
CHECK(things[7] == 5);
}
void testShuffleMultipleShifts()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT5), Arg::widthArg(Width32));
int32_t things[6];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 1);
CHECK(things[2] == 3);
CHECK(things[3] == 3);
CHECK(things[4] == 3);
CHECK(things[5] == 1);
}
void testShuffleRotateWithFringe()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT0), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT5), Arg::widthArg(Width32));
int32_t things[6];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 3);
CHECK(things[1] == 1);
CHECK(things[2] == 2);
CHECK(things[3] == 1);
CHECK(things[4] == 2);
CHECK(things[5] == 3);
}
void testShuffleRotateWithFringeInWeirdOrder()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT0), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT5), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT2), Arg::widthArg(Width32));
int32_t things[6];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 3);
CHECK(things[1] == 1);
CHECK(things[2] == 2);
CHECK(things[3] == 1);
CHECK(things[4] == 2);
CHECK(things[5] == 3);
}
void testShuffleRotateWithLongFringe()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT0), Arg::widthArg(Width32),
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT4), Tmp(GPRInfo::regT5), Arg::widthArg(Width32));
int32_t things[6];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 3);
CHECK(things[1] == 1);
CHECK(things[2] == 2);
CHECK(things[3] == 1);
CHECK(things[4] == 4);
CHECK(things[5] == 5);
}
void testShuffleMultipleRotates()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT0), Arg::widthArg(Width32),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT4), Tmp(GPRInfo::regT5), Arg::widthArg(Width32),
Tmp(GPRInfo::regT5), Tmp(GPRInfo::regT3), Arg::widthArg(Width32));
int32_t things[6];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 3);
CHECK(things[1] == 1);
CHECK(things[2] == 2);
CHECK(things[3] == 6);
CHECK(things[4] == 4);
CHECK(things[5] == 5);
}
void testShuffleShiftAndRotate()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
loadConstant(root, 4, Tmp(GPRInfo::regT3));
loadConstant(root, 5, Tmp(GPRInfo::regT4));
loadConstant(root, 6, Tmp(GPRInfo::regT5));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Tmp(GPRInfo::regT2), Arg::widthArg(Width32),
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT0), Arg::widthArg(Width32),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT4), Arg::widthArg(Width32),
Tmp(GPRInfo::regT4), Tmp(GPRInfo::regT5), Arg::widthArg(Width32));
int32_t things[6];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT5), Arg::addr(base, 5 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 3);
CHECK(things[1] == 1);
CHECK(things[2] == 2);
CHECK(things[3] == 4);
CHECK(things[4] == 4);
CHECK(things[5] == 5);
}
void testShuffleShiftAllRegs()
{
B3::Procedure proc;
Code& code = proc.code();
const Vector<Reg>& regs = code.regsInPriorityOrder(GP);
BasicBlock* root = code.addBlock();
for (unsigned i = 0; i < regs.size(); ++i)
loadConstant(root, 35 + i, Tmp(regs[i]));
Inst& shuffle = root->append(Shuffle, nullptr);
for (unsigned i = 1; i < regs.size(); ++i)
shuffle.append(Tmp(regs[i - 1]), Tmp(regs[i]), Arg::widthArg(Width32));
StackSlot* slot = code.addStackSlot(sizeof(int32_t) * regs.size(), StackSlotKind::Locked);
for (unsigned i = 0; i < regs.size(); ++i)
root->append(Move32, nullptr, Tmp(regs[i]), Arg::stack(slot, i * sizeof(int32_t)));
Vector<int32_t> things(regs.size(), 666);
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things[0])), base);
for (unsigned i = 0; i < regs.size(); ++i) {
root->append(Move32, nullptr, Arg::stack(slot, i * sizeof(int32_t)), Tmp(GPRInfo::regT0));
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, i * sizeof(int32_t)));
}
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 35);
for (unsigned i = 1; i < regs.size(); ++i)
CHECK(things[i] == 35 + static_cast<int32_t>(i) - 1);
}
void testShuffleRotateAllRegs()
{
B3::Procedure proc;
Code& code = proc.code();
const Vector<Reg>& regs = code.regsInPriorityOrder(GP);
BasicBlock* root = code.addBlock();
for (unsigned i = 0; i < regs.size(); ++i)
loadConstant(root, 35 + i, Tmp(regs[i]));
Inst& shuffle = root->append(Shuffle, nullptr);
for (unsigned i = 1; i < regs.size(); ++i)
shuffle.append(Tmp(regs[i - 1]), Tmp(regs[i]), Arg::widthArg(Width32));
shuffle.append(Tmp(regs.last()), Tmp(regs[0]), Arg::widthArg(Width32));
StackSlot* slot = code.addStackSlot(sizeof(int32_t) * regs.size(), StackSlotKind::Locked);
for (unsigned i = 0; i < regs.size(); ++i)
root->append(Move32, nullptr, Tmp(regs[i]), Arg::stack(slot, i * sizeof(int32_t)));
Vector<int32_t> things(regs.size(), 666);
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things[0])), base);
for (unsigned i = 0; i < regs.size(); ++i) {
root->append(Move32, nullptr, Arg::stack(slot, i * sizeof(int32_t)), Tmp(GPRInfo::regT0));
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, i * sizeof(int32_t)));
}
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 35 + static_cast<int32_t>(regs.size()) - 1);
for (unsigned i = 1; i < regs.size(); ++i)
CHECK(things[i] == 35 + static_cast<int32_t>(i) - 1);
}
void testShuffleSimpleSwap64()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 10000000000000000ll, Tmp(GPRInfo::regT0));
loadConstant(root, 20000000000000000ll, Tmp(GPRInfo::regT1));
loadConstant(root, 30000000000000000ll, Tmp(GPRInfo::regT2));
loadConstant(root, 40000000000000000ll, Tmp(GPRInfo::regT3));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT3), Arg::widthArg(Width64),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT2), Arg::widthArg(Width64));
int64_t things[4];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int64_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 10000000000000000ll);
CHECK(things[1] == 20000000000000000ll);
CHECK(things[2] == 40000000000000000ll);
CHECK(things[3] == 30000000000000000ll);
}
void testShuffleSimpleShift64()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 10000000000000000ll, Tmp(GPRInfo::regT0));
loadConstant(root, 20000000000000000ll, Tmp(GPRInfo::regT1));
loadConstant(root, 30000000000000000ll, Tmp(GPRInfo::regT2));
loadConstant(root, 40000000000000000ll, Tmp(GPRInfo::regT3));
loadConstant(root, 50000000000000000ll, Tmp(GPRInfo::regT4));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT3), Arg::widthArg(Width64),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT4), Arg::widthArg(Width64));
int64_t things[5];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int64_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 10000000000000000ll);
CHECK(things[1] == 20000000000000000ll);
CHECK(things[2] == 30000000000000000ll);
CHECK(things[3] == 30000000000000000ll);
CHECK(things[4] == 40000000000000000ll);
}
void testShuffleSwapMixedWidth()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 10000000000000000ll, Tmp(GPRInfo::regT0));
loadConstant(root, 20000000000000000ll, Tmp(GPRInfo::regT1));
loadConstant(root, 30000000000000000ll, Tmp(GPRInfo::regT2));
loadConstant(root, 40000000000000000ll, Tmp(GPRInfo::regT3));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT3), Arg::widthArg(Width32),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT2), Arg::widthArg(Width64));
int64_t things[4];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int64_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 10000000000000000ll);
CHECK(things[1] == 20000000000000000ll);
CHECK(things[2] == 40000000000000000ll);
CHECK(things[3] == static_cast<uint32_t>(30000000000000000ll));
}
void testShuffleShiftMixedWidth()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadConstant(root, 10000000000000000ll, Tmp(GPRInfo::regT0));
loadConstant(root, 20000000000000000ll, Tmp(GPRInfo::regT1));
loadConstant(root, 30000000000000000ll, Tmp(GPRInfo::regT2));
loadConstant(root, 40000000000000000ll, Tmp(GPRInfo::regT3));
loadConstant(root, 50000000000000000ll, Tmp(GPRInfo::regT4));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT2), Tmp(GPRInfo::regT3), Arg::widthArg(Width64),
Tmp(GPRInfo::regT3), Tmp(GPRInfo::regT4), Arg::widthArg(Width32));
int64_t things[5];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT3), Arg::addr(base, 3 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT4), Arg::addr(base, 4 * sizeof(int64_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 10000000000000000ll);
CHECK(things[1] == 20000000000000000ll);
CHECK(things[2] == 30000000000000000ll);
CHECK(things[3] == 30000000000000000ll);
CHECK(things[4] == static_cast<uint32_t>(40000000000000000ll));
}
void testShuffleShiftMemory()
{
B3::Procedure proc;
Code& code = proc.code();
int32_t memory[2];
memory[0] = 35;
memory[1] = 36;
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT2));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT2), 0 * sizeof(int32_t)),
Arg::addr(Tmp(GPRInfo::regT2), 1 * sizeof(int32_t)), Arg::widthArg(Width32));
int32_t things[2];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 1);
CHECK(memory[0] == 35);
CHECK(memory[1] == 35);
}
void testShuffleShiftMemoryLong()
{
B3::Procedure proc;
Code& code = proc.code();
int32_t memory[2];
memory[0] = 35;
memory[1] = 36;
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
loadConstant(root, 3, Tmp(GPRInfo::regT2));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT3));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Arg::addr(Tmp(GPRInfo::regT3), 0 * sizeof(int32_t)),
Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT3), 0 * sizeof(int32_t)),
Arg::addr(Tmp(GPRInfo::regT3), 1 * sizeof(int32_t)), Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT3), 1 * sizeof(int32_t)), Tmp(GPRInfo::regT2),
Arg::widthArg(Width32));
int32_t things[3];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT2), Arg::addr(base, 2 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 1);
CHECK(things[2] == 36);
CHECK(memory[0] == 2);
CHECK(memory[1] == 35);
}
void testShuffleShiftMemoryAllRegs()
{
B3::Procedure proc;
Code& code = proc.code();
int32_t memory[2];
memory[0] = 35;
memory[1] = 36;
Vector<Reg> regs = code.regsInPriorityOrder(GP);
regs.removeFirst(Reg(GPRInfo::regT0));
BasicBlock* root = code.addBlock();
for (unsigned i = 0; i < regs.size(); ++i)
loadConstant(root, i + 1, Tmp(regs[i]));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT0));
Inst& shuffle = root->append(
Shuffle, nullptr,
Tmp(regs[0]), Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int32_t)),
Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int32_t)),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int32_t)), Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int32_t)), Tmp(regs[1]),
Arg::widthArg(Width32));
for (unsigned i = 2; i < regs.size(); ++i)
shuffle.append(Tmp(regs[i - 1]), Tmp(regs[i]), Arg::widthArg(Width32));
Vector<int32_t> things(regs.size(), 666);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things[0])), Tmp(GPRInfo::regT0));
for (unsigned i = 0; i < regs.size(); ++i) {
root->append(
Move32, nullptr, Tmp(regs[i]), Arg::addr(Tmp(GPRInfo::regT0), i * sizeof(int32_t)));
}
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 36);
for (unsigned i = 2; i < regs.size(); ++i)
CHECK(things[i] == static_cast<int32_t>(i));
CHECK(memory[0] == 1);
CHECK(memory[1] == 35);
}
void testShuffleShiftMemoryAllRegs64()
{
B3::Procedure proc;
Code& code = proc.code();
int64_t memory[2];
memory[0] = 35000000000000ll;
memory[1] = 36000000000000ll;
Vector<Reg> regs = code.regsInPriorityOrder(GP);
regs.removeFirst(Reg(GPRInfo::regT0));
BasicBlock* root = code.addBlock();
for (unsigned i = 0; i < regs.size(); ++i)
loadConstant(root, (i + 1) * 1000000000000ll, Tmp(regs[i]));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT0));
Inst& shuffle = root->append(
Shuffle, nullptr,
Tmp(regs[0]), Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int64_t)),
Arg::widthArg(Width64),
Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int64_t)),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int64_t)), Arg::widthArg(Width64),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int64_t)), Tmp(regs[1]),
Arg::widthArg(Width64));
for (unsigned i = 2; i < regs.size(); ++i)
shuffle.append(Tmp(regs[i - 1]), Tmp(regs[i]), Arg::widthArg(Width64));
Vector<int64_t> things(regs.size(), 666);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things[0])), Tmp(GPRInfo::regT0));
for (unsigned i = 0; i < regs.size(); ++i) {
root->append(
Move, nullptr, Tmp(regs[i]), Arg::addr(Tmp(GPRInfo::regT0), i * sizeof(int64_t)));
}
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1000000000000ll);
CHECK(things[1] == 36000000000000ll);
for (unsigned i = 2; i < regs.size(); ++i)
CHECK(things[i] == static_cast<int64_t>(i) * 1000000000000ll);
CHECK(memory[0] == 1000000000000ll);
CHECK(memory[1] == 35000000000000ll);
}
int64_t combineHiLo(int64_t high, int64_t low)
{
union {
int64_t value;
int32_t halves[2];
} u;
u.value = high;
u.halves[0] = static_cast<int32_t>(low);
return u.value;
}
void testShuffleShiftMemoryAllRegsMixedWidth()
{
B3::Procedure proc;
Code& code = proc.code();
int64_t memory[2];
memory[0] = 35000000000000ll;
memory[1] = 36000000000000ll;
Vector<Reg> regs = code.regsInPriorityOrder(GP);
regs.removeFirst(Reg(GPRInfo::regT0));
BasicBlock* root = code.addBlock();
for (unsigned i = 0; i < regs.size(); ++i)
loadConstant(root, (i + 1) * 1000000000000ll, Tmp(regs[i]));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT0));
Inst& shuffle = root->append(
Shuffle, nullptr,
Tmp(regs[0]), Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int64_t)),
Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int64_t)),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int64_t)), Arg::widthArg(Width64),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int64_t)), Tmp(regs[1]),
Arg::widthArg(Width32));
for (unsigned i = 2; i < regs.size(); ++i) {
shuffle.append(
Tmp(regs[i - 1]), Tmp(regs[i]),
(i & 1) ? Arg::widthArg(Width32) : Arg::widthArg(Width64));
}
Vector<int64_t> things(regs.size(), 666);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things[0])), Tmp(GPRInfo::regT0));
for (unsigned i = 0; i < regs.size(); ++i) {
root->append(
Move, nullptr, Tmp(regs[i]), Arg::addr(Tmp(GPRInfo::regT0), i * sizeof(int64_t)));
}
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1000000000000ll);
CHECK(things[1] == static_cast<uint32_t>(36000000000000ll));
for (unsigned i = 2; i < regs.size(); ++i) {
int64_t value = static_cast<int64_t>(i) * 1000000000000ll;
CHECK(things[i] == ((i & 1) ? static_cast<uint32_t>(value) : value));
}
CHECK(memory[0] == combineHiLo(35000000000000ll, 1000000000000ll));
CHECK(memory[1] == 35000000000000ll);
}
void testShuffleRotateMemory()
{
B3::Procedure proc;
Code& code = proc.code();
int32_t memory[2];
memory[0] = 35;
memory[1] = 36;
BasicBlock* root = code.addBlock();
loadConstant(root, 1, Tmp(GPRInfo::regT0));
loadConstant(root, 2, Tmp(GPRInfo::regT1));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT2));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Arg::addr(Tmp(GPRInfo::regT2), 0 * sizeof(int32_t)),
Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT2), 0 * sizeof(int32_t)),
Arg::addr(Tmp(GPRInfo::regT2), 1 * sizeof(int32_t)), Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT2), 1 * sizeof(int32_t)), Tmp(GPRInfo::regT0),
Arg::widthArg(Width32));
int32_t things[2];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move32, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int32_t)));
root->append(Move32, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int32_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 36);
CHECK(things[1] == 1);
CHECK(memory[0] == 2);
CHECK(memory[1] == 35);
}
void testShuffleRotateMemory64()
{
B3::Procedure proc;
Code& code = proc.code();
int64_t memory[2];
memory[0] = 35000000000000ll;
memory[1] = 36000000000000ll;
BasicBlock* root = code.addBlock();
loadConstant(root, 1000000000000ll, Tmp(GPRInfo::regT0));
loadConstant(root, 2000000000000ll, Tmp(GPRInfo::regT1));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT2));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width64),
Tmp(GPRInfo::regT1), Arg::addr(Tmp(GPRInfo::regT2), 0 * sizeof(int64_t)),
Arg::widthArg(Width64),
Arg::addr(Tmp(GPRInfo::regT2), 0 * sizeof(int64_t)),
Arg::addr(Tmp(GPRInfo::regT2), 1 * sizeof(int64_t)), Arg::widthArg(Width64),
Arg::addr(Tmp(GPRInfo::regT2), 1 * sizeof(int64_t)), Tmp(GPRInfo::regT0),
Arg::widthArg(Width64));
int64_t things[2];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int64_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 36000000000000ll);
CHECK(things[1] == 1000000000000ll);
CHECK(memory[0] == 2000000000000ll);
CHECK(memory[1] == 35000000000000ll);
}
void testShuffleRotateMemoryMixedWidth()
{
B3::Procedure proc;
Code& code = proc.code();
int64_t memory[2];
memory[0] = 35000000000000ll;
memory[1] = 36000000000000ll;
BasicBlock* root = code.addBlock();
loadConstant(root, 1000000000000ll, Tmp(GPRInfo::regT0));
loadConstant(root, 2000000000000ll, Tmp(GPRInfo::regT1));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT2));
root->append(
Shuffle, nullptr,
Tmp(GPRInfo::regT0), Tmp(GPRInfo::regT1), Arg::widthArg(Width32),
Tmp(GPRInfo::regT1), Arg::addr(Tmp(GPRInfo::regT2), 0 * sizeof(int64_t)),
Arg::widthArg(Width64),
Arg::addr(Tmp(GPRInfo::regT2), 0 * sizeof(int64_t)),
Arg::addr(Tmp(GPRInfo::regT2), 1 * sizeof(int64_t)), Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT2), 1 * sizeof(int64_t)), Tmp(GPRInfo::regT0),
Arg::widthArg(Width64));
int64_t things[2];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(Move, nullptr, Tmp(GPRInfo::regT0), Arg::addr(base, 0 * sizeof(int64_t)));
root->append(Move, nullptr, Tmp(GPRInfo::regT1), Arg::addr(base, 1 * sizeof(int64_t)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 36000000000000ll);
CHECK(things[1] == static_cast<uint32_t>(1000000000000ll));
CHECK(memory[0] == 2000000000000ll);
CHECK(memory[1] == combineHiLo(36000000000000ll, 35000000000000ll));
}
void testShuffleRotateMemoryAllRegs64()
{
B3::Procedure proc;
Code& code = proc.code();
int64_t memory[2];
memory[0] = 35000000000000ll;
memory[1] = 36000000000000ll;
Vector<Reg> regs = code.regsInPriorityOrder(GP);
regs.removeFirst(Reg(GPRInfo::regT0));
BasicBlock* root = code.addBlock();
for (unsigned i = 0; i < regs.size(); ++i)
loadConstant(root, (i + 1) * 1000000000000ll, Tmp(regs[i]));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT0));
Inst& shuffle = root->append(
Shuffle, nullptr,
Tmp(regs[0]), Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int64_t)),
Arg::widthArg(Width64),
Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int64_t)),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int64_t)), Arg::widthArg(Width64),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int64_t)), Tmp(regs[1]),
Arg::widthArg(Width64),
regs.last(), regs[0], Arg::widthArg(Width64));
for (unsigned i = 2; i < regs.size(); ++i)
shuffle.append(Tmp(regs[i - 1]), Tmp(regs[i]), Arg::widthArg(Width64));
Vector<int64_t> things(regs.size(), 666);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things[0])), Tmp(GPRInfo::regT0));
for (unsigned i = 0; i < regs.size(); ++i) {
root->append(
Move, nullptr, Tmp(regs[i]), Arg::addr(Tmp(GPRInfo::regT0), i * sizeof(int64_t)));
}
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == static_cast<int64_t>(regs.size()) * 1000000000000ll);
CHECK(things[1] == 36000000000000ll);
for (unsigned i = 2; i < regs.size(); ++i)
CHECK(things[i] == static_cast<int64_t>(i) * 1000000000000ll);
CHECK(memory[0] == 1000000000000ll);
CHECK(memory[1] == 35000000000000ll);
}
void testShuffleRotateMemoryAllRegsMixedWidth()
{
B3::Procedure proc;
Code& code = proc.code();
int64_t memory[2];
memory[0] = 35000000000000ll;
memory[1] = 36000000000000ll;
Vector<Reg> regs = code.regsInPriorityOrder(GP);
regs.removeFirst(Reg(GPRInfo::regT0));
BasicBlock* root = code.addBlock();
for (unsigned i = 0; i < regs.size(); ++i)
loadConstant(root, (i + 1) * 1000000000000ll, Tmp(regs[i]));
root->append(Move, nullptr, Arg::immPtr(&memory), Tmp(GPRInfo::regT0));
Inst& shuffle = root->append(
Shuffle, nullptr,
Tmp(regs[0]), Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int64_t)),
Arg::widthArg(Width32),
Arg::addr(Tmp(GPRInfo::regT0), 0 * sizeof(int64_t)),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int64_t)), Arg::widthArg(Width64),
Arg::addr(Tmp(GPRInfo::regT0), 1 * sizeof(int64_t)), Tmp(regs[1]),
Arg::widthArg(Width32),
regs.last(), regs[0], Arg::widthArg(Width32));
for (unsigned i = 2; i < regs.size(); ++i)
shuffle.append(Tmp(regs[i - 1]), Tmp(regs[i]), Arg::widthArg(Width64));
Vector<int64_t> things(regs.size(), 666);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things[0])), Tmp(GPRInfo::regT0));
for (unsigned i = 0; i < regs.size(); ++i) {
root->append(
Move, nullptr, Tmp(regs[i]), Arg::addr(Tmp(GPRInfo::regT0), i * sizeof(int64_t)));
}
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == static_cast<uint32_t>(static_cast<int64_t>(regs.size()) * 1000000000000ll));
CHECK(things[1] == static_cast<uint32_t>(36000000000000ll));
for (unsigned i = 2; i < regs.size(); ++i)
CHECK(things[i] == static_cast<int64_t>(i) * 1000000000000ll);
CHECK(memory[0] == combineHiLo(35000000000000ll, 1000000000000ll));
CHECK(memory[1] == 35000000000000ll);
}
void testShuffleSwapDouble()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadDoubleConstant(root, 1, Tmp(FPRInfo::fpRegT0), Tmp(GPRInfo::regT0));
loadDoubleConstant(root, 2, Tmp(FPRInfo::fpRegT1), Tmp(GPRInfo::regT0));
loadDoubleConstant(root, 3, Tmp(FPRInfo::fpRegT2), Tmp(GPRInfo::regT0));
loadDoubleConstant(root, 4, Tmp(FPRInfo::fpRegT3), Tmp(GPRInfo::regT0));
root->append(
Shuffle, nullptr,
Tmp(FPRInfo::fpRegT2), Tmp(FPRInfo::fpRegT3), Arg::widthArg(Width64),
Tmp(FPRInfo::fpRegT3), Tmp(FPRInfo::fpRegT2), Arg::widthArg(Width64));
double things[4];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(MoveDouble, nullptr, Tmp(FPRInfo::fpRegT0), Arg::addr(base, 0 * sizeof(double)));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::fpRegT1), Arg::addr(base, 1 * sizeof(double)));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::fpRegT2), Arg::addr(base, 2 * sizeof(double)));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::fpRegT3), Arg::addr(base, 3 * sizeof(double)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 2);
CHECK(things[2] == 4);
CHECK(things[3] == 3);
}
void testShuffleShiftDouble()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
loadDoubleConstant(root, 1, Tmp(FPRInfo::fpRegT0), Tmp(GPRInfo::regT0));
loadDoubleConstant(root, 2, Tmp(FPRInfo::fpRegT1), Tmp(GPRInfo::regT0));
loadDoubleConstant(root, 3, Tmp(FPRInfo::fpRegT2), Tmp(GPRInfo::regT0));
loadDoubleConstant(root, 4, Tmp(FPRInfo::fpRegT3), Tmp(GPRInfo::regT0));
root->append(
Shuffle, nullptr,
Tmp(FPRInfo::fpRegT2), Tmp(FPRInfo::fpRegT3), Arg::widthArg(Width64));
double things[4];
Tmp base = code.newTmp(GP);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
root->append(MoveDouble, nullptr, Tmp(FPRInfo::fpRegT0), Arg::addr(base, 0 * sizeof(double)));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::fpRegT1), Arg::addr(base, 1 * sizeof(double)));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::fpRegT2), Arg::addr(base, 2 * sizeof(double)));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::fpRegT3), Arg::addr(base, 3 * sizeof(double)));
root->append(Move, nullptr, Arg::imm(0), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
memset(things, 0, sizeof(things));
CHECK(!compileAndRun<int>(proc));
CHECK(things[0] == 1);
CHECK(things[1] == 2);
CHECK(things[2] == 3);
CHECK(things[3] == 3);
}
#if CPU(X86) || CPU(X86_64)
void testX86VMULSD()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(MulDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Tmp(FPRInfo::argumentFPR1), Tmp(FPRInfo::argumentFPR2));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::argumentFPR2), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
CHECK(compileAndRun<double>(proc, 2.4, 4.2, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDDestRex()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(MulDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Tmp(FPRInfo::argumentFPR1), Tmp(X86Registers::xmm15));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm15), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
CHECK(compileAndRun<double>(proc, 2.4, 4.2, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDOp1DestRex()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(MoveDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Tmp(X86Registers::xmm14));
root->append(MulDouble, nullptr, Tmp(X86Registers::xmm14), Tmp(FPRInfo::argumentFPR1), Tmp(X86Registers::xmm15));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm15), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
CHECK(compileAndRun<double>(proc, 2.4, 4.2, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDOp2DestRex()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(MoveDouble, nullptr, Tmp(FPRInfo::argumentFPR1), Tmp(X86Registers::xmm14));
root->append(MulDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Tmp(X86Registers::xmm14), Tmp(X86Registers::xmm15));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm15), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
CHECK(compileAndRun<double>(proc, 2.4, 4.2, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDOpsDestRex()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(MoveDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Tmp(X86Registers::xmm14));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::argumentFPR1), Tmp(X86Registers::xmm13));
root->append(MulDouble, nullptr, Tmp(X86Registers::xmm14), Tmp(X86Registers::xmm13), Tmp(X86Registers::xmm15));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm15), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
CHECK(compileAndRun<double>(proc, 2.4, 4.2, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDAddr()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(MulDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Arg::addr(Tmp(GPRInfo::argumentGPR0), - 16), Tmp(FPRInfo::argumentFPR2));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::argumentFPR2), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
double secondArg = 4.2;
CHECK(compileAndRun<double>(proc, 2.4, &secondArg + 2, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDAddrOpRexAddr()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(Move, nullptr, Tmp(GPRInfo::argumentGPR0), Tmp(X86Registers::r13));
root->append(MulDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Arg::addr(Tmp(X86Registers::r13), - 16), Tmp(FPRInfo::argumentFPR2));
root->append(MoveDouble, nullptr, Tmp(FPRInfo::argumentFPR2), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
double secondArg = 4.2;
CHECK(compileAndRun<double>(proc, 2.4, &secondArg + 2, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDDestRexAddr()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(MulDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Arg::addr(Tmp(GPRInfo::argumentGPR0), 16), Tmp(X86Registers::xmm15));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm15), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
double secondArg = 4.2;
CHECK(compileAndRun<double>(proc, 2.4, &secondArg - 2, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDRegOpDestRexAddr()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(MoveDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Tmp(X86Registers::xmm14));
root->append(MulDouble, nullptr, Arg::addr(Tmp(GPRInfo::argumentGPR0)), Tmp(X86Registers::xmm14), Tmp(X86Registers::xmm15));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm15), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
double secondArg = 4.2;
CHECK(compileAndRun<double>(proc, 2.4, &secondArg, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDAddrOpDestRexAddr()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(Move, nullptr, Tmp(GPRInfo::argumentGPR0), Tmp(X86Registers::r13));
root->append(MulDouble, nullptr, Tmp(FPRInfo::argumentFPR0), Arg::addr(Tmp(X86Registers::r13), 8), Tmp(X86Registers::xmm15));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm15), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
double secondArg = 4.2;
CHECK(compileAndRun<double>(proc, 2.4, &secondArg - 1, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDBaseNeedsRex()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(Move, nullptr, Tmp(GPRInfo::argumentGPR0), Tmp(X86Registers::r13));
root->append(MulDouble, nullptr, Arg::index(Tmp(X86Registers::r13), Tmp(GPRInfo::argumentGPR1)), Tmp(FPRInfo::argumentFPR0), Tmp(X86Registers::xmm0));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm0), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
double secondArg = 4.2;
uint64_t index = 8;
CHECK(compileAndRun<double>(proc, 2.4, &secondArg - 1, index, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDIndexNeedsRex()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(Move, nullptr, Tmp(GPRInfo::argumentGPR1), Tmp(X86Registers::r13));
root->append(MulDouble, nullptr, Arg::index(Tmp(GPRInfo::argumentGPR0), Tmp(X86Registers::r13)), Tmp(FPRInfo::argumentFPR0), Tmp(X86Registers::xmm0));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm0), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
double secondArg = 4.2;
uint64_t index = - 8;
CHECK(compileAndRun<double>(proc, 2.4, &secondArg + 1, index, pureNaN()) == 2.4 * 4.2);
}
void testX86VMULSDBaseIndexNeedRex()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
root->append(Move, nullptr, Tmp(GPRInfo::argumentGPR0), Tmp(X86Registers::r12));
root->append(Move, nullptr, Tmp(GPRInfo::argumentGPR1), Tmp(X86Registers::r13));
root->append(MulDouble, nullptr, Arg::index(Tmp(X86Registers::r12), Tmp(X86Registers::r13)), Tmp(FPRInfo::argumentFPR0), Tmp(X86Registers::xmm0));
root->append(MoveDouble, nullptr, Tmp(X86Registers::xmm0), Tmp(FPRInfo::returnValueFPR));
root->append(RetDouble, nullptr, Tmp(FPRInfo::returnValueFPR));
double secondArg = 4.2;
uint64_t index = 16;
CHECK(compileAndRun<double>(proc, 2.4, &secondArg - 2, index, pureNaN()) == 2.4 * 4.2);
}
#endif // #if CPU(X86) || CPU(X86_64)
#if CPU(ARM64)
void testInvalidateCachedTempRegisters()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
int32_t things[4];
things[0] = 0x12000000;
things[1] = 0x340000;
things[2] = 0x5600;
things[3] = 0x78;
Tmp base = code.newTmp(GP);
GPRReg tmp = GPRInfo::regT1;
proc.pinRegister(tmp);
root->append(Move, nullptr, Arg::bigImm(bitwise_cast<intptr_t>(&things)), base);
B3::BasicBlock* patchPoint1Root = proc.addBlock();
B3::Air::Special* patchpointSpecial = code.addSpecial(makeUnique<B3::PatchpointSpecial>());
// In Patchpoint, Load things[0] -> tmp. This will materialize the address in x17 (dataMemoryRegister).
B3::PatchpointValue* patchpoint1 = patchPoint1Root->appendNew<B3::PatchpointValue>(proc, B3::Void, B3::Origin());
patchpoint1->clobber(RegisterSet::macroScratchRegisters());
patchpoint1->setGenerator(
[=] (CCallHelpers& jit, const B3::StackmapGenerationParams&) {
AllowMacroScratchRegisterUsage allowScratch(jit);
jit.load32(&things, tmp);
});
root->append(Patch, patchpoint1, Arg::special(patchpointSpecial));
// Load things[1] -> x17, trashing dataMemoryRegister.
root->append(Move32, nullptr, Arg::addr(base, 1 * sizeof(int32_t)), Tmp(ARM64Registers::x17));
root->append(Add32, nullptr, Tmp(tmp), Tmp(ARM64Registers::x17), Tmp(GPRInfo::returnValueGPR));
// In Patchpoint, Load things[2] -> tmp. This should not reuse the prior contents of x17.
B3::BasicBlock* patchPoint2Root = proc.addBlock();
B3::PatchpointValue* patchpoint2 = patchPoint2Root->appendNew<B3::PatchpointValue>(proc, B3::Void, B3::Origin());
patchpoint2->clobber(RegisterSet::macroScratchRegisters());
patchpoint2->setGenerator(
[=] (CCallHelpers& jit, const B3::StackmapGenerationParams&) {
AllowMacroScratchRegisterUsage allowScratch(jit);
jit.load32(&things[2], tmp);
});
root->append(Patch, patchpoint2, Arg::special(patchpointSpecial));
root->append(Add32, nullptr, Tmp(tmp), Tmp(GPRInfo::returnValueGPR), Tmp(GPRInfo::returnValueGPR));
// In patchpoint, Store 0x78 -> things[3].
// This will use and cache both x16 (dataMemoryRegister) and x17 (dataTempRegister).
B3::BasicBlock* patchPoint3Root = proc.addBlock();
B3::PatchpointValue* patchpoint3 = patchPoint3Root->appendNew<B3::PatchpointValue>(proc, B3::Void, B3::Origin());
patchpoint3->clobber(RegisterSet::macroScratchRegisters());
patchpoint3->setGenerator(
[=] (CCallHelpers& jit, const B3::StackmapGenerationParams&) {
AllowMacroScratchRegisterUsage allowScratch(jit);
jit.store32(CCallHelpers::TrustedImm32(0x78), &things[3]);
});
root->append(Patch, patchpoint3, Arg::special(patchpointSpecial));
// Set x16 to 0xdead, trashing x16.
root->append(Move, nullptr, Arg::bigImm(0xdead), Tmp(ARM64Registers::x16));
root->append(Xor32, nullptr, Tmp(ARM64Registers::x16), Tmp(GPRInfo::returnValueGPR));
// In patchpoint, again Store 0x78 -> things[3].
// This should rematerialize both x16 (dataMemoryRegister) and x17 (dataTempRegister).
B3::BasicBlock* patchPoint4Root = proc.addBlock();
B3::PatchpointValue* patchpoint4 = patchPoint4Root->appendNew<B3::PatchpointValue>(proc, B3::Void, B3::Origin());
patchpoint4->clobber(RegisterSet::macroScratchRegisters());
patchpoint4->setGenerator(
[=] (CCallHelpers& jit, const B3::StackmapGenerationParams&) {
AllowMacroScratchRegisterUsage allowScratch(jit);
jit.store32(CCallHelpers::TrustedImm32(0x78), &things[3]);
});
root->append(Patch, patchpoint4, Arg::special(patchpointSpecial));
root->append(Move, nullptr, Arg::bigImm(0xdead), Tmp(tmp));
root->append(Xor32, nullptr, Tmp(tmp), Tmp(GPRInfo::returnValueGPR));
root->append(Move32, nullptr, Arg::addr(base, 3 * sizeof(int32_t)), Tmp(tmp));
root->append(Add32, nullptr, Tmp(tmp), Tmp(GPRInfo::returnValueGPR), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
int32_t r = compileAndRun<int32_t>(proc);
CHECK(r == 0x12345678);
}
#endif // #if CPU(ARM64)
void testArgumentRegPinned()
{
B3::Procedure proc;
Code& code = proc.code();
GPRReg pinned = GPRInfo::argumentGPR0;
proc.pinRegister(pinned);
B3::Air::Special* patchpointSpecial = code.addSpecial(makeUnique<B3::PatchpointSpecial>());
B3::BasicBlock* b3Root = proc.addBlock();
B3::PatchpointValue* patchpoint = b3Root->appendNew<B3::PatchpointValue>(proc, B3::Void, B3::Origin());
patchpoint->clobber(RegisterSet(pinned));
patchpoint->setGenerator(
[=] (CCallHelpers& jit, const B3::StackmapGenerationParams&) {
jit.move(CCallHelpers::TrustedImm32(42), pinned);
});
BasicBlock* root = code.addBlock();
Tmp t1 = code.newTmp(GP);
Tmp t2 = code.newTmp(GP);
root->append(Move, nullptr, Tmp(pinned), t1);
root->append(Patch, patchpoint, Arg::special(patchpointSpecial));
root->append(Move, nullptr, Tmp(pinned), t2);
root->append(Add32, nullptr, t1, t2, Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
int32_t r = compileAndRun<int32_t>(proc, 10);
CHECK(r == 10 + 42);
}
void testArgumentRegPinned2()
{
B3::Procedure proc;
Code& code = proc.code();
GPRReg pinned = GPRInfo::argumentGPR0;
proc.pinRegister(pinned);
B3::Air::Special* patchpointSpecial = code.addSpecial(makeUnique<B3::PatchpointSpecial>());
B3::BasicBlock* b3Root = proc.addBlock();
B3::PatchpointValue* patchpoint = b3Root->appendNew<B3::PatchpointValue>(proc, B3::Void, B3::Origin());
patchpoint->clobber({ });
patchpoint->setGenerator(
[=] (CCallHelpers& jit, const B3::StackmapGenerationParams&) {
jit.move(CCallHelpers::TrustedImm32(42), pinned);
});
BasicBlock* root = code.addBlock();
Tmp t1 = code.newTmp(GP);
Tmp t2 = code.newTmp(GP);
// Since the patchpoint does not claim to clobber the pinned register,
// the register allocator is allowed to either coalesce the first move,
// the second move, or neither. The allowed results are:
// - No move coalesced: 52
// - The first move is coalesced: 84
// - The second move is coalesced: 52
root->append(Move, nullptr, Tmp(pinned), t1);
root->append(Patch, patchpoint, Arg::special(patchpointSpecial));
root->append(Move, nullptr, Tmp(pinned), t2);
root->append(Add32, nullptr, t1, t2, Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
int32_t r = compileAndRun<int32_t>(proc, 10);
CHECK(r == 52 || r == 84);
}
void testArgumentRegPinned3()
{
B3::Procedure proc;
Code& code = proc.code();
GPRReg pinned = GPRInfo::argumentGPR0;
proc.pinRegister(pinned);
B3::Air::Special* patchpointSpecial = code.addSpecial(makeUnique<B3::PatchpointSpecial>());
B3::BasicBlock* b3Root = proc.addBlock();
B3::PatchpointValue* patchpoint = b3Root->appendNew<B3::PatchpointValue>(proc, B3::Void, B3::Origin());
patchpoint->clobber(RegisterSet(pinned));
patchpoint->setGenerator(
[=] (CCallHelpers& jit, const B3::StackmapGenerationParams&) {
jit.move(CCallHelpers::TrustedImm32(42), pinned);
});
BasicBlock* root = code.addBlock();
Tmp t1 = code.newTmp(GP);
Tmp t2 = code.newTmp(GP);
Tmp t3 = code.newTmp(GP);
root->append(Move, nullptr, Tmp(pinned), t1);
root->append(Patch, patchpoint, Arg::special(patchpointSpecial));
root->append(Move, nullptr, Tmp(pinned), t2);
root->append(Patch, patchpoint, Arg::special(patchpointSpecial));
root->append(Move, nullptr, Tmp(pinned), t3);
root->append(Add32, nullptr, t1, t2, Tmp(GPRInfo::returnValueGPR));
root->append(Add32, nullptr, Tmp(GPRInfo::returnValueGPR), t3, Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
int32_t r = compileAndRun<int32_t>(proc, 10);
CHECK(r == 10 + 42 + 42);
}
void testLea64()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
int64_t a = 0x11223344;
int64_t b = 1 << 13;
root->append(Lea64, nullptr, Arg::addr(Tmp(GPRInfo::argumentGPR0), b), Tmp(GPRInfo::returnValueGPR));
root->append(Ret64, nullptr, Tmp(GPRInfo::returnValueGPR));
int64_t r = compileAndRun<int64_t>(proc, a);
CHECK(r == a + b);
}
void testLea32()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
int32_t a = 0x11223344;
int32_t b = 1 << 13;
root->append(Lea32, nullptr, Arg::addr(Tmp(GPRInfo::argumentGPR0), b), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
int32_t r = compileAndRun<int32_t>(proc, a);
CHECK(r == a + b);
}
inline Vector<String> matchAll(const CString& source, std::regex regex)
{
Vector<String> matches;
std::smatch match;
for (std::string str = source.data(); std::regex_search(str, match, regex); str = match.suffix()) {
ASSERT(match.size() == 1);
matches.append(match[0].str().c_str());
}
return matches;
}
void testElideSimpleMove()
{
for (unsigned tmpCount = 1; tmpCount < 100; tmpCount++) {
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
Tmp tmp = code.newTmp(B3::GP);
root->append(Move, nullptr, Tmp(GPRInfo::argumentGPR0), tmp);
for (unsigned i = 0; i < tmpCount; i++) {
Tmp newTmp = code.newTmp(B3::GP);
root->append(Move, nullptr, tmp, newTmp);
tmp = newTmp;
}
root->append(Move, nullptr, tmp, Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
auto compilation = compile(proc);
CString disassembly = compilation->disassembly();
std::regex findRRMove(isARM64() ? "mov\\s+x\\d+, x\\d+\\n" : "mov %\\w+, %\\w+\\n");
auto result = matchAll(disassembly, findRRMove);
if (isARM64()) {
if (!Options::defaultB3OptLevel())
CHECK(result.size() == 2);
else
CHECK(result.size() == 0);
} else if (isX86()) {
// sp -> fp; arg0 -> ret0; fp -> sp
// fp -> sp only happens in O0 because we don't actually need to move the stack in general.
CHECK(result.size() == 2 + !Options::defaultB3OptLevel());
} else
RELEASE_ASSERT_NOT_REACHED();
}
}
void testElideHandlesEarlyClobber()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
const unsigned tmpCount = RegisterSet::allGPRs().numberOfSetRegisters() * 2;
Vector<Tmp> tmps(tmpCount);
for (unsigned i = 0; i < tmpCount; ++i) {
tmps[i] = code.newTmp(B3::GP);
root->append(Move, nullptr, Arg::imm(i), tmps[i]);
}
RegisterSet registers = RegisterSet::allGPRs();
registers.exclude(RegisterSet::reservedHardwareRegisters());
registers.exclude(RegisterSet::stackRegisters());
Reg firstCalleeSave;
Reg lastCalleeSave;
auto* patch = proc.add<B3::PatchpointValue>(B3::Int32, B3::Origin());
patch->clobberEarly(registers);
for (Reg reg : registers) {
if (!firstCalleeSave)
firstCalleeSave = reg;
lastCalleeSave = reg;
}
ASSERT(firstCalleeSave != lastCalleeSave);
patch->earlyClobbered().clear(firstCalleeSave);
patch->resultConstraints.append({ B3::ValueRep::reg(firstCalleeSave) });
patch->earlyClobbered().clear(lastCalleeSave);
patch->clobber(RegisterSet(lastCalleeSave));
patch->setGenerator([=] (CCallHelpers& jit, const JSC::B3::StackmapGenerationParams&) {
jit.probe([=] (Probe::Context& context) {
for (Reg reg : registers)
context.gpr(reg.gpr()) = 0;
});
});
Inst inst(Patch, patch, Arg::special(code.addSpecial(WTF::makeUnique<JSC::B3::PatchpointSpecial>())));
inst.args.append(Tmp(firstCalleeSave));
root->appendInst(WTFMove(inst));
Tmp result = code.newTmp(B3::GP);
root->append(Move, nullptr, tmps[0], result);
for (Tmp tmp : tmps)
root->append(Add32, nullptr, tmp, result);
root->append(Move, nullptr, result, Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
auto runResult = compileAndRun<uint32_t>(proc);
CHECK(runResult == (tmpCount * (tmpCount - 1)) / 2);
}
void testElideMoveThenRealloc()
{
RegisterSet registers = RegisterSet::allGPRs();
registers.exclude(RegisterSet::stackRegisters());
registers.exclude(RegisterSet::reservedHardwareRegisters());
for (Reg reg : registers) {
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
BasicBlock* taken = code.addBlock();
BasicBlock* notTaken = code.addBlock();
BasicBlock* notTakenReturn = code.addBlock();
BasicBlock* ret = code.addBlock();
BasicBlock* continuation = code.addBlock();
Tmp tmp = code.newTmp(B3::GP);
Arg negOne;
if (isARM64()) {
negOne = code.newTmp(B3::GP);
root->append(Move, nullptr, Arg::bigImm(-1), negOne);
} else if (isX86())
negOne = Arg::bitImm(-1);
else
RELEASE_ASSERT_NOT_REACHED();
{
root->append(Move, nullptr, Arg::imm(1), Tmp(reg));
root->append(BranchTest32, nullptr, Arg::resCond(MacroAssembler::NonZero), Tmp(reg), negOne);
root->setSuccessors(taken, notTaken);
}
{
taken->append(Jump, nullptr);
taken->setSuccessors(continuation);
}
{
notTaken->append(BranchTest32, nullptr, Arg::resCond(MacroAssembler::NonZero), Tmp(reg), negOne);
notTaken->setSuccessors(continuation, notTakenReturn);
}
{
tmp = code.newTmp(B3::GP);
continuation->append(Move, nullptr, Arg::imm(42), tmp);
continuation->append(BranchTest32, nullptr, Arg::resCond(MacroAssembler::NonZero), tmp, negOne);
continuation->setSuccessors(ret, notTakenReturn);
}
{
tmp = code.newTmp(B3::GP);
ret->append(Move, nullptr, Arg::imm(42), tmp);
ret->append(Move, nullptr, tmp, Tmp(reg));
ret->append(Move, nullptr, Tmp(reg), Tmp(GPRInfo::returnValueGPR));
ret->append(Add32, nullptr, Tmp(reg), Tmp(reg));
ret->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
}
{
notTakenReturn->append(Move, nullptr, Tmp(reg), Tmp(GPRInfo::returnValueGPR));
notTakenReturn->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
}
code.resetReachability();
auto runResult = compileAndRun<uint32_t>(proc);
CHECK(runResult == static_cast<unsigned>(42 + (42 * (reg == GPRInfo::returnValueGPR))));
}
}
void testLinearScanSpillRangesLateUse()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
B3::Air::Special* patchpointSpecial = code.addSpecial(makeUnique<B3::PatchpointSpecial>());
Vector<Tmp> tmps;
for (unsigned i = 0; i < 100; ++i) {
Tmp tmp = code.newTmp(GP);
tmps.append(tmp);
root->append(Move, nullptr, Arg::bigImm(i), tmp);
}
for (unsigned i = 0; i + 1 < tmps.size(); ++i) {
Tmp tmp1 = tmps[i];
Tmp tmp2 = tmps[i + 1];
B3::Value* dummyValue = proc.addConstant(B3::Origin(), B3::Int64, 0);
B3::Value* dummyValue2 = proc.addConstant(B3::Origin(), B3::Int64, 0);
B3::PatchpointValue* patchpoint = proc.add<B3::PatchpointValue>(B3::Void, B3::Origin());
patchpoint->append(dummyValue, B3::ValueRep::SomeRegister);
patchpoint->append(dummyValue2, B3::ValueRep::SomeLateRegister);
patchpoint->setGenerator([=] (CCallHelpers& jit, const B3::StackmapGenerationParams& params) {
RELEASE_ASSERT(params[0].gpr() != params[1].gpr());
auto good = jit.branch32(CCallHelpers::Equal, params[0].gpr(), CCallHelpers::TrustedImm32(i));
jit.breakpoint();
good.link(&jit);
good = jit.branch32(CCallHelpers::Equal, params[1].gpr(), CCallHelpers::TrustedImm32(i + 1));
jit.breakpoint();
good.link(&jit);
});
Inst inst(Patch, patchpoint, Arg::special(patchpointSpecial));
inst.args.append(tmp1);
inst.args.append(tmp2);
root->append(inst);
}
root->append(Move32, nullptr, tmps.last(), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
auto runResult = compileAndRun<uint32_t>(proc);
CHECK(runResult == 99);
}
void testLinearScanSpillRangesEarlyDef()
{
B3::Procedure proc;
Code& code = proc.code();
BasicBlock* root = code.addBlock();
B3::Air::Special* patchpointSpecial = code.addSpecial(makeUnique<B3::PatchpointSpecial>());
Vector<Tmp> tmps;
for (unsigned i = 0; i < 100; ++i) {
Tmp tmp = code.newTmp(GP);
tmps.append(tmp);
if (!i)
root->append(Move, nullptr, Arg::bigImm(i), tmp);
}
for (unsigned i = 0; i + 1 < tmps.size(); ++i) {
Tmp tmp1 = tmps[i];
Tmp tmp2 = tmps[i + 1];
B3::Value* dummyValue = proc.addConstant(B3::Origin(), B3::Int64, 0);
B3::PatchpointValue* patchpoint = proc.add<B3::PatchpointValue>(B3::Int32, B3::Origin());
patchpoint->resultConstraints = { B3::ValueRep::SomeEarlyRegister };
patchpoint->append(dummyValue, B3::ValueRep::SomeLateRegister);
patchpoint->setGenerator([=] (CCallHelpers& jit, const B3::StackmapGenerationParams& params) {
RELEASE_ASSERT(params[0].gpr() != params[1].gpr());
auto good = jit.branch32(CCallHelpers::Equal, params[1].gpr(), CCallHelpers::TrustedImm32(i));
jit.breakpoint();
good.link(&jit);
jit.move(CCallHelpers::TrustedImm32(i + 1), params[0].gpr());
});
Inst inst(Patch, patchpoint, Arg::special(patchpointSpecial));
inst.args.append(tmp2); // def
inst.args.append(tmp1); // use
root->append(inst);
}
// Make all tmps live till the end
for (unsigned i = 0; i < tmps.size(); ++i) {
Tmp tmp = tmps[i];
B3::Value* dummyValue = proc.addConstant(B3::Origin(), B3::Int64, 0);
B3::PatchpointValue* patchpoint = proc.add<B3::PatchpointValue>(B3::Void, B3::Origin());
patchpoint->append(dummyValue, B3::ValueRep::SomeRegister);
patchpoint->setGenerator([=] (CCallHelpers& jit, const B3::StackmapGenerationParams& params) {
auto good = jit.branch32(CCallHelpers::Equal, params[0].gpr(), CCallHelpers::TrustedImm32(i));
jit.breakpoint();
good.link(&jit);
});
Inst inst(Patch, patchpoint, Arg::special(patchpointSpecial));
inst.args.append(tmp);
root->append(inst);
}
root->append(Move32, nullptr, tmps.last(), Tmp(GPRInfo::returnValueGPR));
root->append(Ret32, nullptr, Tmp(GPRInfo::returnValueGPR));
auto runResult = compileAndRun<uint32_t>(proc);
CHECK(runResult == 99);
}
#define PREFIX "O", Options::defaultB3OptLevel(), ": "
#define RUN(test) do { \
if (!shouldRun(#test)) \
break; \
tasks.append( \
createSharedTask<void()>( \
[&] () { \
dataLog(PREFIX #test "...\n"); \
test; \
dataLog(PREFIX #test ": OK!\n"); \
})); \
} while (false);
void run(const char* filter)
{
Deque<RefPtr<SharedTask<void()>>> tasks;
auto shouldRun = [&] (const char* testName) -> bool {
return !filter || WTF::findIgnoringASCIICaseWithoutLength(testName, filter) != WTF::notFound;
};
RUN(testSimple());
RUN(testShuffleSimpleSwap());
RUN(testShuffleSimpleShift());
RUN(testShuffleLongShift());
RUN(testShuffleLongShiftBackwards());
RUN(testShuffleSimpleRotate());
RUN(testShuffleSimpleBroadcast());
RUN(testShuffleBroadcastAllRegs());
RUN(testShuffleTreeShift());
RUN(testShuffleTreeShiftBackward());
RUN(testShuffleTreeShiftOtherBackward());
RUN(testShuffleMultipleShifts());
RUN(testShuffleRotateWithFringe());
RUN(testShuffleRotateWithFringeInWeirdOrder());
RUN(testShuffleRotateWithLongFringe());
RUN(testShuffleMultipleRotates());
RUN(testShuffleShiftAndRotate());
RUN(testShuffleShiftAllRegs());
RUN(testShuffleRotateAllRegs());
RUN(testShuffleSimpleSwap64());
RUN(testShuffleSimpleShift64());
RUN(testShuffleSwapMixedWidth());
RUN(testShuffleShiftMixedWidth());
RUN(testShuffleShiftMemory());
RUN(testShuffleShiftMemoryLong());
RUN(testShuffleShiftMemoryAllRegs());
RUN(testShuffleShiftMemoryAllRegs64());
RUN(testShuffleShiftMemoryAllRegsMixedWidth());
RUN(testShuffleRotateMemory());
RUN(testShuffleRotateMemory64());
RUN(testShuffleRotateMemoryMixedWidth());
RUN(testShuffleRotateMemoryAllRegs64());
RUN(testShuffleRotateMemoryAllRegsMixedWidth());
RUN(testShuffleSwapDouble());
RUN(testShuffleShiftDouble());
#if CPU(X86) || CPU(X86_64)
RUN(testX86VMULSD());
RUN(testX86VMULSDDestRex());
RUN(testX86VMULSDOp1DestRex());
RUN(testX86VMULSDOp2DestRex());
RUN(testX86VMULSDOpsDestRex());
RUN(testX86VMULSDAddr());
RUN(testX86VMULSDAddrOpRexAddr());
RUN(testX86VMULSDDestRexAddr());
RUN(testX86VMULSDRegOpDestRexAddr());
RUN(testX86VMULSDAddrOpDestRexAddr());
RUN(testX86VMULSDBaseNeedsRex());
RUN(testX86VMULSDIndexNeedsRex());
RUN(testX86VMULSDBaseIndexNeedRex());
#endif
#if CPU(ARM64)
RUN(testInvalidateCachedTempRegisters());
#endif
RUN(testArgumentRegPinned());
RUN(testArgumentRegPinned2());
RUN(testArgumentRegPinned3());
RUN(testLea32());
RUN(testLea64());
RUN(testElideSimpleMove());
RUN(testElideHandlesEarlyClobber());
RUN(testElideMoveThenRealloc());
RUN(testLinearScanSpillRangesLateUse());
RUN(testLinearScanSpillRangesEarlyDef());
if (tasks.isEmpty())
usage();
Lock lock;
Vector<Ref<Thread>> threads;
for (unsigned i = filter ? 1 : WTF::numberOfProcessorCores(); i--;) {
threads.append(
Thread::create(
"testair thread",
[&] () {
for (;;) {
RefPtr<SharedTask<void()>> task;
{
LockHolder locker(lock);
if (tasks.isEmpty())
return;
task = tasks.takeFirst();
}
task->run();
}
}));
}
for (auto& thread : threads)
thread->waitForCompletion();
crashLock.lock();
crashLock.unlock();
}
} // anonymous namespace
#else // ENABLE(B3_JIT)
static void run(const char*)
{
dataLog("B3 JIT is not enabled.\n");
}
#endif // ENABLE(B3_JIT)
int main(int argc, char** argv)
{
const char* filter = nullptr;
switch (argc) {
case 1:
break;
case 2:
filter = argv[1];
break;
default:
usage();
break;
}
JSC::initialize();
for (unsigned i = 0; i <= 2; ++i) {
JSC::Options::defaultB3OptLevel() = i;
run(filter);
}
return 0;
}
#if OS(WINDOWS)
extern "C" __declspec(dllexport) int WINAPI dllLauncherEntryPoint(int argc, const char* argv[])
{
return main(argc, const_cast<char**>(argv));
}
#endif