blob: 098fab8e571991aaf723dd078ef2d6d5a344b108 [file] [log] [blame]
# Copyright (C) 2019 Apple Inc. All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# 1. Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
# 2. Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
#
# THIS SOFTWARE IS PROVIDED BY APPLE INC. AND ITS CONTRIBUTORS ``AS IS''
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
# THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR ITS CONTRIBUTORS
# BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
# THE POSSIBILITY OF SUCH DAMAGE.
# Calling conventions
const CalleeSaveSpaceAsVirtualRegisters = constexpr Wasm::numberOfLLIntCalleeSaveRegisters
const CalleeSaveSpaceStackAligned = (CalleeSaveSpaceAsVirtualRegisters * SlotSize + StackAlignment - 1) & ~StackAlignmentMask
const WasmEntryPtrTag = constexpr WasmEntryPtrTag
if HAVE_FAST_TLS
const WTF_WASM_CONTEXT_KEY = constexpr WTF_WASM_CONTEXT_KEY
end
if X86_64
const NumberOfWasmArgumentGPRs = 6
elsif ARM64 or ARM64E
const NumberOfWasmArgumentGPRs = 8
else
error
end
const NumberOfWasmArgumentFPRs = 8
const NumberOfWasmArguments = NumberOfWasmArgumentGPRs + NumberOfWasmArgumentFPRs
# All callee saves must match the definition in WasmCallee.cpp
# These must match the definition in WasmMemoryInformation.cpp
const wasmInstance = csr0
const memoryBase = csr3
const memorySize = csr4
# This must match the definition in LowLevelInterpreter.asm
if X86_64
const PB = csr2
elsif ARM64 or ARM64E
const PB = csr7
else
error
end
macro forEachArgumentGPR(fn)
fn(0 * 8, wa0)
fn(1 * 8, wa1)
fn(2 * 8, wa2)
fn(3 * 8, wa3)
fn(4 * 8, wa4)
fn(5 * 8, wa5)
if ARM64 or ARM64E
fn(6 * 8, wa6)
fn(7 * 8, wa7)
end
end
macro forEachArgumentFPR(fn)
fn((NumberOfWasmArgumentGPRs + 0) * 8, wfa0)
fn((NumberOfWasmArgumentGPRs + 1) * 8, wfa1)
fn((NumberOfWasmArgumentGPRs + 2) * 8, wfa2)
fn((NumberOfWasmArgumentGPRs + 3) * 8, wfa3)
fn((NumberOfWasmArgumentGPRs + 4) * 8, wfa4)
fn((NumberOfWasmArgumentGPRs + 5) * 8, wfa5)
fn((NumberOfWasmArgumentGPRs + 6) * 8, wfa6)
fn((NumberOfWasmArgumentGPRs + 7) * 8, wfa7)
end
# Helper macros
# FIXME: Eventually this should be unified with the JS versions
# https://bugs.webkit.org/show_bug.cgi?id=203656
macro wasmDispatch(advanceReg)
addp advanceReg, PC
wasmNextInstruction()
end
macro wasmDispatchIndirect(offsetReg)
wasmDispatch(offsetReg)
end
macro wasmNextInstruction()
loadb [PB, PC, 1], t0
leap _g_opcodeMap, t1
jmp NumberOfJSOpcodeIDs * PtrSize[t1, t0, PtrSize], BytecodePtrTag
end
macro wasmNextInstructionWide16()
loadh 1[PB, PC, 1], t0
leap _g_opcodeMapWide16, t1
jmp NumberOfJSOpcodeIDs * PtrSize[t1, t0, PtrSize], BytecodePtrTag
end
macro wasmNextInstructionWide32()
loadi 1[PB, PC, 1], t0
leap _g_opcodeMapWide32, t1
jmp NumberOfJSOpcodeIDs * PtrSize[t1, t0, PtrSize], BytecodePtrTag
end
macro checkSwitchToJIT(increment, action)
loadp CodeBlock[cfr], ws0
baddis increment, Wasm::FunctionCodeBlock::m_tierUpCounter + Wasm::LLIntTierUpCounter::m_counter[ws0], .continue
action()
.continue:
end
macro checkSwitchToJITForPrologue(codeBlockRegister)
checkSwitchToJIT(
5,
macro()
move cfr, a0
move PC, a1
move wasmInstance, a2
cCall4(_slow_path_wasm_prologue_osr)
btpz r0, .recover
move r0, ws0
forEachArgumentGPR(macro (offset, gpr)
loadq -offset - 8 - CalleeSaveSpaceAsVirtualRegisters * 8[cfr], gpr
end)
forEachArgumentFPR(macro (offset, fpr)
loadd -offset - 8 - CalleeSaveSpaceAsVirtualRegisters * 8[cfr], fpr
end)
restoreCalleeSavesUsedByWasm()
restoreCallerPCAndCFR()
untagReturnAddress sp
jmp ws0, WasmEntryPtrTag
.recover:
notFunctionCodeBlockGetter(codeBlockRegister)
end)
end
macro checkSwitchToJITForLoop()
checkSwitchToJIT(
1,
macro()
storei PC, ArgumentCount + TagOffset[cfr]
prepareStateForCCall()
move cfr, a0
move PC, a1
move wasmInstance, a2
cCall4(_slow_path_wasm_loop_osr)
btpz r1, .recover
restoreCalleeSavesUsedByWasm()
restoreCallerPCAndCFR()
untagReturnAddress sp
move r0, a0
jmp r1, WasmEntryPtrTag
.recover:
loadi ArgumentCount + TagOffset[cfr], PC
end)
end
macro checkSwitchToJITForEpilogue()
checkSwitchToJIT(
10,
macro ()
callWasmSlowPath(_slow_path_wasm_epilogue_osr)
end)
end
# Wasm specific helpers
macro preserveCalleeSavesUsedByWasm()
subp CalleeSaveSpaceStackAligned, sp
if ARM64 or ARM64E
emit "stp x23, x26, [x29, #-16]"
emit "stp x19, x22, [x29, #-32]"
elsif X86_64
storep memorySize, -0x08[cfr]
storep memoryBase, -0x10[cfr]
storep PB, -0x18[cfr]
storep wasmInstance, -0x20[cfr]
else
error
end
end
macro restoreCalleeSavesUsedByWasm()
if ARM64 or ARM64E
emit "ldp x23, x26, [x29, #-16]"
emit "ldp x19, x22, [x29, #-32]"
elsif X86_64
loadp -0x08[cfr], memorySize
loadp -0x10[cfr], memoryBase
loadp -0x18[cfr], PB
loadp -0x20[cfr], wasmInstance
else
error
end
end
macro loadWasmInstanceFromTLS()
if HAVE_FAST_TLS
tls_loadp WTF_WASM_CONTEXT_KEY, wasmInstance
else
crash()
end
end
macro storeWasmInstanceToTLS(instance)
if HAVE_FAST_TLS
tls_storep instance, WTF_WASM_CONTEXT_KEY
else
crash()
end
end
macro reloadMemoryRegistersFromInstance(instance, scratch1, scratch2)
loadp Wasm::Instance::m_cachedMemory[instance], memoryBase
loadi Wasm::Instance::m_cachedMemorySize[instance], memorySize
cagedPrimitive(memoryBase, memorySize, scratch1, scratch2)
end
macro throwException(exception)
storei constexpr Wasm::ExceptionType::%exception%, ArgumentCount + PayloadOffset[cfr]
jmp _wasm_throw_from_slow_path_trampoline
end
macro callWasmSlowPath(slowPath)
prepareStateForCCall()
move cfr, a0
move PC, a1
move wasmInstance, a2
cCall4(slowPath)
restoreStateAfterCCall()
end
macro callWasmCallSlowPath(slowPath, action)
storei PC, ArgumentCount + TagOffset[cfr]
prepareStateForCCall()
move cfr, a0
move PC, a1
move wasmInstance, a2
cCall4(slowPath)
action(r0, r1)
end
macro wasmPrologue(codeBlockGetter, codeBlockSetter, loadWasmInstance)
# Set up the call frame and check if we should OSR.
tagReturnAddress sp
preserveCallerPCAndCFR()
preserveCalleeSavesUsedByWasm()
loadWasmInstance()
reloadMemoryRegistersFromInstance(wasmInstance, ws0, ws1)
codeBlockGetter(ws0)
codeBlockSetter(ws0)
# Get new sp in ws1 and check stack height.
loadi Wasm::FunctionCodeBlock::m_numCalleeLocals[ws0], ws1
lshiftp 3, ws1
addp maxFrameExtentForSlowPathCall, ws1
subp cfr, ws1, ws1
bpa ws1, cfr, .stackOverflow
bpbeq Wasm::Instance::m_cachedStackLimit[wasmInstance], ws1, .stackHeightOK
.stackOverflow:
throwException(StackOverflow)
.stackHeightOK:
move ws1, sp
forEachArgumentGPR(macro (offset, gpr)
storeq gpr, -offset - 8 - CalleeSaveSpaceAsVirtualRegisters * 8[cfr]
end)
forEachArgumentFPR(macro (offset, fpr)
stored fpr, -offset - 8 - CalleeSaveSpaceAsVirtualRegisters * 8[cfr]
end)
checkSwitchToJITForPrologue(ws0)
# Set up the PC.
loadp Wasm::FunctionCodeBlock::m_instructionsRawPointer[ws0], PB
move 0, PC
loadi Wasm::FunctionCodeBlock::m_numVars[ws0], ws1
subi NumberOfWasmArguments + CalleeSaveSpaceAsVirtualRegisters, ws1
btiz ws1, .zeroInitializeLocalsDone
negi ws1
sxi2q ws1, ws1
leap (NumberOfWasmArguments + CalleeSaveSpaceAsVirtualRegisters + 1) * -8[cfr], ws0
.zeroInitializeLocalsLoop:
addq 1, ws1
storeq 0, [ws0, ws1, 8]
btqz ws1, .zeroInitializeLocalsDone
jmp .zeroInitializeLocalsLoop
.zeroInitializeLocalsDone:
end
macro traceExecution()
if TRACING
callWasmSlowPath(_slow_path_wasm_trace)
end
end
# Less convenient, but required for opcodes that collide with reserved instructions (e.g. wasm_nop)
macro unprefixedWasmOp(opcodeName, opcodeStruct, fn)
commonOp(opcodeName, traceExecution, macro(size)
fn(macro(fn2)
fn2(opcodeName, opcodeStruct, size)
end)
end)
end
macro wasmOp(opcodeName, opcodeStruct, fn)
unprefixedWasmOp(wasm_%opcodeName%, opcodeStruct, fn)
end
# Same as unprefixedWasmOp, necessary for e.g. wasm_call
macro unprefixedSlowWasmOp(opcodeName)
unprefixedWasmOp(opcodeName, unusedOpcodeStruct, macro(ctx)
callWasmSlowPath(_slow_path_%opcodeName%)
dispatch(ctx)
end)
end
macro slowWasmOp(opcodeName)
unprefixedSlowWasmOp(wasm_%opcodeName%)
end
# Macro version of load operations: mload[suffix]
# loads field from the instruction stream and performs load[suffix] to dst
macro firstConstantRegisterIndex(ctx, fn)
ctx(macro(opcodeName, opcodeStruct, size)
size(FirstConstantRegisterIndexNarrow, FirstConstantRegisterIndexWide16, FirstConstantRegisterIndexWide32, fn)
end)
end
macro loadConstantOrVariable(ctx, index, loader)
firstConstantRegisterIndex(ctx, macro (firstConstantIndex)
bpgteq index, firstConstantIndex, .constant
loader([cfr, index, 8])
jmp .done
.constant:
loadp CodeBlock[cfr], t6
loadp Wasm::FunctionCodeBlock::m_constants + VectorBufferOffset[t6], t6
subp firstConstantIndex, index
loader([t6, index, 8])
.done:
end)
end
macro mloadq(ctx, field, dst)
wgets(ctx, field, dst)
loadConstantOrVariable(ctx, dst, macro (from)
loadq from, dst
end)
end
macro mloadi(ctx, field, dst)
wgets(ctx, field, dst)
loadConstantOrVariable(ctx, dst, macro (from)
loadi from, dst
end)
end
macro mloadp(ctx, field, dst)
wgets(ctx, field, dst)
loadConstantOrVariable(ctx, dst, macro (from)
loadp from, dst
end)
end
macro mloadf(ctx, field, dst)
wgets(ctx, field, t5)
loadConstantOrVariable(ctx, t5, macro (from)
loadf from, dst
end)
end
macro mloadd(ctx, field, dst)
wgets(ctx, field, t5)
loadConstantOrVariable(ctx, t5, macro (from)
loadd from, dst
end)
end
# Typed returns
macro returnq(ctx, value)
wgets(ctx, m_dst, t5)
storeq value, [cfr, t5, 8]
dispatch(ctx)
end
macro returni(ctx, value)
wgets(ctx, m_dst, t5)
storei value, [cfr, t5, 8]
dispatch(ctx)
end
macro returnf(ctx, value)
wgets(ctx, m_dst, t5)
storef value, [cfr, t5, 8]
dispatch(ctx)
end
macro returnd(ctx, value)
wgets(ctx, m_dst, t5)
stored value, [cfr, t5, 8]
dispatch(ctx)
end
# Wasm wrapper of get/getu that operate on ctx
macro wgets(ctx, field, dst)
ctx(macro(opcodeName, opcodeStruct, size)
size(getOperandNarrow, getOperandWide16, getOperandWide32, macro (get)
get(opcodeStruct, field, dst)
end)
end)
end
macro wgetu(ctx, field, dst)
ctx(macro(opcodeName, opcodeStruct, size)
size(getuOperandNarrow, getuOperandWide16, getuOperandWide32, macro (getu)
getu(opcodeStruct, field, dst)
end)
end)
end
# Control flow helpers
macro dispatch(ctx)
ctx(macro(opcodeName, opcodeStruct, size)
genericDispatchOp(wasmDispatch, size, opcodeName)
end)
end
macro jump(ctx, target)
wgets(ctx, target, t0)
btiz t0, .outOfLineJumpTarget
wasmDispatchIndirect(t0)
.outOfLineJumpTarget:
callWasmSlowPath(_slow_path_wasm_out_of_line_jump_target)
wasmNextInstruction()
end
macro doReturn()
restoreCalleeSavesUsedByWasm()
restoreCallerPCAndCFR()
ret
end
# Entry point
macro wasmCodeBlockGetter(targetRegister)
loadp Callee[cfr], targetRegister
andp ~3, targetRegister
loadp Wasm::LLIntCallee::m_codeBlock[targetRegister], targetRegister
end
op(wasm_function_prologue, macro ()
if not WEBASSEMBLY or not JSVALUE64 or C_LOOP or C_LOOP_WIN
error
end
wasmPrologue(wasmCodeBlockGetter, functionCodeBlockSetter, loadWasmInstanceFromTLS)
wasmNextInstruction()
end)
op(wasm_function_prologue_no_tls, macro ()
if not WEBASSEMBLY or not JSVALUE64 or C_LOOP or C_LOOP_WIN
error
end
wasmPrologue(wasmCodeBlockGetter, functionCodeBlockSetter, macro () end)
wasmNextInstruction()
end)
op(wasm_throw_from_slow_path_trampoline, macro ()
loadp Wasm::Instance::m_pointerToTopEntryFrame[wasmInstance], t5
loadp [t5], t5
copyCalleeSavesToEntryFrameCalleeSavesBuffer(t5)
move cfr, a0
addp PB, PC, a1
move wasmInstance, a2
# Slow paths and the throwException macro store the exception code in the ArgumentCount slot
loadi ArgumentCount + PayloadOffset[cfr], a3
cCall4(_slow_path_wasm_throw_exception)
jmp r0, ExceptionHandlerPtrTag
end)
# Disable wide version of narrow-only opcodes
noWide(wasm_enter)
noWide(wasm_wide16)
noWide(wasm_wide32)
# Opcodes that always invoke the slow path
slowWasmOp(ref_func)
slowWasmOp(table_get)
slowWasmOp(table_set)
slowWasmOp(table_size)
slowWasmOp(table_fill)
slowWasmOp(table_grow)
slowWasmOp(set_global_ref)
slowWasmOp(set_global_ref_portable_binding)
wasmOp(grow_memory, WasmGrowMemory, macro(ctx)
callWasmSlowPath(_slow_path_wasm_grow_memory)
reloadMemoryRegistersFromInstance(wasmInstance, ws0, ws1)
dispatch(ctx)
end)
# Opcodes that should eventually be shared with JS llint
_wasm_wide16:
wasmNextInstructionWide16()
_wasm_wide32:
wasmNextInstructionWide32()
_wasm_enter:
traceExecution()
checkStackPointerAlignment(t2, 0xdead00e1)
loadp CodeBlock[cfr], t2 // t2<CodeBlock> = cfr.CodeBlock
loadi Wasm::FunctionCodeBlock::m_numVars[t2], t2 // t2<size_t> = t2<CodeBlock>.m_numVars
subq CalleeSaveSpaceAsVirtualRegisters + NumberOfWasmArguments, t2
btiz t2, .opEnterDone
move cfr, t1
subq CalleeSaveSpaceAsVirtualRegisters * 8 + NumberOfWasmArguments * 8, t1
negi t2
sxi2q t2, t2
.opEnterLoop:
storeq 0, [t1, t2, 8]
addq 1, t2
btqnz t2, .opEnterLoop
.opEnterDone:
wasmDispatchIndirect(1)
unprefixedWasmOp(wasm_nop, WasmNop, macro(ctx)
dispatch(ctx)
end)
wasmOp(loop_hint, WasmLoopHint, macro(ctx)
checkSwitchToJITForLoop()
dispatch(ctx)
end)
wasmOp(mov, WasmMov, macro(ctx)
mloadq(ctx, m_src, t0)
returnq(ctx, t0)
end)
wasmOp(jtrue, WasmJtrue, macro(ctx)
mloadi(ctx, m_condition, t0)
btiz t0, .continue
jump(ctx, m_targetLabel)
.continue:
dispatch(ctx)
end)
wasmOp(jfalse, WasmJfalse, macro(ctx)
mloadi(ctx, m_condition, t0)
btinz t0, .continue
jump(ctx, m_targetLabel)
.continue:
dispatch(ctx)
end)
wasmOp(switch, WasmSwitch, macro(ctx)
mloadi(ctx, m_scrutinee, t0)
wgetu(ctx, m_tableIndex, t1)
loadp CodeBlock[cfr], t2
loadp Wasm::FunctionCodeBlock::m_jumpTables + VectorBufferOffset[t2], t2
muli sizeof Wasm::FunctionCodeBlock::JumpTable, t1
addp t1, t2
loadi VectorSizeOffset[t2], t3
bib t0, t3, .inBounds
.outOfBounds:
subi t3, 1, t0
.inBounds:
loadp VectorBufferOffset[t2], t2
muli sizeof Wasm::FunctionCodeBlock::JumpTableEntry, t0
loadi Wasm::FunctionCodeBlock::JumpTableEntry::startOffset[t2, t0], t1
loadi Wasm::FunctionCodeBlock::JumpTableEntry::dropCount[t2, t0], t3
loadi Wasm::FunctionCodeBlock::JumpTableEntry::keepCount[t2, t0], t5
dropKeep(t1, t3, t5)
loadis Wasm::FunctionCodeBlock::JumpTableEntry::target[t2, t0], t3
assert(macro(ok) btinz t3, .ok end)
wasmDispatchIndirect(t3)
end)
unprefixedWasmOp(wasm_jmp, WasmJmp, macro(ctx)
jump(ctx, m_targetLabel)
end)
unprefixedWasmOp(wasm_ret, WasmRet, macro(ctx)
checkSwitchToJITForEpilogue()
forEachArgumentGPR(macro (offset, gpr)
loadq -offset - 8 - CalleeSaveSpaceAsVirtualRegisters * 8[cfr], gpr
end)
forEachArgumentFPR(macro (offset, fpr)
loadd -offset - 8 - CalleeSaveSpaceAsVirtualRegisters * 8[cfr], fpr
end)
doReturn()
end)
# Wasm specific bytecodes
wasmOp(unreachable, WasmUnreachable, macro(ctx)
throwException(Unreachable)
end)
wasmOp(ret_void, WasmRetVoid, macro(ctx)
checkSwitchToJITForEpilogue()
doReturn()
end)
wasmOp(ref_is_null, WasmRefIsNull, macro(ctx)
mloadp(ctx, m_ref, t0)
cqeq t0, ValueNull, t0
returni(ctx, t0)
end)
wasmOp(get_global, WasmGetGlobal, macro(ctx)
loadp Wasm::Instance::m_globals[wasmInstance], t0
wgetu(ctx, m_globalIndex, t1)
loadq [t0, t1, 8], t0
returnq(ctx, t0)
end)
wasmOp(set_global, WasmSetGlobal, macro(ctx)
loadp Wasm::Instance::m_globals[wasmInstance], t0
wgetu(ctx, m_globalIndex, t1)
mloadq(ctx, m_value, t2)
storeq t2, [t0, t1, 8]
dispatch(ctx)
end)
wasmOp(get_global_portable_binding, WasmGetGlobalPortableBinding, macro(ctx)
loadp Wasm::Instance::m_globals[wasmInstance], t0
wgetu(ctx, m_globalIndex, t1)
loadq [t0, t1, 8], t0
loadq [t0], t0
returnq(ctx, t0)
end)
wasmOp(set_global_portable_binding, WasmSetGlobalPortableBinding, macro(ctx)
loadp Wasm::Instance::m_globals[wasmInstance], t0
wgetu(ctx, m_globalIndex, t1)
mloadq(ctx, m_value, t2)
loadq [t0, t1, 8], t0
storeq t2, [t0]
dispatch(ctx)
end)
macro slowPathForWasmCall(ctx, slowPath, storeWasmInstance)
callWasmCallSlowPath(
slowPath,
# callee is r0 and targetWasmInstance is r1
macro (callee, targetWasmInstance)
move callee, ws0
loadi ArgumentCount + TagOffset[cfr], PC
# the call might throw (e.g. indirect call with bad signature)
btpz targetWasmInstance, .throw
wgetu(ctx, m_stackOffset, ws1)
lshifti 3, ws1
subp cfr, ws1, sp
wgetu(ctx, m_numberOfStackArgs, ws1)
# Preserve the current instance
move wasmInstance, PB
storeWasmInstance(targetWasmInstance)
reloadMemoryRegistersFromInstance(targetWasmInstance, wa0, wa1)
# Load registers from stack
forEachArgumentGPR(macro (offset, gpr)
loadq CallFrameHeaderSize + offset[sp, ws1, 8], gpr
end)
forEachArgumentFPR(macro (offset, fpr)
loadd CallFrameHeaderSize + offset[sp, ws1, 8], fpr
end)
addp CallerFrameAndPCSize, sp
call ws0, SlowPathPtrTag
loadp CodeBlock[cfr], ws1
loadi Wasm::FunctionCodeBlock::m_numCalleeLocals[ws1], ws1
lshiftp 3, ws1
addp maxFrameExtentForSlowPathCall, ws1
subp cfr, ws1, sp
# We need to set PC to load information from the instruction stream, but we
# need to preserve its current value since it might contain a return value
move PC, memoryBase
move PB, wasmInstance
loadi ArgumentCount + TagOffset[cfr], PC
loadp CodeBlock[cfr], PB
loadp Wasm::FunctionCodeBlock::m_instructionsRawPointer[PB], PB
wgetu(ctx, m_stackOffset, ws1)
lshifti 3, ws1
negi ws1
sxi2q ws1, ws1
addp cfr, ws1
# Argument registers are also return registers, so they must be stored to the stack
# in case they contain return values.
wgetu(ctx, m_numberOfStackArgs, ws0)
move memoryBase, PC
forEachArgumentGPR(macro (offset, gpr)
storeq gpr, CallFrameHeaderSize + offset[ws1, ws0, 8]
end)
forEachArgumentFPR(macro (offset, fpr)
stored fpr, CallFrameHeaderSize + offset[ws1, ws0, 8]
end)
loadi ArgumentCount + TagOffset[cfr], PC
storeWasmInstance(wasmInstance)
reloadMemoryRegistersFromInstance(wasmInstance, ws0, ws1)
# Restore stack limit
loadp Wasm::Instance::m_pointerToActualStackLimit[wasmInstance], t5
loadp [t5], t5
storep t5, Wasm::Instance::m_cachedStackLimit[wasmInstance]
dispatch(ctx)
.throw:
restoreStateAfterCCall()
dispatch(ctx)
end)
end
unprefixedWasmOp(wasm_call, WasmCall, macro(ctx)
slowPathForWasmCall(ctx, _slow_path_wasm_call, storeWasmInstanceToTLS)
end)
unprefixedWasmOp(wasm_call_no_tls, WasmCallNoTls, macro(ctx)
slowPathForWasmCall(ctx, _slow_path_wasm_call_no_tls, macro(targetInstance) move targetInstance, wasmInstance end)
end)
wasmOp(call_indirect, WasmCallIndirect, macro(ctx)
slowPathForWasmCall(ctx, _slow_path_wasm_call_indirect, storeWasmInstanceToTLS)
end)
wasmOp(call_indirect_no_tls, WasmCallIndirectNoTls, macro(ctx)
slowPathForWasmCall(ctx, _slow_path_wasm_call_indirect_no_tls, macro(targetInstance) move targetInstance, wasmInstance end)
end)
wasmOp(current_memory, WasmCurrentMemory, macro(ctx)
loadp Wasm::Instance::m_cachedMemorySize[wasmInstance], t0
urshiftq 16, t0
returnq(ctx, t0)
end)
wasmOp(select, WasmSelect, macro(ctx)
mloadi(ctx, m_condition, t0)
btiz t0, .isZero
mloadq(ctx, m_nonZero, t0)
returnq(ctx, t0)
.isZero:
mloadq(ctx, m_zero, t0)
returnq(ctx, t0)
end)
# uses offset as scratch and returns result on pointer
macro emitCheckAndPreparePointer(ctx, pointer, offset, size)
leap size - 1[pointer, offset], t5
bpb t5, memorySize, .continuation
throwException(OutOfBoundsMemoryAccess)
.continuation:
addp memoryBase, pointer
end
macro wasmLoadOp(name, struct, size, fn)
wasmOp(name, struct, macro(ctx)
mloadi(ctx, m_pointer, t0)
wgetu(ctx, m_offset, t1)
emitCheckAndPreparePointer(ctx, t0, t1, size)
fn([t0, t1], t2)
returnq(ctx, t2)
end)
end
wasmLoadOp(load8_u, WasmLoad8U, 1, macro(mem, dst) loadb mem, dst end)
wasmLoadOp(load16_u, WasmLoad16U, 2, macro(mem, dst) loadh mem, dst end)
wasmLoadOp(load32_u, WasmLoad32U, 4, macro(mem, dst) loadi mem, dst end)
wasmLoadOp(load64_u, WasmLoad64U, 8, macro(mem, dst) loadq mem, dst end)
wasmLoadOp(i32_load8_s, WasmI32Load8S, 1, macro(mem, dst) loadbsi mem, dst end)
wasmLoadOp(i64_load8_s, WasmI64Load8S, 1, macro(mem, dst) loadbsq mem, dst end)
wasmLoadOp(i32_load16_s, WasmI32Load16S, 2, macro(mem, dst) loadhsi mem, dst end)
wasmLoadOp(i64_load16_s, WasmI64Load16S, 2, macro(mem, dst) loadhsq mem, dst end)
wasmLoadOp(i64_load32_s, WasmI64Load32S, 4, macro(mem, dst) loadis mem, dst end)
macro wasmStoreOp(name, struct, size, fn)
wasmOp(name, struct, macro(ctx)
mloadi(ctx, m_pointer, t0)
wgetu(ctx, m_offset, t1)
emitCheckAndPreparePointer(ctx, t0, t1, size)
mloadq(ctx, m_value, t2)
fn(t2, [t0, t1])
dispatch(ctx)
end)
end
wasmStoreOp(store8, WasmStore8, 1, macro(value, mem) storeb value, mem end)
wasmStoreOp(store16, WasmStore16, 2, macro(value, mem) storeh value, mem end)
wasmStoreOp(store32, WasmStore32, 4, macro(value, mem) storei value, mem end)
wasmStoreOp(store64, WasmStore64, 8, macro(value, mem) storeq value, mem end)
# Opcodes that don't have the `b3op` entry in wasm.json. This should be kept in sync
wasmOp(i32_div_s, WasmI32DivS, macro (ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
btiz t1, .throwDivisionByZero
bineq t1, -1, .safe
bieq t0, constexpr INT32_MIN, .throwIntegerOverflow
.safe:
if X86_64
# FIXME: Add a way to static_asset that t0 is rax and t2 is rdx
# https://bugs.webkit.org/show_bug.cgi?id=203692
cdqi
idivi t1
elsif ARM64 or ARM64E
divis t1, t0
else
error
end
returni(ctx, t0)
.throwDivisionByZero:
throwException(DivisionByZero)
.throwIntegerOverflow:
throwException(IntegerOverflow)
end)
wasmOp(i32_div_u, WasmI32DivU, macro (ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
btiz t1, .throwDivisionByZero
if X86_64
xori t2, t2
udivi t1
elsif ARM64 or ARM64E
divi t1, t0
else
error
end
returni(ctx, t0)
.throwDivisionByZero:
throwException(DivisionByZero)
end)
wasmOp(i32_rem_s, WasmI32RemS, macro (ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
btiz t1, .throwDivisionByZero
bineq t1, -1, .safe
bineq t0, constexpr INT32_MIN, .safe
move 0, t2
jmp .return
.safe:
if X86_64
# FIXME: Add a way to static_asset that t0 is rax and t2 is rdx
# https://bugs.webkit.org/show_bug.cgi?id=203692
cdqi
idivi t1
elsif ARM64 or ARM64E
divis t1, t0, t2
muli t1, t2
subi t0, t2, t2
else
error
end
.return:
returni(ctx, t2)
.throwDivisionByZero:
throwException(DivisionByZero)
end)
wasmOp(i32_rem_u, WasmI32RemU, macro (ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
btiz t1, .throwDivisionByZero
if X86_64
xori t2, t2
udivi t1
elsif ARM64 or ARM64E
divi t1, t0, t2
muli t1, t2
subi t0, t2, t2
else
error
end
returni(ctx, t2)
.throwDivisionByZero:
throwException(DivisionByZero)
end)
wasmOp(i32_ctz, WasmI32Ctz, macro (ctx)
mloadq(ctx, m_operand, t0)
tzcnti t0, t0
returni(ctx, t0)
end)
wasmOp(i32_popcnt, WasmI32Popcnt, macro (ctx)
mloadi(ctx, m_operand, a1)
prepareStateForCCall()
move PC, a0
cCall2(_slow_path_wasm_popcount)
restoreStateAfterCCall()
returni(ctx, r1)
end)
wasmOp(i64_div_s, WasmI64DivS, macro (ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
btqz t1, .throwDivisionByZero
bqneq t1, -1, .safe
bqeq t0, constexpr INT64_MIN, .throwIntegerOverflow
.safe:
if X86_64
# FIXME: Add a way to static_asset that t0 is rax and t2 is rdx
# https://bugs.webkit.org/show_bug.cgi?id=203692
cqoq
idivq t1
elsif ARM64 or ARM64E
divqs t1, t0
else
error
end
returnq(ctx, t0)
.throwDivisionByZero:
throwException(DivisionByZero)
.throwIntegerOverflow:
throwException(IntegerOverflow)
end)
wasmOp(i64_div_u, WasmI64DivU, macro (ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
btqz t1, .throwDivisionByZero
if X86_64
xorq t2, t2
udivq t1
elsif ARM64 or ARM64E
divq t1, t0
else
error
end
returnq(ctx, t0)
.throwDivisionByZero:
throwException(DivisionByZero)
end)
wasmOp(i64_rem_s, WasmI64RemS, macro (ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
btqz t1, .throwDivisionByZero
bqneq t1, -1, .safe
bqneq t0, constexpr INT64_MIN, .safe
move 0, t2
jmp .return
.safe:
if X86_64
# FIXME: Add a way to static_asset that t0 is rax and t2 is rdx
# https://bugs.webkit.org/show_bug.cgi?id=203692
cqoq
idivq t1
elsif ARM64 or ARM64E
divqs t1, t0, t2
mulq t1, t2
subq t0, t2, t2
else
error
end
.return:
returnq(ctx, t2) # rdx has the remainder
.throwDivisionByZero:
throwException(DivisionByZero)
end)
wasmOp(i64_rem_u, WasmI64RemU, macro (ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
btqz t1, .throwDivisionByZero
if X86_64
xorq t2, t2
udivq t1
elsif ARM64 or ARM64E
divq t1, t0, t2
mulq t1, t2
subq t0, t2, t2
else
error
end
returnq(ctx, t2)
.throwDivisionByZero:
throwException(DivisionByZero)
end)
wasmOp(i64_ctz, WasmI64Ctz, macro (ctx)
mloadq(ctx, m_operand, t0)
tzcntq t0, t0
returnq(ctx, t0)
end)
wasmOp(i64_popcnt, WasmI64Popcnt, macro (ctx)
mloadq(ctx, m_operand, a1)
prepareStateForCCall()
move PC, a0
cCall2(_slow_path_wasm_popcountll)
restoreStateAfterCCall()
returnq(ctx, r1)
end)
wasmOp(f32_trunc, WasmF32Trunc, macro (ctx)
mloadf(ctx, m_operand, ft0)
truncatef ft0, ft0
returnf(ctx, ft0)
end)
wasmOp(f32_nearest, WasmF32Nearest, macro (ctx)
mloadf(ctx, m_operand, ft0)
roundf ft0, ft0
returnf(ctx, ft0)
end)
wasmOp(f64_trunc, WasmF64Trunc, macro (ctx)
mloadd(ctx, m_operand, ft0)
truncated ft0, ft0
returnd(ctx, ft0)
end)
wasmOp(f64_nearest, WasmF64Nearest, macro (ctx)
mloadd(ctx, m_operand, ft0)
roundd ft0, ft0
returnd(ctx, ft0)
end)
wasmOp(i32_trunc_s_f32, WasmI32TruncSF32, macro (ctx)
mloadf(ctx, m_operand, ft0)
move 0xcf000000, t0 # INT32_MIN
fi2f t0, ft1
bfltun ft0, ft1, .outOfBoundsTrunc
move 0x4f000000, t0 # -INT32_MIN
fi2f t0, ft1
bfgtequn ft0, ft1, .outOfBoundsTrunc
truncatef2is ft0, t0
returni(ctx, t0)
.outOfBoundsTrunc:
throwException(OutOfBoundsTrunc)
end)
wasmOp(i32_trunc_s_f64, WasmI32TruncSF64, macro (ctx)
mloadd(ctx, m_operand, ft0)
move 0xc1e0000000000000, t0 # INT32_MIN
fq2d t0, ft1
bdltun ft0, ft1, .outOfBoundsTrunc
move 0x41e0000000000000, t0 # -INT32_MIN
fq2d t0, ft1
bdgtequn ft0, ft1, .outOfBoundsTrunc
truncated2is ft0, t0
returni(ctx, t0)
.outOfBoundsTrunc:
throwException(OutOfBoundsTrunc)
end)
wasmOp(i32_trunc_u_f32, WasmI32TruncUF32, macro (ctx)
mloadf(ctx, m_operand, ft0)
move 0xbf800000, t0 # -1.0
fi2f t0, ft1
bfltequn ft0, ft1, .outOfBoundsTrunc
move 0x4f800000, t0 # INT32_MIN * -2.0
fi2f t0, ft1
bfgtequn ft0, ft1, .outOfBoundsTrunc
truncatef2i ft0, t0
returni(ctx, t0)
.outOfBoundsTrunc:
throwException(OutOfBoundsTrunc)
end)
wasmOp(i32_trunc_u_f64, WasmI32TruncUF64, macro (ctx)
mloadd(ctx, m_operand, ft0)
move 0xbff0000000000000, t0 # -1.0
fq2d t0, ft1
bdltequn ft0, ft1, .outOfBoundsTrunc
move 0x41f0000000000000, t0 # INT32_MIN * -2.0
fq2d t0, ft1
bdgtequn ft0, ft1, .outOfBoundsTrunc
truncated2i ft0, t0
returni(ctx, t0)
.outOfBoundsTrunc:
throwException(OutOfBoundsTrunc)
end)
wasmOp(i64_trunc_s_f32, WasmI64TruncSF32, macro (ctx)
mloadd(ctx, m_operand, ft0)
move 0xdf000000, t0 # INT64_MIN
fi2f t0, ft1
bfltun ft0, ft1, .outOfBoundsTrunc
move 0x5f000000, t0 # -INT64_MIN
fi2f t0, ft1
bfgtequn ft0, ft1, .outOfBoundsTrunc
truncatef2qs ft0, t0
returnq(ctx, t0)
.outOfBoundsTrunc:
throwException(OutOfBoundsTrunc)
end)
wasmOp(i64_trunc_s_f64, WasmI64TruncSF64, macro (ctx)
mloadd(ctx, m_operand, ft0)
move 0xc3e0000000000000, t0 # INT64_MIN
fq2d t0, ft1
bdltun ft0, ft1, .outOfBoundsTrunc
move 0x43e0000000000000, t0 # -INT64_MIN
fq2d t0, ft1
bdgtequn ft0, ft1, .outOfBoundsTrunc
truncated2qs ft0, t0
returnq(ctx, t0)
.outOfBoundsTrunc:
throwException(OutOfBoundsTrunc)
end)
wasmOp(i64_trunc_u_f32, WasmI64TruncUF32, macro (ctx)
mloadf(ctx, m_operand, ft0)
move 0xbf800000, t0 # -1.0
fi2f t0, ft1
bfltequn ft0, ft1, .outOfBoundsTrunc
move 0x5f800000, t0 # INT64_MIN * -2.0
fi2f t0, ft1
bfgtequn ft0, ft1, .outOfBoundsTrunc
truncatef2q ft0, t0
returnq(ctx, t0)
.outOfBoundsTrunc:
throwException(OutOfBoundsTrunc)
end)
wasmOp(i64_trunc_u_f64, WasmI64TruncUF64, macro (ctx)
mloadd(ctx, m_operand, ft0)
move 0xbff0000000000000, t0 # -1.0
fq2d t0, ft1
bdltequn ft0, ft1, .outOfBoundsTrunc
move 0x43f0000000000000, t0 # INT64_MIN * -2.0
fq2d t0, ft1
bdgtequn ft0, ft1, .outOfBoundsTrunc
truncated2q ft0, t0
returnq(ctx, t0)
.outOfBoundsTrunc:
throwException(OutOfBoundsTrunc)
end)
wasmOp(f32_convert_u_i64, WasmF32ConvertUI64, macro (ctx)
mloadq(ctx, m_operand, t0)
if X86_64
cq2f t0, t1, ft0
elsif ARM64 or ARM64E
cq2f t0, ft0
else
error
end
returnf(ctx, ft0)
end)
wasmOp(f64_convert_u_i64, WasmF64ConvertUI64, macro (ctx)
mloadq(ctx, m_operand, t0)
if X86_64
cq2d t0, t1, ft0
elsif ARM64 or ARM64E
cq2d t0, ft0
else
error
end
returnd(ctx, ft0)
end)
wasmOp(i32_eqz, WasmI32Eqz, macro(ctx)
mloadi(ctx, m_operand, t0)
cieq t0, 0, t0
returni(ctx, t0)
end)
wasmOp(i64_shl, WasmI64Shl, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
lshiftq t1, t0
returnq(ctx, t0)
end)
wasmOp(i64_shr_u, WasmI64ShrU, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
urshiftq t1, t0
returnq(ctx, t0)
end)
wasmOp(i64_shr_s, WasmI64ShrS, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
rshiftq t1, t0
returnq(ctx, t0)
end)
wasmOp(i64_rotr, WasmI64Rotr, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
rrotateq t1, t0
returnq(ctx, t0)
end)
wasmOp(i64_rotl, WasmI64Rotl, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
lrotateq t1, t0
returnq(ctx, t0)
end)
wasmOp(i64_eqz, WasmI64Eqz, macro(ctx)
mloadq(ctx, m_operand, t0)
cqeq t0, 0, t0
returni(ctx, t0)
end)
wasmOp(f32_min, WasmF32Min, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
bfeq ft0, ft1, .equal
bflt ft0, ft1, .lt
bfgt ft0, ft1, .return
.NaN:
addf ft0, ft1
jmp .return
.equal:
orf ft0, ft1
jmp .return
.lt:
moved ft0, ft1
.return:
returnf(ctx, ft1)
end)
wasmOp(f32_max, WasmF32Max, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
bfeq ft1, ft0, .equal
bflt ft1, ft0, .lt
bfgt ft1, ft0, .return
.NaN:
addf ft0, ft1
jmp .return
.equal:
andf ft0, ft1
jmp .return
.lt:
moved ft0, ft1
.return:
returnf(ctx, ft1)
end)
wasmOp(f32_copysign, WasmF32Copysign, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
ff2i ft1, t1
move 0x80000000, t2
andi t2, t1
ff2i ft0, t0
move 0x7fffffff, t2
andi t2, t0
ori t1, t0
fi2f t0, ft0
returnf(ctx, ft0)
end)
wasmOp(f64_min, WasmF64Min, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
bdeq ft0, ft1, .equal
bdlt ft0, ft1, .lt
bdgt ft0, ft1, .return
.NaN:
addd ft0, ft1
jmp .return
.equal:
ord ft0, ft1
jmp .return
.lt:
moved ft0, ft1
.return:
returnd(ctx, ft1)
end)
wasmOp(f64_max, WasmF64Max, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
bdeq ft1, ft0, .equal
bdlt ft1, ft0, .lt
bdgt ft1, ft0, .return
.NaN:
addd ft0, ft1
jmp .return
.equal:
andd ft0, ft1
jmp .return
.lt:
moved ft0, ft1
.return:
returnd(ctx, ft1)
end)
wasmOp(f64_copysign, WasmF64Copysign, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
fd2q ft1, t1
move 0x8000000000000000, t2
andq t2, t1
fd2q ft0, t0
move 0x7fffffffffffffff, t2
andq t2, t0
orq t1, t0
fq2d t0, ft0
returnd(ctx, ft0)
end)
wasmOp(f32_convert_u_i32, WasmF32ConvertUI32, macro(ctx)
mloadi(ctx, m_operand, t0)
ci2f t0, ft0
returnf(ctx, ft0)
end)
wasmOp(f64_convert_u_i32, WasmF64ConvertUI32, macro(ctx)
mloadi(ctx, m_operand, t0)
ci2d t0, ft0
returnd(ctx, ft0)
end)
wasmOp(i32_add, WasmI32Add, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
addi t0, t1, t2
returni(ctx, t2)
end)
wasmOp(i32_sub, WasmI32Sub, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
subi t1, t0
returni(ctx, t0)
end)
wasmOp(i32_mul, WasmI32Mul, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
muli t0, t1
returni(ctx, t1)
end)
wasmOp(i32_and, WasmI32And, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
andi t0, t1
returni(ctx, t1)
end)
wasmOp(i32_or, WasmI32Or, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
ori t0, t1
returni(ctx, t1)
end)
wasmOp(i32_xor, WasmI32Xor, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
xori t0, t1
returni(ctx, t1)
end)
wasmOp(i32_shl, WasmI32Shl, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
lshifti t1, t0
returni(ctx, t0)
end)
wasmOp(i32_shr_u, WasmI32ShrU, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
urshifti t1, t0
returni(ctx, t0)
end)
wasmOp(i32_shr_s, WasmI32ShrS, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
rshifti t1, t0
returni(ctx, t0)
end)
wasmOp(i32_rotr, WasmI32Rotr, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
rrotatei t1, t0
returni(ctx, t0)
end)
wasmOp(i32_rotl, WasmI32Rotl, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
lrotatei t1, t0
returni(ctx, t0)
end)
wasmOp(i32_eq, WasmI32Eq, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
cieq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_ne, WasmI32Ne, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
cineq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_lt_s, WasmI32LtS, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
cilt t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_le_s, WasmI32LeS, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
cilteq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_lt_u, WasmI32LtU, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
cib t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_le_u, WasmI32LeU, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
cibeq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_gt_s, WasmI32GtS, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
cigt t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_ge_s, WasmI32GeS, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
cigteq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_gt_u, WasmI32GtU, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
cia t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_ge_u, WasmI32GeU, macro(ctx)
mloadi(ctx, m_lhs, t0)
mloadi(ctx, m_rhs, t1)
ciaeq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i32_clz, WasmI32Clz, macro(ctx)
mloadi(ctx, m_operand, t0)
lzcnti t0, t1
returni(ctx, t1)
end)
wasmOp(i64_add, WasmI64Add, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
addq t0, t1
returnq(ctx, t1)
end)
wasmOp(i64_sub, WasmI64Sub, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
subq t1, t0
returnq(ctx, t0)
end)
wasmOp(i64_mul, WasmI64Mul, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
mulq t0, t1
returnq(ctx, t1)
end)
wasmOp(i64_and, WasmI64And, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
andq t0, t1
returnq(ctx, t1)
end)
wasmOp(i64_or, WasmI64Or, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
orq t0, t1
returnq(ctx, t1)
end)
wasmOp(i64_xor, WasmI64Xor, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
xorq t0, t1
returnq(ctx, t1)
end)
wasmOp(i64_eq, WasmI64Eq, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqeq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_ne, WasmI64Ne, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqneq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_lt_s, WasmI64LtS, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqlt t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_le_s, WasmI64LeS, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqlteq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_lt_u, WasmI64LtU, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqb t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_le_u, WasmI64LeU, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqbeq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_gt_s, WasmI64GtS, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqgt t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_ge_s, WasmI64GeS, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqgteq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_gt_u, WasmI64GtU, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqa t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_ge_u, WasmI64GeU, macro(ctx)
mloadq(ctx, m_lhs, t0)
mloadq(ctx, m_rhs, t1)
cqaeq t0, t1, t2
andi 1, t2
returni(ctx, t2)
end)
wasmOp(i64_clz, WasmI64Clz, macro(ctx)
mloadq(ctx, m_operand, t0)
lzcntq t0, t1
returnq(ctx, t1)
end)
wasmOp(f32_add, WasmF32Add, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
addf ft0, ft1
returnf(ctx, ft1)
end)
wasmOp(f32_sub, WasmF32Sub, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
subf ft1, ft0
returnf(ctx, ft0)
end)
wasmOp(f32_mul, WasmF32Mul, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
mulf ft0, ft1
returnf(ctx, ft1)
end)
wasmOp(f32_div, WasmF32Div, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
divf ft1, ft0
returnf(ctx, ft0)
end)
wasmOp(f32_abs, WasmF32Abs, macro(ctx)
mloadf(ctx, m_operand, ft0)
absf ft0, ft1
returnf(ctx, ft1)
end)
wasmOp(f32_neg, WasmF32Neg, macro(ctx)
mloadf(ctx, m_operand, ft0)
negf ft0, ft1
returnf(ctx, ft1)
end)
wasmOp(f32_ceil, WasmF32Ceil, macro(ctx)
mloadf(ctx, m_operand, ft0)
ceilf ft0, ft1
returnf(ctx, ft1)
end)
wasmOp(f32_floor, WasmF32Floor, macro(ctx)
mloadf(ctx, m_operand, ft0)
floorf ft0, ft1
returnf(ctx, ft1)
end)
wasmOp(f32_sqrt, WasmF32Sqrt, macro(ctx)
mloadf(ctx, m_operand, ft0)
sqrtf ft0, ft1
returnf(ctx, ft1)
end)
wasmOp(f32_eq, WasmF32Eq, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
cfeq ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f32_ne, WasmF32Ne, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
cfnequn ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f32_lt, WasmF32Lt, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
cflt ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f32_le, WasmF32Le, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
cflteq ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f32_gt, WasmF32Gt, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
cfgt ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f32_ge, WasmF32Ge, macro(ctx)
mloadf(ctx, m_lhs, ft0)
mloadf(ctx, m_rhs, ft1)
cfgteq ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f64_add, WasmF64Add, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
addd ft0, ft1
returnd(ctx, ft1)
end)
wasmOp(f64_sub, WasmF64Sub, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
subd ft1, ft0
returnd(ctx, ft0)
end)
wasmOp(f64_mul, WasmF64Mul, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
muld ft0, ft1
returnd(ctx, ft1)
end)
wasmOp(f64_div, WasmF64Div, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
divd ft1, ft0
returnd(ctx, ft0)
end)
wasmOp(f64_abs, WasmF64Abs, macro(ctx)
mloadd(ctx, m_operand, ft0)
absd ft0, ft1
returnd(ctx, ft1)
end)
wasmOp(f64_neg, WasmF64Neg, macro(ctx)
mloadd(ctx, m_operand, ft0)
negd ft0, ft1
returnd(ctx, ft1)
end)
wasmOp(f64_ceil, WasmF64Ceil, macro(ctx)
mloadd(ctx, m_operand, ft0)
ceild ft0, ft1
returnd(ctx, ft1)
end)
wasmOp(f64_floor, WasmF64Floor, macro(ctx)
mloadd(ctx, m_operand, ft0)
floord ft0, ft1
returnd(ctx, ft1)
end)
wasmOp(f64_sqrt, WasmF64Sqrt, macro(ctx)
mloadd(ctx, m_operand, ft0)
sqrtd ft0, ft1
returnd(ctx, ft1)
end)
wasmOp(f64_eq, WasmF64Eq, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
cdeq ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f64_ne, WasmF64Ne, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
cdnequn ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f64_lt, WasmF64Lt, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
cdlt ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f64_le, WasmF64Le, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
cdlteq ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f64_gt, WasmF64Gt, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
cdgt ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(f64_ge, WasmF64Ge, macro(ctx)
mloadd(ctx, m_lhs, ft0)
mloadd(ctx, m_rhs, ft1)
cdgteq ft0, ft1, t0
returni(ctx, t0)
end)
wasmOp(i32_wrap_i64, WasmI32WrapI64, macro(ctx)
mloadq(ctx, m_operand, t0)
returni(ctx, t0)
end)
wasmOp(i64_extend_s_i32, WasmI64ExtendSI32, macro(ctx)
mloadi(ctx, m_operand, t0)
sxi2q t0, t1
returnq(ctx, t1)
end)
wasmOp(i64_extend_u_i32, WasmI64ExtendUI32, macro(ctx)
mloadi(ctx, m_operand, t0)
zxi2q t0, t1
returnq(ctx, t1)
end)
wasmOp(f32_convert_s_i32, WasmF32ConvertSI32, macro(ctx)
mloadi(ctx, m_operand, t0)
ci2fs t0, ft0
returnf(ctx, ft0)
end)
wasmOp(f32_convert_s_i64, WasmF32ConvertSI64, macro(ctx)
mloadq(ctx, m_operand, t0)
cq2fs t0, ft0
returnf(ctx, ft0)
end)
wasmOp(f32_demote_f64, WasmF32DemoteF64, macro(ctx)
mloadd(ctx, m_operand, ft0)
cd2f ft0, ft1
returnf(ctx, ft1)
end)
wasmOp(f32_reinterpret_i32, WasmF32ReinterpretI32, macro(ctx)
mloadi(ctx, m_operand, t0)
fi2f t0, ft0
returnf(ctx, ft0)
end)
wasmOp(f64_convert_s_i32, WasmF64ConvertSI32, macro(ctx)
mloadi(ctx, m_operand, t0)
ci2ds t0, ft0
returnd(ctx, ft0)
end)
wasmOp(f64_convert_s_i64, WasmF64ConvertSI64, macro(ctx)
mloadq(ctx, m_operand, t0)
cq2ds t0, ft0
returnd(ctx, ft0)
end)
wasmOp(f64_promote_f32, WasmF64PromoteF32, macro(ctx)
mloadf(ctx, m_operand, ft0)
cf2d ft0, ft1
returnd(ctx, ft1)
end)
wasmOp(f64_reinterpret_i64, WasmF64ReinterpretI64, macro(ctx)
mloadq(ctx, m_operand, t0)
fq2d t0, ft0
returnd(ctx, ft0)
end)
wasmOp(i32_reinterpret_f32, WasmI32ReinterpretF32, macro(ctx)
mloadf(ctx, m_operand, ft0)
ff2i ft0, t0
returni(ctx, t0)
end)
wasmOp(i64_reinterpret_f64, WasmI64ReinterpretF64, macro(ctx)
mloadd(ctx, m_operand, ft0)
fd2q ft0, t0
returnq(ctx, t0)
end)
macro dropKeep(startOffset, drop, keep)
lshifti 3, startOffset
subp cfr, startOffset, startOffset
negi drop
sxi2q drop, drop
.copyLoop:
btiz keep, .done
loadq [startOffset, drop, 8], t6
storeq t6, [startOffset]
subi 1, keep
subp 8, startOffset
jmp .copyLoop
.done:
end
wasmOp(drop_keep, WasmDropKeep, macro(ctx)
wgetu(ctx, m_startOffset, t0)
wgetu(ctx, m_dropCount, t1)
wgetu(ctx, m_keepCount, t2)
dropKeep(t0, t1, t2)
dispatch(ctx)
end)