| # Copyright (C) 2011-2015 Apple Inc. All rights reserved. |
| # |
| # Redistribution and use in source and binary forms, with or without |
| # modification, are permitted provided that the following conditions |
| # are met: |
| # 1. Redistributions of source code must retain the above copyright |
| # notice, this list of conditions and the following disclaimer. |
| # 2. Redistributions in binary form must reproduce the above copyright |
| # notice, this list of conditions and the following disclaimer in the |
| # documentation and/or other materials provided with the distribution. |
| # |
| # THIS SOFTWARE IS PROVIDED BY APPLE INC. AND ITS CONTRIBUTORS ``AS IS'' |
| # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, |
| # THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
| # PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR ITS CONTRIBUTORS |
| # BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR |
| # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF |
| # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS |
| # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN |
| # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
| # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF |
| # THE POSSIBILITY OF SUCH DAMAGE. |
| |
| # First come the common protocols that both interpreters use. Note that each |
| # of these must have an ASSERT() in LLIntData.cpp |
| |
| # Work-around for the fact that the toolchain's awareness of armv7s results in |
| # a separate slab in the fat binary, yet the offlineasm doesn't know to expect |
| # it. |
| if ARMv7s |
| end |
| |
| # These declarations must match interpreter/JSStack.h. |
| |
| if JSVALUE64 |
| const PtrSize = 8 |
| const CallFrameHeaderSlots = 5 |
| else |
| const PtrSize = 4 |
| const CallFrameHeaderSlots = 4 |
| const CallFrameAlignSlots = 1 |
| end |
| const SlotSize = 8 |
| |
| const StackAlignment = 16 |
| const StackAlignmentMask = StackAlignment - 1 |
| |
| const CallerFrameAndPCSize = 2 * PtrSize |
| |
| const CallerFrame = 0 |
| const ReturnPC = CallerFrame + PtrSize |
| const CodeBlock = ReturnPC + PtrSize |
| const Callee = CodeBlock + SlotSize |
| const ArgumentCount = Callee + SlotSize |
| const ThisArgumentOffset = ArgumentCount + SlotSize |
| const FirstArgumentOffset = ThisArgumentOffset + SlotSize |
| const CallFrameHeaderSize = ThisArgumentOffset |
| |
| # Some value representation constants. |
| if JSVALUE64 |
| const TagBitTypeOther = 0x2 |
| const TagBitBool = 0x4 |
| const TagBitUndefined = 0x8 |
| const ValueEmpty = 0x0 |
| const ValueFalse = TagBitTypeOther | TagBitBool |
| const ValueTrue = TagBitTypeOther | TagBitBool | 1 |
| const ValueUndefined = TagBitTypeOther | TagBitUndefined |
| const ValueNull = TagBitTypeOther |
| const TagTypeNumber = 0xffff000000000000 |
| const TagMask = TagTypeNumber | TagBitTypeOther |
| else |
| const Int32Tag = -1 |
| const BooleanTag = -2 |
| const NullTag = -3 |
| const UndefinedTag = -4 |
| const CellTag = -5 |
| const EmptyValueTag = -6 |
| const DeletedValueTag = -7 |
| const LowestTag = DeletedValueTag |
| end |
| |
| const CallOpCodeSize = 9 |
| |
| if X86_64 or ARM64 or C_LOOP |
| const maxFrameExtentForSlowPathCall = 0 |
| elsif ARM or ARMv7_TRADITIONAL or ARMv7 or SH4 |
| const maxFrameExtentForSlowPathCall = 24 |
| elsif X86 or X86_WIN |
| const maxFrameExtentForSlowPathCall = 40 |
| elsif MIPS |
| const maxFrameExtentForSlowPathCall = 40 |
| elsif X86_64_WIN |
| const maxFrameExtentForSlowPathCall = 64 |
| end |
| |
| # Watchpoint states |
| const ClearWatchpoint = 0 |
| const IsWatched = 1 |
| const IsInvalidated = 2 |
| |
| # Some register conventions. |
| if JSVALUE64 |
| # - Use a pair of registers to represent the PC: one register for the |
| # base of the bytecodes, and one register for the index. |
| # - The PC base (or PB for short) should be stored in the csr. It will |
| # get clobbered on calls to other JS code, but will get saved on calls |
| # to C functions. |
| # - C calls are still given the Instruction* rather than the PC index. |
| # This requires an add before the call, and a sub after. |
| const PC = t5 |
| const PB = t6 |
| const tagTypeNumber = csr1 |
| const tagMask = csr2 |
| |
| macro loadisFromInstruction(offset, dest) |
| loadis offset * 8[PB, PC, 8], dest |
| end |
| |
| macro loadpFromInstruction(offset, dest) |
| loadp offset * 8[PB, PC, 8], dest |
| end |
| |
| macro storepToInstruction(value, offset) |
| storep value, offset * 8[PB, PC, 8] |
| end |
| |
| else |
| const PC = t5 |
| macro loadisFromInstruction(offset, dest) |
| loadis offset * 4[PC], dest |
| end |
| |
| macro loadpFromInstruction(offset, dest) |
| loadp offset * 4[PC], dest |
| end |
| end |
| |
| # Constants for reasoning about value representation. |
| if BIG_ENDIAN |
| const TagOffset = 0 |
| const PayloadOffset = 4 |
| else |
| const TagOffset = 4 |
| const PayloadOffset = 0 |
| end |
| |
| # Constant for reasoning about butterflies. |
| const IsArray = 1 |
| const IndexingShapeMask = 30 |
| const NoIndexingShape = 0 |
| const Int32Shape = 20 |
| const DoubleShape = 22 |
| const ContiguousShape = 26 |
| const ArrayStorageShape = 28 |
| const SlowPutArrayStorageShape = 30 |
| |
| # Type constants. |
| const StringType = 6 |
| const ObjectType = 18 |
| const FinalObjectType = 19 |
| |
| # Type flags constants. |
| const MasqueradesAsUndefined = 1 |
| const ImplementsHasInstance = 2 |
| const ImplementsDefaultHasInstance = 8 |
| |
| # Bytecode operand constants. |
| const FirstConstantRegisterIndex = 0x40000000 |
| |
| # Code type constants. |
| const GlobalCode = 0 |
| const EvalCode = 1 |
| const FunctionCode = 2 |
| |
| # The interpreter steals the tag word of the argument count. |
| const LLIntReturnPC = ArgumentCount + TagOffset |
| |
| # String flags. |
| const HashFlags8BitBuffer = 32 |
| |
| # Copied from PropertyOffset.h |
| const firstOutOfLineOffset = 100 |
| |
| # ResolveType |
| const GlobalProperty = 0 |
| const GlobalVar = 1 |
| const ClosureVar = 2 |
| const LocalClosureVar = 3 |
| const GlobalPropertyWithVarInjectionChecks = 4 |
| const GlobalVarWithVarInjectionChecks = 5 |
| const ClosureVarWithVarInjectionChecks = 6 |
| const Dynamic = 7 |
| |
| const ResolveModeMask = 0xffff |
| |
| const MarkedBlockSize = 64 * 1024 |
| const MarkedBlockMask = ~(MarkedBlockSize - 1) |
| # Constants for checking mark bits. |
| const AtomNumberShift = 3 |
| const BitMapWordShift = 4 |
| |
| # Allocation constants |
| if JSVALUE64 |
| const JSFinalObjectSizeClassIndex = 1 |
| else |
| const JSFinalObjectSizeClassIndex = 3 |
| end |
| |
| # This must match wtf/Vector.h |
| const VectorBufferOffset = 0 |
| if JSVALUE64 |
| const VectorSizeOffset = 12 |
| else |
| const VectorSizeOffset = 8 |
| end |
| |
| # Some common utilities. |
| macro crash() |
| if C_LOOP |
| cloopCrash |
| else |
| call _llint_crash |
| end |
| end |
| |
| macro assert(assertion) |
| if ASSERT_ENABLED |
| assertion(.ok) |
| crash() |
| .ok: |
| end |
| end |
| |
| macro checkStackPointerAlignment(tempReg, location) |
| if ARM64 or C_LOOP or SH4 |
| # ARM64 will check for us! |
| # C_LOOP does not need the alignment, and can use a little perf |
| # improvement from avoiding useless work. |
| # SH4 does not need specific alignment (4 bytes). |
| else |
| if ARM or ARMv7 or ARMv7_TRADITIONAL |
| # ARM can't do logical ops with the sp as a source |
| move sp, tempReg |
| andp StackAlignmentMask, tempReg |
| else |
| andp sp, StackAlignmentMask, tempReg |
| end |
| btpz tempReg, .stackPointerOkay |
| move location, tempReg |
| break |
| .stackPointerOkay: |
| end |
| end |
| |
| if C_LOOP |
| const CalleeSaveRegisterCount = 0 |
| elsif ARM or ARMv7_TRADITIONAL or ARMv7 |
| const CalleeSaveRegisterCount = 7 |
| elsif ARM64 |
| const CalleeSaveRegisterCount = 10 |
| elsif SH4 or X86_64 or MIPS |
| const CalleeSaveRegisterCount = 5 |
| elsif X86 or X86_WIN |
| const CalleeSaveRegisterCount = 3 |
| elsif X86_64_WIN |
| const CalleeSaveRegisterCount = 7 |
| end |
| |
| const CalleeRegisterSaveSize = CalleeSaveRegisterCount * PtrSize |
| |
| # VMEntryTotalFrameSize includes the space for struct VMEntryRecord and the |
| # callee save registers rounded up to keep the stack aligned |
| const VMEntryTotalFrameSize = (CalleeRegisterSaveSize + sizeof VMEntryRecord + StackAlignment - 1) & ~StackAlignmentMask |
| |
| macro pushCalleeSaves() |
| if C_LOOP |
| elsif ARM or ARMv7_TRADITIONAL |
| emit "push {r4-r10}" |
| elsif ARMv7 |
| emit "push {r4-r6, r8-r11}" |
| elsif ARM64 |
| emit "stp x20, x19, [sp, #-16]!" |
| emit "stp x22, x21, [sp, #-16]!" |
| emit "stp x24, x23, [sp, #-16]!" |
| emit "stp x26, x25, [sp, #-16]!" |
| emit "stp x28, x27, [sp, #-16]!" |
| elsif MIPS |
| emit "addiu $sp, $sp, -20" |
| emit "sw $20, 16($sp)" |
| emit "sw $19, 12($sp)" |
| emit "sw $18, 8($sp)" |
| emit "sw $17, 4($sp)" |
| emit "sw $16, 0($sp)" |
| elsif SH4 |
| emit "mov.l r13, @-r15" |
| emit "mov.l r11, @-r15" |
| emit "mov.l r10, @-r15" |
| emit "mov.l r9, @-r15" |
| emit "mov.l r8, @-r15" |
| elsif X86 |
| emit "push %esi" |
| emit "push %edi" |
| emit "push %ebx" |
| elsif X86_WIN |
| emit "push esi" |
| emit "push edi" |
| emit "push ebx" |
| elsif X86_64 |
| emit "push %r12" |
| emit "push %r13" |
| emit "push %r14" |
| emit "push %r15" |
| emit "push %rbx" |
| elsif X86_64_WIN |
| emit "push r12" |
| emit "push r13" |
| emit "push r14" |
| emit "push r15" |
| emit "push rbx" |
| emit "push rdi" |
| emit "push rsi" |
| end |
| end |
| |
| macro popCalleeSaves() |
| if C_LOOP |
| elsif ARM or ARMv7_TRADITIONAL |
| emit "pop {r4-r10}" |
| elsif ARMv7 |
| emit "pop {r4-r6, r8-r11}" |
| elsif ARM64 |
| emit "ldp x28, x27, [sp], #16" |
| emit "ldp x26, x25, [sp], #16" |
| emit "ldp x24, x23, [sp], #16" |
| emit "ldp x22, x21, [sp], #16" |
| emit "ldp x20, x19, [sp], #16" |
| elsif MIPS |
| emit "lw $16, 0($sp)" |
| emit "lw $17, 4($sp)" |
| emit "lw $18, 8($sp)" |
| emit "lw $19, 12($sp)" |
| emit "lw $20, 16($sp)" |
| emit "addiu $sp, $sp, 20" |
| elsif SH4 |
| emit "mov.l @r15+, r8" |
| emit "mov.l @r15+, r9" |
| emit "mov.l @r15+, r10" |
| emit "mov.l @r15+, r11" |
| emit "mov.l @r15+, r13" |
| elsif X86 |
| emit "pop %ebx" |
| emit "pop %edi" |
| emit "pop %esi" |
| elsif X86_WIN |
| emit "pop ebx" |
| emit "pop edi" |
| emit "pop esi" |
| elsif X86_64 |
| emit "pop %rbx" |
| emit "pop %r15" |
| emit "pop %r14" |
| emit "pop %r13" |
| emit "pop %r12" |
| elsif X86_64_WIN |
| emit "pop rsi" |
| emit "pop rdi" |
| emit "pop rbx" |
| emit "pop r15" |
| emit "pop r14" |
| emit "pop r13" |
| emit "pop r12" |
| end |
| end |
| |
| macro preserveCallerPCAndCFR() |
| if C_LOOP or ARM or ARMv7 or ARMv7_TRADITIONAL or MIPS or SH4 |
| push lr |
| push cfr |
| elsif X86 or X86_WIN or X86_64 or X86_64_WIN |
| push cfr |
| elsif ARM64 |
| push cfr, lr |
| else |
| error |
| end |
| move sp, cfr |
| end |
| |
| macro restoreCallerPCAndCFR() |
| move cfr, sp |
| if C_LOOP or ARM or ARMv7 or ARMv7_TRADITIONAL or MIPS or SH4 |
| pop cfr |
| pop lr |
| elsif X86 or X86_WIN or X86_64 or X86_64_WIN |
| pop cfr |
| elsif ARM64 |
| pop lr, cfr |
| end |
| end |
| |
| macro preserveReturnAddressAfterCall(destinationRegister) |
| if C_LOOP or ARM or ARMv7 or ARMv7_TRADITIONAL or ARM64 or MIPS or SH4 |
| # In C_LOOP case, we're only preserving the bytecode vPC. |
| move lr, destinationRegister |
| elsif X86 or X86_WIN or X86_64 or X86_64_WIN |
| pop destinationRegister |
| else |
| error |
| end |
| end |
| |
| macro restoreReturnAddressBeforeReturn(sourceRegister) |
| if C_LOOP or ARM or ARMv7 or ARMv7_TRADITIONAL or ARM64 or MIPS or SH4 |
| # In C_LOOP case, we're only restoring the bytecode vPC. |
| move sourceRegister, lr |
| elsif X86 or X86_WIN or X86_64 or X86_64_WIN |
| push sourceRegister |
| else |
| error |
| end |
| end |
| |
| macro functionPrologue() |
| if X86 or X86_WIN or X86_64 or X86_64_WIN |
| push cfr |
| elsif ARM64 |
| push cfr, lr |
| elsif C_LOOP or ARM or ARMv7 or ARMv7_TRADITIONAL or MIPS or SH4 |
| push lr |
| push cfr |
| end |
| move sp, cfr |
| end |
| |
| macro functionEpilogue() |
| if X86 or X86_WIN or X86_64 or X86_64_WIN |
| pop cfr |
| elsif ARM64 |
| pop lr, cfr |
| elsif C_LOOP or ARM or ARMv7 or ARMv7_TRADITIONAL or MIPS or SH4 |
| pop cfr |
| pop lr |
| end |
| end |
| |
| macro vmEntryRecord(entryFramePointer, resultReg) |
| subp entryFramePointer, VMEntryTotalFrameSize, resultReg |
| end |
| |
| macro getFrameRegisterSizeForCodeBlock(codeBlock, size) |
| loadi CodeBlock::m_numCalleeRegisters[codeBlock], size |
| lshiftp 3, size |
| addp maxFrameExtentForSlowPathCall, size |
| end |
| |
| macro restoreStackPointerAfterCall() |
| loadp CodeBlock[cfr], t2 |
| getFrameRegisterSizeForCodeBlock(t2, t4) |
| if ARMv7 |
| subp cfr, t4, t4 |
| move t4, sp |
| else |
| subp cfr, t4, sp |
| end |
| end |
| |
| macro traceExecution() |
| if EXECUTION_TRACING |
| callSlowPath(_llint_trace) |
| end |
| end |
| |
| macro callTargetFunction(callLinkInfo, calleeFramePtr) |
| move calleeFramePtr, sp |
| if C_LOOP |
| cloopCallJSFunction LLIntCallLinkInfo::machineCodeTarget[callLinkInfo] |
| else |
| call LLIntCallLinkInfo::machineCodeTarget[callLinkInfo] |
| end |
| restoreStackPointerAfterCall() |
| dispatchAfterCall() |
| end |
| |
| macro slowPathForCall(slowPath) |
| callCallSlowPath( |
| slowPath, |
| macro (callee) |
| btpz t1, .dontUpdateSP |
| if ARMv7 |
| addp CallerFrameAndPCSize, t1, t1 |
| move t1, sp |
| else |
| addp CallerFrameAndPCSize, t1, sp |
| end |
| .dontUpdateSP: |
| if C_LOOP |
| cloopCallJSFunction callee |
| else |
| call callee |
| end |
| restoreStackPointerAfterCall() |
| dispatchAfterCall() |
| end) |
| end |
| |
| macro arrayProfile(cellAndIndexingType, profile, scratch) |
| const cell = cellAndIndexingType |
| const indexingType = cellAndIndexingType |
| loadi JSCell::m_structureID[cell], scratch |
| storei scratch, ArrayProfile::m_lastSeenStructureID[profile] |
| loadb JSCell::m_indexingType[cell], indexingType |
| end |
| |
| macro skipIfIsRememberedOrInEden(cell, scratch1, scratch2, continuation) |
| loadb JSCell::m_gcData[cell], scratch1 |
| continuation(scratch1) |
| end |
| |
| macro checkSwitchToJIT(increment, action) |
| loadp CodeBlock[cfr], t0 |
| baddis increment, CodeBlock::m_llintExecuteCounter + BaselineExecutionCounter::m_counter[t0], .continue |
| action() |
| .continue: |
| end |
| |
| macro checkSwitchToJITForEpilogue() |
| checkSwitchToJIT( |
| 10, |
| macro () |
| callSlowPath(_llint_replace) |
| end) |
| end |
| |
| macro assertNotConstant(index) |
| assert(macro (ok) bilt index, FirstConstantRegisterIndex, ok end) |
| end |
| |
| macro functionForCallCodeBlockGetter(targetRegister) |
| if JSVALUE64 |
| loadp Callee[cfr], targetRegister |
| else |
| loadp Callee + PayloadOffset[cfr], targetRegister |
| end |
| loadp JSFunction::m_executable[targetRegister], targetRegister |
| loadp FunctionExecutable::m_codeBlockForCall[targetRegister], targetRegister |
| end |
| |
| macro functionForConstructCodeBlockGetter(targetRegister) |
| if JSVALUE64 |
| loadp Callee[cfr], targetRegister |
| else |
| loadp Callee + PayloadOffset[cfr], targetRegister |
| end |
| loadp JSFunction::m_executable[targetRegister], targetRegister |
| loadp FunctionExecutable::m_codeBlockForConstruct[targetRegister], targetRegister |
| end |
| |
| macro notFunctionCodeBlockGetter(targetRegister) |
| loadp CodeBlock[cfr], targetRegister |
| end |
| |
| macro functionCodeBlockSetter(sourceRegister) |
| storep sourceRegister, CodeBlock[cfr] |
| end |
| |
| macro notFunctionCodeBlockSetter(sourceRegister) |
| # Nothing to do! |
| end |
| |
| # Do the bare minimum required to execute code. Sets up the PC, leave the CodeBlock* |
| # in t1. May also trigger prologue entry OSR. |
| macro prologue(codeBlockGetter, codeBlockSetter, osrSlowPath, traceSlowPath) |
| # Set up the call frame and check if we should OSR. |
| preserveCallerPCAndCFR() |
| |
| if EXECUTION_TRACING |
| subp maxFrameExtentForSlowPathCall, sp |
| callSlowPath(traceSlowPath) |
| addp maxFrameExtentForSlowPathCall, sp |
| end |
| codeBlockGetter(t1) |
| if not C_LOOP |
| baddis 5, CodeBlock::m_llintExecuteCounter + BaselineExecutionCounter::m_counter[t1], .continue |
| if JSVALUE64 |
| cCall2(osrSlowPath, cfr, PC) |
| else |
| # We are after the function prologue, but before we have set up sp from the CodeBlock. |
| # Temporarily align stack pointer for this call. |
| subp 8, sp |
| cCall2(osrSlowPath, cfr, PC) |
| addp 8, sp |
| end |
| btpz t0, .recover |
| move cfr, sp # restore the previous sp |
| # pop the callerFrame since we will jump to a function that wants to save it |
| if ARM64 |
| pop lr, cfr |
| elsif ARM or ARMv7 or ARMv7_TRADITIONAL or MIPS or SH4 |
| pop cfr |
| pop lr |
| else |
| pop cfr |
| end |
| jmp t0 |
| .recover: |
| codeBlockGetter(t1) |
| .continue: |
| end |
| |
| codeBlockSetter(t1) |
| |
| # Set up the PC. |
| if JSVALUE64 |
| loadp CodeBlock::m_instructions[t1], PB |
| move 0, PC |
| else |
| loadp CodeBlock::m_instructions[t1], PC |
| end |
| |
| # Get new sp in t0 and check stack height. |
| getFrameRegisterSizeForCodeBlock(t1, t0) |
| subp cfr, t0, t0 |
| loadp CodeBlock::m_vm[t1], t2 |
| bpbeq VM::m_jsStackLimit[t2], t0, .stackHeightOK |
| |
| # Stack height check failed - need to call a slow_path. |
| subp maxFrameExtentForSlowPathCall, sp # Set up temporary stack pointer for call |
| callSlowPath(_llint_stack_check) |
| bpeq t1, 0, .stackHeightOKGetCodeBlock |
| move t1, cfr |
| dispatch(0) # Go to exception handler in PC |
| |
| .stackHeightOKGetCodeBlock: |
| # Stack check slow path returned that the stack was ok. |
| # Since they were clobbered, need to get CodeBlock and new sp |
| codeBlockGetter(t1) |
| getFrameRegisterSizeForCodeBlock(t1, t0) |
| subp cfr, t0, t0 |
| |
| .stackHeightOK: |
| move t0, sp |
| end |
| |
| # Expects that CodeBlock is in t1, which is what prologue() leaves behind. |
| # Must call dispatch(0) after calling this. |
| macro functionInitialization(profileArgSkip) |
| # Profile the arguments. Unfortunately, we have no choice but to do this. This |
| # code is pretty horrendous because of the difference in ordering between |
| # arguments and value profiles, the desire to have a simple loop-down-to-zero |
| # loop, and the desire to use only three registers so as to preserve the PC and |
| # the code block. It is likely that this code should be rewritten in a more |
| # optimal way for architectures that have more than five registers available |
| # for arbitrary use in the interpreter. |
| loadi CodeBlock::m_numParameters[t1], t0 |
| addp -profileArgSkip, t0 # Use addi because that's what has the peephole |
| assert(macro (ok) bpgteq t0, 0, ok end) |
| btpz t0, .argumentProfileDone |
| loadp CodeBlock::m_argumentValueProfiles + VectorBufferOffset[t1], t3 |
| mulp sizeof ValueProfile, t0, t2 # Aaaaahhhh! Need strength reduction! |
| lshiftp 3, t0 |
| addp t2, t3 |
| .argumentProfileLoop: |
| if JSVALUE64 |
| loadq ThisArgumentOffset - 8 + profileArgSkip * 8[cfr, t0], t2 |
| subp sizeof ValueProfile, t3 |
| storeq t2, profileArgSkip * sizeof ValueProfile + ValueProfile::m_buckets[t3] |
| else |
| loadi ThisArgumentOffset + TagOffset - 8 + profileArgSkip * 8[cfr, t0], t2 |
| subp sizeof ValueProfile, t3 |
| storei t2, profileArgSkip * sizeof ValueProfile + ValueProfile::m_buckets + TagOffset[t3] |
| loadi ThisArgumentOffset + PayloadOffset - 8 + profileArgSkip * 8[cfr, t0], t2 |
| storei t2, profileArgSkip * sizeof ValueProfile + ValueProfile::m_buckets + PayloadOffset[t3] |
| end |
| baddpnz -8, t0, .argumentProfileLoop |
| .argumentProfileDone: |
| end |
| |
| macro allocateJSObject(allocator, structure, result, scratch1, slowCase) |
| const offsetOfFirstFreeCell = |
| MarkedAllocator::m_freeList + |
| MarkedBlock::FreeList::head |
| |
| # Get the object from the free list. |
| loadp offsetOfFirstFreeCell[allocator], result |
| btpz result, slowCase |
| |
| # Remove the object from the free list. |
| loadp [result], scratch1 |
| storep scratch1, offsetOfFirstFreeCell[allocator] |
| |
| # Initialize the object. |
| storep 0, JSObject::m_butterfly[result] |
| storeStructureWithTypeInfo(result, structure, scratch1) |
| end |
| |
| macro doReturn() |
| restoreCallerPCAndCFR() |
| ret |
| end |
| |
| # stub to call into JavaScript or Native functions |
| # EncodedJSValue vmEntryToJavaScript(void* code, VM* vm, ProtoCallFrame* protoFrame) |
| # EncodedJSValue vmEntryToNativeFunction(void* code, VM* vm, ProtoCallFrame* protoFrame) |
| |
| if C_LOOP |
| _llint_vm_entry_to_javascript: |
| else |
| global _vmEntryToJavaScript |
| _vmEntryToJavaScript: |
| end |
| doVMEntry(makeJavaScriptCall) |
| |
| |
| if C_LOOP |
| _llint_vm_entry_to_native: |
| else |
| global _vmEntryToNative |
| _vmEntryToNative: |
| end |
| doVMEntry(makeHostFunctionCall) |
| |
| |
| if not C_LOOP |
| # void sanitizeStackForVMImpl(VM* vm) |
| global _sanitizeStackForVMImpl |
| _sanitizeStackForVMImpl: |
| if X86_64 |
| const vm = t4 |
| const address = t1 |
| const zeroValue = t0 |
| elsif X86_64_WIN |
| const vm = t2 |
| const address = t1 |
| const zeroValue = t0 |
| elsif X86 or X86_WIN |
| const vm = t2 |
| const address = t1 |
| const zeroValue = t0 |
| else |
| const vm = a0 |
| const address = t1 |
| const zeroValue = t2 |
| end |
| |
| if X86 or X86_WIN |
| loadp 4[sp], vm |
| end |
| |
| loadp VM::m_lastStackTop[vm], address |
| bpbeq sp, address, .zeroFillDone |
| |
| move 0, zeroValue |
| .zeroFillLoop: |
| storep zeroValue, [address] |
| addp PtrSize, address |
| bpa sp, address, .zeroFillLoop |
| |
| .zeroFillDone: |
| move sp, address |
| storep address, VM::m_lastStackTop[vm] |
| ret |
| |
| # VMEntryRecord* vmEntryRecord(const VMEntryFrame* entryFrame) |
| global _vmEntryRecord |
| _vmEntryRecord: |
| if X86_64 |
| const entryFrame = t4 |
| const result = t0 |
| elsif X86 or X86_WIN or X86_64_WIN |
| const entryFrame = t2 |
| const result = t0 |
| else |
| const entryFrame = a0 |
| const result = t0 |
| end |
| |
| if X86 or X86_WIN |
| loadp 4[sp], entryFrame |
| end |
| |
| vmEntryRecord(entryFrame, result) |
| ret |
| end |
| |
| if C_LOOP |
| # Dummy entry point the C Loop uses to initialize. |
| _llint_entry: |
| crash() |
| else |
| macro initPCRelative(pcBase) |
| if X86_64 or X86_64_WIN |
| call _relativePCBase |
| _relativePCBase: |
| pop pcBase |
| elsif X86 or X86_WIN |
| call _relativePCBase |
| _relativePCBase: |
| pop pcBase |
| loadp 20[sp], t4 |
| elsif ARM64 |
| elsif ARMv7 |
| _relativePCBase: |
| move pc, pcBase |
| subp 3, pcBase # Need to back up the PC and set the Thumb2 bit |
| elsif ARM or ARMv7_TRADITIONAL |
| _relativePCBase: |
| move pc, pcBase |
| subp 8, pcBase |
| elsif MIPS |
| la _relativePCBase, pcBase |
| _relativePCBase: |
| elsif SH4 |
| mova _relativePCBase, t0 |
| move t0, pcBase |
| alignformova |
| _relativePCBase: |
| end |
| end |
| |
| macro setEntryAddress(index, label) |
| if X86_64 |
| leap (label - _relativePCBase)[t1], t0 |
| move index, t2 |
| storep t0, [t4, t2, 8] |
| elsif X86_64_WIN |
| leap (label - _relativePCBase)[t1], t0 |
| move index, t4 |
| storep t0, [t2, t4, 8] |
| elsif X86 or X86_WIN |
| leap (label - _relativePCBase)[t1], t0 |
| move index, t2 |
| storep t0, [t4, t2, 4] |
| elsif ARM64 |
| pcrtoaddr label, t1 |
| move index, t2 |
| storep t1, [a0, t2, 8] |
| elsif ARM or ARMv7 or ARMv7_TRADITIONAL |
| mvlbl (label - _relativePCBase), t2 |
| addp t2, t1, t2 |
| move index, t3 |
| storep t2, [a0, t3, 4] |
| elsif SH4 |
| move (label - _relativePCBase), t2 |
| addp t2, t1, t2 |
| move index, t3 |
| storep t2, [a0, t3, 4] |
| flushcp # Force constant pool flush to avoid "pcrel too far" link error. |
| elsif MIPS |
| la label, t2 |
| la _relativePCBase, t3 |
| subp t3, t2 |
| addp t2, t1, t2 |
| move index, t3 |
| storep t2, [a0, t3, 4] |
| end |
| end |
| |
| global _llint_entry |
| # Entry point for the llint to initialize. |
| _llint_entry: |
| functionPrologue() |
| pushCalleeSaves() |
| initPCRelative(t1) |
| |
| # Include generated bytecode initialization file. |
| include InitBytecodes |
| |
| popCalleeSaves() |
| functionEpilogue() |
| ret |
| end |
| |
| _llint_program_prologue: |
| prologue(notFunctionCodeBlockGetter, notFunctionCodeBlockSetter, _llint_entry_osr, _llint_trace_prologue) |
| dispatch(0) |
| |
| |
| _llint_eval_prologue: |
| prologue(notFunctionCodeBlockGetter, notFunctionCodeBlockSetter, _llint_entry_osr, _llint_trace_prologue) |
| dispatch(0) |
| |
| |
| _llint_function_for_call_prologue: |
| prologue(functionForCallCodeBlockGetter, functionCodeBlockSetter, _llint_entry_osr_function_for_call, _llint_trace_prologue_function_for_call) |
| functionInitialization(0) |
| dispatch(0) |
| |
| |
| _llint_function_for_construct_prologue: |
| prologue(functionForConstructCodeBlockGetter, functionCodeBlockSetter, _llint_entry_osr_function_for_construct, _llint_trace_prologue_function_for_construct) |
| functionInitialization(1) |
| dispatch(0) |
| |
| |
| _llint_function_for_call_arity_check: |
| prologue(functionForCallCodeBlockGetter, functionCodeBlockSetter, _llint_entry_osr_function_for_call_arityCheck, _llint_trace_arityCheck_for_call) |
| functionArityCheck(.functionForCallBegin, _slow_path_call_arityCheck) |
| .functionForCallBegin: |
| functionInitialization(0) |
| dispatch(0) |
| |
| |
| _llint_function_for_construct_arity_check: |
| prologue(functionForConstructCodeBlockGetter, functionCodeBlockSetter, _llint_entry_osr_function_for_construct_arityCheck, _llint_trace_arityCheck_for_construct) |
| functionArityCheck(.functionForConstructBegin, _slow_path_construct_arityCheck) |
| .functionForConstructBegin: |
| functionInitialization(1) |
| dispatch(0) |
| |
| |
| # Value-representation-specific code. |
| if JSVALUE64 |
| include LowLevelInterpreter64 |
| else |
| include LowLevelInterpreter32_64 |
| end |
| |
| |
| # Value-representation-agnostic code. |
| _llint_op_touch_entry: |
| traceExecution() |
| callSlowPath(_slow_path_touch_entry) |
| dispatch(1) |
| |
| |
| _llint_op_new_array: |
| traceExecution() |
| callSlowPath(_llint_slow_path_new_array) |
| dispatch(5) |
| |
| |
| _llint_op_new_array_with_size: |
| traceExecution() |
| callSlowPath(_llint_slow_path_new_array_with_size) |
| dispatch(4) |
| |
| |
| _llint_op_new_array_buffer: |
| traceExecution() |
| callSlowPath(_llint_slow_path_new_array_buffer) |
| dispatch(5) |
| |
| |
| _llint_op_new_regexp: |
| traceExecution() |
| callSlowPath(_llint_slow_path_new_regexp) |
| dispatch(3) |
| |
| |
| _llint_op_less: |
| traceExecution() |
| callSlowPath(_slow_path_less) |
| dispatch(4) |
| |
| |
| _llint_op_lesseq: |
| traceExecution() |
| callSlowPath(_slow_path_lesseq) |
| dispatch(4) |
| |
| |
| _llint_op_greater: |
| traceExecution() |
| callSlowPath(_slow_path_greater) |
| dispatch(4) |
| |
| |
| _llint_op_greatereq: |
| traceExecution() |
| callSlowPath(_slow_path_greatereq) |
| dispatch(4) |
| |
| |
| _llint_op_mod: |
| traceExecution() |
| callSlowPath(_slow_path_mod) |
| dispatch(4) |
| |
| |
| _llint_op_typeof: |
| traceExecution() |
| callSlowPath(_slow_path_typeof) |
| dispatch(3) |
| |
| |
| _llint_op_is_object_or_null: |
| traceExecution() |
| callSlowPath(_slow_path_is_object_or_null) |
| dispatch(3) |
| |
| _llint_op_is_function: |
| traceExecution() |
| callSlowPath(_slow_path_is_function) |
| dispatch(3) |
| |
| |
| _llint_op_in: |
| traceExecution() |
| callSlowPath(_slow_path_in) |
| dispatch(4) |
| |
| macro withInlineStorage(object, propertyStorage, continuation) |
| # Indicate that the object is the property storage, and that the |
| # property storage register is unused. |
| continuation(object, propertyStorage) |
| end |
| |
| macro withOutOfLineStorage(object, propertyStorage, continuation) |
| loadp JSObject::m_butterfly[object], propertyStorage |
| # Indicate that the propertyStorage register now points to the |
| # property storage, and that the object register may be reused |
| # if the object pointer is not needed anymore. |
| continuation(propertyStorage, object) |
| end |
| |
| |
| _llint_op_del_by_id: |
| traceExecution() |
| callSlowPath(_llint_slow_path_del_by_id) |
| dispatch(4) |
| |
| |
| _llint_op_del_by_val: |
| traceExecution() |
| callSlowPath(_llint_slow_path_del_by_val) |
| dispatch(4) |
| |
| |
| _llint_op_put_by_index: |
| traceExecution() |
| callSlowPath(_llint_slow_path_put_by_index) |
| dispatch(4) |
| |
| |
| _llint_op_put_getter_setter: |
| traceExecution() |
| callSlowPath(_llint_slow_path_put_getter_setter) |
| dispatch(5) |
| |
| |
| _llint_op_jtrue: |
| traceExecution() |
| jumpTrueOrFalse( |
| macro (value, target) btinz value, target end, |
| _llint_slow_path_jtrue) |
| |
| |
| _llint_op_jfalse: |
| traceExecution() |
| jumpTrueOrFalse( |
| macro (value, target) btiz value, target end, |
| _llint_slow_path_jfalse) |
| |
| |
| _llint_op_jless: |
| traceExecution() |
| compare( |
| macro (left, right, target) bilt left, right, target end, |
| macro (left, right, target) bdlt left, right, target end, |
| _llint_slow_path_jless) |
| |
| |
| _llint_op_jnless: |
| traceExecution() |
| compare( |
| macro (left, right, target) bigteq left, right, target end, |
| macro (left, right, target) bdgtequn left, right, target end, |
| _llint_slow_path_jnless) |
| |
| |
| _llint_op_jgreater: |
| traceExecution() |
| compare( |
| macro (left, right, target) bigt left, right, target end, |
| macro (left, right, target) bdgt left, right, target end, |
| _llint_slow_path_jgreater) |
| |
| |
| _llint_op_jngreater: |
| traceExecution() |
| compare( |
| macro (left, right, target) bilteq left, right, target end, |
| macro (left, right, target) bdltequn left, right, target end, |
| _llint_slow_path_jngreater) |
| |
| |
| _llint_op_jlesseq: |
| traceExecution() |
| compare( |
| macro (left, right, target) bilteq left, right, target end, |
| macro (left, right, target) bdlteq left, right, target end, |
| _llint_slow_path_jlesseq) |
| |
| |
| _llint_op_jnlesseq: |
| traceExecution() |
| compare( |
| macro (left, right, target) bigt left, right, target end, |
| macro (left, right, target) bdgtun left, right, target end, |
| _llint_slow_path_jnlesseq) |
| |
| |
| _llint_op_jgreatereq: |
| traceExecution() |
| compare( |
| macro (left, right, target) bigteq left, right, target end, |
| macro (left, right, target) bdgteq left, right, target end, |
| _llint_slow_path_jgreatereq) |
| |
| |
| _llint_op_jngreatereq: |
| traceExecution() |
| compare( |
| macro (left, right, target) bilt left, right, target end, |
| macro (left, right, target) bdltun left, right, target end, |
| _llint_slow_path_jngreatereq) |
| |
| |
| _llint_op_loop_hint: |
| traceExecution() |
| loadp CodeBlock[cfr], t1 |
| loadp CodeBlock::m_vm[t1], t1 |
| loadp VM::watchdog[t1], t0 |
| btpnz t0, .handleWatchdogTimer |
| .afterWatchdogTimerCheck: |
| checkSwitchToJITForLoop() |
| dispatch(1) |
| .handleWatchdogTimer: |
| loadb Watchdog::m_timerDidFire[t0], t0 |
| btbz t0, .afterWatchdogTimerCheck |
| callWatchdogTimerHandler(.throwHandler) |
| jmp .afterWatchdogTimerCheck |
| .throwHandler: |
| jmp _llint_throw_from_slow_path_trampoline |
| |
| _llint_op_switch_string: |
| traceExecution() |
| callSlowPath(_llint_slow_path_switch_string) |
| dispatch(0) |
| |
| |
| _llint_op_new_func_exp: |
| traceExecution() |
| callSlowPath(_llint_slow_path_new_func_exp) |
| dispatch(4) |
| |
| |
| _llint_op_call: |
| traceExecution() |
| arrayProfileForCall() |
| doCall(_llint_slow_path_call) |
| |
| |
| _llint_op_construct: |
| traceExecution() |
| doCall(_llint_slow_path_construct) |
| |
| |
| _llint_op_call_varargs: |
| traceExecution() |
| callSlowPath(_llint_slow_path_size_frame_for_varargs) |
| branchIfException(_llint_throw_from_slow_path_trampoline) |
| # calleeFrame in t1 |
| if JSVALUE64 |
| move t1, sp |
| else |
| # The calleeFrame is not stack aligned, move down by CallerFrameAndPCSize to align |
| if ARMv7 |
| subp t1, CallerFrameAndPCSize, t2 |
| move t2, sp |
| else |
| subp t1, CallerFrameAndPCSize, sp |
| end |
| end |
| slowPathForCall(_llint_slow_path_call_varargs) |
| |
| _llint_op_construct_varargs: |
| traceExecution() |
| callSlowPath(_llint_slow_path_size_frame_for_varargs) |
| branchIfException(_llint_throw_from_slow_path_trampoline) |
| # calleeFrame in t1 |
| if JSVALUE64 |
| move t1, sp |
| else |
| # The calleeFrame is not stack aligned, move down by CallerFrameAndPCSize to align |
| if ARMv7 |
| subp t1, CallerFrameAndPCSize, t2 |
| move t2, sp |
| else |
| subp t1, CallerFrameAndPCSize, sp |
| end |
| end |
| slowPathForCall(_llint_slow_path_construct_varargs) |
| |
| |
| _llint_op_call_eval: |
| traceExecution() |
| |
| # Eval is executed in one of two modes: |
| # |
| # 1) We find that we're really invoking eval() in which case the |
| # execution is perfomed entirely inside the slow_path, and it |
| # returns the PC of a function that just returns the return value |
| # that the eval returned. |
| # |
| # 2) We find that we're invoking something called eval() that is not |
| # the real eval. Then the slow_path returns the PC of the thing to |
| # call, and we call it. |
| # |
| # This allows us to handle two cases, which would require a total of |
| # up to four pieces of state that cannot be easily packed into two |
| # registers (C functions can return up to two registers, easily): |
| # |
| # - The call frame register. This may or may not have been modified |
| # by the slow_path, but the convention is that it returns it. It's not |
| # totally clear if that's necessary, since the cfr is callee save. |
| # But that's our style in this here interpreter so we stick with it. |
| # |
| # - A bit to say if the slow_path successfully executed the eval and has |
| # the return value, or did not execute the eval but has a PC for us |
| # to call. |
| # |
| # - Either: |
| # - The JS return value (two registers), or |
| # |
| # - The PC to call. |
| # |
| # It turns out to be easier to just always have this return the cfr |
| # and a PC to call, and that PC may be a dummy thunk that just |
| # returns the JS value that the eval returned. |
| |
| slowPathForCall(_llint_slow_path_call_eval) |
| |
| |
| _llint_generic_return_point: |
| dispatchAfterCall() |
| |
| |
| _llint_op_strcat: |
| traceExecution() |
| callSlowPath(_slow_path_strcat) |
| dispatch(4) |
| |
| |
| _llint_op_push_with_scope: |
| traceExecution() |
| callSlowPath(_llint_slow_path_push_with_scope) |
| dispatch(3) |
| |
| |
| _llint_op_pop_scope: |
| traceExecution() |
| callSlowPath(_llint_slow_path_pop_scope) |
| dispatch(2) |
| |
| |
| _llint_op_push_name_scope: |
| traceExecution() |
| callSlowPath(_llint_slow_path_push_name_scope) |
| dispatch(5) |
| |
| |
| _llint_op_throw: |
| traceExecution() |
| callSlowPath(_llint_slow_path_throw) |
| dispatch(2) |
| |
| |
| _llint_op_throw_static_error: |
| traceExecution() |
| callSlowPath(_llint_slow_path_throw_static_error) |
| dispatch(3) |
| |
| |
| _llint_op_profile_will_call: |
| traceExecution() |
| loadp CodeBlock[cfr], t0 |
| loadp CodeBlock::m_vm[t0], t0 |
| loadi VM::m_enabledProfiler[t0], t0 |
| btpz t0, .opProfilerWillCallDone |
| callSlowPath(_llint_slow_path_profile_will_call) |
| .opProfilerWillCallDone: |
| dispatch(2) |
| |
| |
| _llint_op_profile_did_call: |
| traceExecution() |
| loadp CodeBlock[cfr], t0 |
| loadp CodeBlock::m_vm[t0], t0 |
| loadi VM::m_enabledProfiler[t0], t0 |
| btpz t0, .opProfilerDidCallDone |
| callSlowPath(_llint_slow_path_profile_did_call) |
| .opProfilerDidCallDone: |
| dispatch(2) |
| |
| |
| _llint_op_debug: |
| traceExecution() |
| loadp CodeBlock[cfr], t0 |
| loadi CodeBlock::m_debuggerRequests[t0], t0 |
| btiz t0, .opDebugDone |
| callSlowPath(_llint_slow_path_debug) |
| .opDebugDone: |
| dispatch(3) |
| |
| |
| _llint_native_call_trampoline: |
| nativeCallTrampoline(NativeExecutable::m_function) |
| |
| |
| _llint_native_construct_trampoline: |
| nativeCallTrampoline(NativeExecutable::m_constructor) |
| |
| _llint_op_get_enumerable_length: |
| traceExecution() |
| callSlowPath(_slow_path_get_enumerable_length) |
| dispatch(3) |
| |
| _llint_op_has_indexed_property: |
| traceExecution() |
| callSlowPath(_slow_path_has_indexed_property) |
| dispatch(5) |
| |
| _llint_op_has_structure_property: |
| traceExecution() |
| callSlowPath(_slow_path_has_structure_property) |
| dispatch(5) |
| |
| _llint_op_has_generic_property: |
| traceExecution() |
| callSlowPath(_slow_path_has_generic_property) |
| dispatch(4) |
| |
| _llint_op_get_direct_pname: |
| traceExecution() |
| callSlowPath(_slow_path_get_direct_pname) |
| dispatch(7) |
| |
| _llint_op_get_property_enumerator: |
| traceExecution() |
| callSlowPath(_slow_path_get_property_enumerator) |
| dispatch(3) |
| |
| _llint_op_enumerator_structure_pname: |
| traceExecution() |
| callSlowPath(_slow_path_next_structure_enumerator_pname) |
| dispatch(4) |
| |
| _llint_op_enumerator_generic_pname: |
| traceExecution() |
| callSlowPath(_slow_path_next_generic_enumerator_pname) |
| dispatch(4) |
| |
| _llint_op_to_index_string: |
| traceExecution() |
| callSlowPath(_slow_path_to_index_string) |
| dispatch(3) |
| |
| _llint_op_profile_control_flow: |
| traceExecution() |
| loadpFromInstruction(1, t0) |
| storeb 1, BasicBlockLocation::m_hasExecuted[t0] |
| dispatch(2) |
| |
| # Lastly, make sure that we can link even though we don't support all opcodes. |
| # These opcodes should never arise when using LLInt or either JIT. We assert |
| # as much. |
| |
| macro notSupported() |
| if ASSERT_ENABLED |
| crash() |
| else |
| # We should use whatever the smallest possible instruction is, just to |
| # ensure that there is a gap between instruction labels. If multiple |
| # smallest instructions exist, we should pick the one that is most |
| # likely result in execution being halted. Currently that is the break |
| # instruction on all architectures we're interested in. (Break is int3 |
| # on Intel, which is 1 byte, and bkpt on ARMv7, which is 2 bytes.) |
| break |
| end |
| end |
| |
| _llint_op_init_global_const_nop: |
| dispatch(5) |