/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- * vim: set ts=8 sts=2 et sw=2 tw=80: * This Source Code Form is subject to the terms of the Mozilla Public * License, v. 2.0. If a copy of the MPL was not distributed with this * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ #ifndef jit_MacroAssembler_h #define jit_MacroAssembler_h #include "mozilla/EndianUtils.h" #include "mozilla/MacroForEach.h" #include "mozilla/MathAlgorithms.h" #include "mozilla/Maybe.h" #include "mozilla/Variant.h" #if defined(JS_CODEGEN_X86) # include "jit/x86/MacroAssembler-x86.h" #elif defined(JS_CODEGEN_X64) # include "jit/x64/MacroAssembler-x64.h" #elif defined(JS_CODEGEN_ARM) # include "jit/arm/MacroAssembler-arm.h" #elif defined(JS_CODEGEN_ARM64) # include "jit/arm64/MacroAssembler-arm64.h" #elif defined(JS_CODEGEN_MIPS32) # include "jit/mips32/MacroAssembler-mips32.h" #elif defined(JS_CODEGEN_MIPS64) # include "jit/mips64/MacroAssembler-mips64.h" #elif defined(JS_CODEGEN_LOONG64) # include "jit/loong64/MacroAssembler-loong64.h" #elif defined(JS_CODEGEN_WASM32) # include "jit/wasm32/MacroAssembler-wasm32.h" #elif defined(JS_CODEGEN_NONE) # include "jit/none/MacroAssembler-none.h" #else # error "Unknown architecture!" #endif #include "jit/ABIArgGenerator.h" #include "jit/ABIFunctions.h" #include "jit/AtomicOp.h" #include "jit/IonTypes.h" #include "jit/MoveResolver.h" #include "jit/VMFunctions.h" #include "js/ScalarType.h" // js::Scalar::Type #include "util/Memory.h" #include "vm/FunctionFlags.h" #include "vm/Opcodes.h" #include "wasm/WasmCodegenTypes.h" #include "wasm/WasmFrame.h" // [SMDOC] MacroAssembler multi-platform overview // // * How to read/write MacroAssembler method declarations: // // The following macros are made to avoid #ifdef around each method declarations // of the Macro Assembler, and they are also used as an hint on the location of // the implementations of each method. For example, the following declaration // // void Pop(FloatRegister t) DEFINED_ON(x86_shared, arm); // // suggests the MacroAssembler::Pop(FloatRegister) method is implemented in // x86-shared/MacroAssembler-x86-shared.h, and also in arm/MacroAssembler-arm.h. // // - If there is no annotation, then there is only one generic definition in // MacroAssembler.cpp. // // - If the declaration is "inline", then the method definition(s) would be in // the "-inl.h" variant of the same file(s). // // The script check_macroassembler_style.py (which runs on every build) is // used to verify that method definitions match the annotation on the method // declarations. If there is any difference, then you either forgot to define // the method in one of the macro assembler, or you forgot to update the // annotation of the macro assembler declaration. // // Some convenient short-cuts are used to avoid repeating the same list of // architectures on each method declaration, such as PER_ARCH and // PER_SHARED_ARCH. // // Functions that are architecture-agnostic and are the same for all // architectures, that it's necessary to define inline *in this header* to // avoid used-before-defined warnings/errors that would occur if the // definitions were in MacroAssembler-inl.h, should use the OOL_IN_HEADER // marker at end of the declaration: // // inline uint32_t framePushed() const OOL_IN_HEADER; // // Such functions should then be defined immediately after MacroAssembler's // definition, for example: // // //{{{ check_macroassembler_style // inline uint32_t // MacroAssembler::framePushed() const // { // return framePushed_; // } // ////}}} check_macroassembler_style #define ALL_ARCH mips32, mips64, arm, arm64, x86, x64, loong64, wasm32 #define ALL_SHARED_ARCH arm, arm64, loong64, x86_shared, mips_shared, wasm32 // * How this macro works: // // DEFINED_ON is a macro which check if, for the current architecture, the // method is defined on the macro assembler or not. // // For each architecture, we have a macro named DEFINED_ON_arch. This macro is // empty if this is not the current architecture. Otherwise it must be either // set to "define" or "crash" (only used for the none target so far). // // The DEFINED_ON macro maps the list of architecture names given as arguments // to a list of macro names. For example, // // DEFINED_ON(arm, x86_shared) // // is expanded to // // DEFINED_ON_none DEFINED_ON_arm DEFINED_ON_x86_shared // // which are later expanded on ARM, x86, x64 by DEFINED_ON_EXPAND_ARCH_RESULTS // to // // define // // or if the JIT is disabled or set to no architecture to // // crash // // or to nothing, if the current architecture is not listed in the list of // arguments of DEFINED_ON. Note, only one of the DEFINED_ON_arch macro // contributes to the non-empty result, which is the macro of the current // architecture if it is listed in the arguments of DEFINED_ON. // // This result is appended to DEFINED_ON_RESULT_ before expanding the macro, // which results in either no annotation, a MOZ_CRASH(), or a "= delete" // annotation on the method declaration. #define DEFINED_ON_x86 #define DEFINED_ON_x64 #define DEFINED_ON_x86_shared #define DEFINED_ON_arm #define DEFINED_ON_arm64 #define DEFINED_ON_mips32 #define DEFINED_ON_mips64 #define DEFINED_ON_mips_shared #define DEFINED_ON_loong64 #define DEFINED_ON_wasm32 #define DEFINED_ON_none // Specialize for each architecture. #if defined(JS_CODEGEN_X86) # undef DEFINED_ON_x86 # define DEFINED_ON_x86 define # undef DEFINED_ON_x86_shared # define DEFINED_ON_x86_shared define #elif defined(JS_CODEGEN_X64) # undef DEFINED_ON_x64 # define DEFINED_ON_x64 define # undef DEFINED_ON_x86_shared # define DEFINED_ON_x86_shared define #elif defined(JS_CODEGEN_ARM) # undef DEFINED_ON_arm # define DEFINED_ON_arm define #elif defined(JS_CODEGEN_ARM64) # undef DEFINED_ON_arm64 # define DEFINED_ON_arm64 define #elif defined(JS_CODEGEN_MIPS32) # undef DEFINED_ON_mips32 # define DEFINED_ON_mips32 define # undef DEFINED_ON_mips_shared # define DEFINED_ON_mips_shared define #elif defined(JS_CODEGEN_MIPS64) # undef DEFINED_ON_mips64 # define DEFINED_ON_mips64 define # undef DEFINED_ON_mips_shared # define DEFINED_ON_mips_shared define #elif defined(JS_CODEGEN_LOONG64) # undef DEFINED_ON_loong64 # define DEFINED_ON_loong64 define #elif defined(JS_CODEGEN_WASM32) # undef DEFINED_ON_wasm32 # define DEFINED_ON_wasm32 define #elif defined(JS_CODEGEN_NONE) # undef DEFINED_ON_none # define DEFINED_ON_none crash #else # error "Unknown architecture!" #endif #define DEFINED_ON_RESULT_crash \ { MOZ_CRASH(); } #define DEFINED_ON_RESULT_define #define DEFINED_ON_RESULT_ = delete #define DEFINED_ON_DISPATCH_RESULT_2(Macro, Result) Macro##Result #define DEFINED_ON_DISPATCH_RESULT(...) \ DEFINED_ON_DISPATCH_RESULT_2(DEFINED_ON_RESULT_, __VA_ARGS__) // We need to let the evaluation of MOZ_FOR_EACH terminates. #define DEFINED_ON_EXPAND_ARCH_RESULTS_3(ParenResult) \ DEFINED_ON_DISPATCH_RESULT ParenResult #define DEFINED_ON_EXPAND_ARCH_RESULTS_2(ParenResult) \ DEFINED_ON_EXPAND_ARCH_RESULTS_3(ParenResult) #define DEFINED_ON_EXPAND_ARCH_RESULTS(ParenResult) \ DEFINED_ON_EXPAND_ARCH_RESULTS_2(ParenResult) #define DEFINED_ON_FWDARCH(Arch) DEFINED_ON_##Arch #define DEFINED_ON_MAP_ON_ARCHS(ArchList) \ DEFINED_ON_EXPAND_ARCH_RESULTS( \ (MOZ_FOR_EACH(DEFINED_ON_FWDARCH, (), ArchList))) #define DEFINED_ON(...) DEFINED_ON_MAP_ON_ARCHS((none, __VA_ARGS__)) #define PER_ARCH DEFINED_ON(ALL_ARCH) #define PER_SHARED_ARCH DEFINED_ON(ALL_SHARED_ARCH) #define OOL_IN_HEADER namespace JS { struct ExpandoAndGeneration; } namespace js { class StaticStrings; class TypedArrayObject; namespace wasm { class CalleeDesc; class CallSiteDesc; class BytecodeOffset; class MemoryAccessDesc; struct ModuleEnvironment; enum class FailureMode : uint8_t; enum class SimdOp; enum class SymbolicAddress; enum class Trap; } // namespace wasm namespace jit { // Defined in JitFrames.h enum class ExitFrameType : uint8_t; class AutoSaveLiveRegisters; class CompileZone; class TemplateNativeObject; class TemplateObject; enum class CheckUnsafeCallWithABI { // Require the callee to use AutoUnsafeCallWithABI. Check, // We pushed an exit frame so this callWithABI can safely GC and walk the // stack. DontCheckHasExitFrame, // Don't check this callWithABI uses AutoUnsafeCallWithABI, for instance // because we're calling a simple helper function (like malloc or js_free) // that we can't change and/or that we know won't GC. DontCheckOther, }; // This is a global function made to create the DynFn type in a controlled // environment which would check if the function signature has been registered // as an ABI function signature. template static inline DynFn DynamicFunction(Sig fun); enum class CharEncoding { Latin1, TwoByte }; constexpr uint32_t WasmCallerInstanceOffsetBeforeCall = wasm::FrameWithInstances::callerInstanceOffsetWithoutFrame(); constexpr uint32_t WasmCalleeInstanceOffsetBeforeCall = wasm::FrameWithInstances::calleeInstanceOffsetWithoutFrame(); // Allocation sites may be passed to GC thing allocation methods either via a // register (for baseline compilation) or an enum indicating one of the // catch-all allocation sites (for optimized compilation). struct AllocSiteInput : public mozilla::Variant { using Base = mozilla::Variant; AllocSiteInput() : Base(gc::CatchAllAllocSite::Unknown) {} explicit AllocSiteInput(gc::CatchAllAllocSite catchAll) : Base(catchAll) {} explicit AllocSiteInput(Register reg) : Base(reg) {} }; // [SMDOC] Code generation invariants (incomplete) // // ## 64-bit GPRs carrying 32-bit values // // At least at the end of every JS or Wasm operation (= SpiderMonkey bytecode or // Wasm bytecode; this is necessarily a little vague), if a 64-bit GPR has a // 32-bit value, then the upper 32 bits of the register may be predictable in // accordance with platform-specific rules, as follows. // // - On x64 and arm64, the upper bits are zero // - On mips64 and loongarch64 the upper bits are the sign extension of the // lower bits // - (On risc-v we have no rule, having no port yet. Sign extension is the most // likely rule, but "unpredictable" is an option.) // // In most cases no extra work needs to be done to maintain the invariant: // // - 32-bit operations on x64 and arm64 zero-extend the result to 64 bits. // These operations ignore the upper bits of the inputs. // - 32-bit operations on mips64 sign-extend the result to 64 bits (even many // that are labeled as "unsigned", eg ADDU, though not all, eg LU). // Additionally, the inputs to many 32-bit operations must be properly // sign-extended to avoid "unpredictable" behavior, and our simulators check // that inputs conform. // - (32-bit operations on risc-v and loongarch64 sign-extend, much as mips, but // appear to ignore the upper bits of the inputs.) // // The upshot of these invariants is, among other things, that: // // - No code needs to be generated when a 32-bit value is extended to 64 bits // or a 64-bit value is wrapped to 32 bits, if the upper bits are known to be // correct because they resulted from an operation that produced them // predictably. // - Literal loads must be careful to avoid instructions that might extend the // literal in the wrong way. // - Code that produces values using intermediate values with non-canonical // extensions must extend according to platform conventions before being // "done". // // All optimizations are necessarily platform-specific and should only be used // in platform-specific code. We may add architectures in the future that do // not follow the patterns of the few architectures we already have. // // Also see MacroAssembler::debugAssertCanonicalInt32(). // The public entrypoint for emitting assembly. Note that a MacroAssembler can // use cx->lifoAlloc, so take care not to interleave masm use with other // lifoAlloc use if one will be destroyed before the other. class MacroAssembler : public MacroAssemblerSpecific { private: // Information about the current JSRuntime. This is nullptr only for Wasm // compilations. CompileRuntime* maybeRuntime_ = nullptr; // Information about the current Realm. This is nullptr for Wasm compilations // and when compiling JitRuntime trampolines. CompileRealm* maybeRealm_ = nullptr; // Labels for handling exceptions and failures. NonAssertingLabel failureLabel_; protected: // Constructor is protected. Use one of the derived classes! explicit MacroAssembler(TempAllocator& alloc, CompileRuntime* maybeRuntime = nullptr, CompileRealm* maybeRealm = nullptr); public: MoveResolver& moveResolver() { // As an optimization, the MoveResolver is a persistent data structure // shared between visitors in the CodeGenerator. This assertion // checks that state is not leaking from visitor to visitor // via an unresolved addMove(). MOZ_ASSERT(moveResolver_.hasNoPendingMoves()); return moveResolver_; } size_t instructionsSize() const { return size(); } CompileRealm* realm() const { MOZ_ASSERT(maybeRealm_); return maybeRealm_; } CompileRuntime* runtime() const { MOZ_ASSERT(maybeRuntime_); return maybeRuntime_; } #ifdef JS_HAS_HIDDEN_SP void Push(RegisterOrSP reg); #endif #ifdef ENABLE_WASM_SIMD // `op` should be a shift operation. Return true if a variable-width shift // operation on this architecture should pre-mask the shift count, and if so, // return the mask in `*mask`. static bool MustMaskShiftCountSimd128(wasm::SimdOp op, int32_t* mask); #endif private: // The value returned by GetMaxOffsetGuardLimit() in WasmTypes.h uint32_t wasmMaxOffsetGuardLimit_; public: uint32_t wasmMaxOffsetGuardLimit() const { return wasmMaxOffsetGuardLimit_; } void setWasmMaxOffsetGuardLimit(uint32_t limit) { wasmMaxOffsetGuardLimit_ = limit; } //{{{ check_macroassembler_decl_style public: // =============================================================== // MacroAssembler high-level usage. // Flushes the assembly buffer, on platforms that need it. void flush() PER_SHARED_ARCH; // Add a comment that is visible in the pretty printed assembly code. void comment(const char* msg) PER_SHARED_ARCH; // =============================================================== // Frame manipulation functions. inline uint32_t framePushed() const OOL_IN_HEADER; inline void setFramePushed(uint32_t framePushed) OOL_IN_HEADER; inline void adjustFrame(int32_t value) OOL_IN_HEADER; // Adjust the frame, to account for implicit modification of the stack // pointer, such that callee can remove arguments on the behalf of the // caller. inline void implicitPop(uint32_t bytes) OOL_IN_HEADER; private: // This field is used to statically (at compilation time) emulate a frame // pointer by keeping track of stack manipulations. // // It is maintained by all stack manipulation functions below. uint32_t framePushed_; public: // =============================================================== // Stack manipulation functions -- sets of registers. // Approximately speaking, the following routines must use the same memory // layout. Any inconsistencies will certainly lead to crashing in generated // code: // // MacroAssembler::PushRegsInMaskSizeInBytes // MacroAssembler::PushRegsInMask // MacroAssembler::storeRegsInMask // MacroAssembler::PopRegsInMask // MacroAssembler::PopRegsInMaskIgnore // FloatRegister::getRegisterDumpOffsetInBytes // (no class) PushRegisterDump // (union) RegisterContent // JitRuntime::generateInvalidator // JitRuntime::generateBailoutHandler // JSJitFrameIter::machineState // // To be more exact, the invariants are: // // * The save area is conceptually viewed as starting at a highest address // (really, at "highest address - 1") and working down to some lower // address. // // * PushRegsInMask, storeRegsInMask and PopRegsInMask{Ignore} must use // exactly the same memory layout, when starting from the abovementioned // highest address. // // * PushRegsInMaskSizeInBytes must produce a value which is exactly equal // to the change in the machine's stack pointer register as a result of // calling PushRegsInMask or PopRegsInMask{Ignore}. This value must be at // least uintptr_t-aligned on the target, and may be more aligned than that. // // * PushRegsInMaskSizeInBytes must produce a value which is greater than or // equal to the amount of space used by storeRegsInMask. // // * Hence, regardless of whether the save area is created with // storeRegsInMask or PushRegsInMask, it is guaranteed to fit inside an // area of size calculated by PushRegsInMaskSizeInBytes. // // * For the `ignore` argument of PopRegsInMaskIgnore, equality checking // for the floating point/SIMD registers is done on the basis of the // underlying physical register, regardless of width. For example, if the // to-restore set contains v17 (the SIMD register with encoding 17) and // the ignore set contains d17 (the double register with encoding 17) then // no part of the physical register with encoding 17 will be restored. // (This is probably not true on arm32, since that has aliased float32 // registers; but none of our other targets do.) // // * {Push,store}RegsInMask/storeRegsInMask are further constrained as // follows: when given the argument AllFloatRegisters, the resulting // memory area must contain exactly all the SIMD/FP registers for the // target at their widest width (that we care about). [We have no targets // where the SIMD registers and FP register sets are disjoint.] They must // be packed end-to-end with no holes, with the register with the lowest // encoding number (0), as returned by FloatRegister::encoding(), at the // abovementioned highest address, register 1 just below that, etc. // // Furthermore the sizeof(RegisterContent) must equal the size of a SIMD // register in the abovementioned array. // // Furthermore the value returned by // FloatRegister::getRegisterDumpOffsetInBytes must be a correct index // into the abovementioned array. Given the constraints, the only correct // value is `reg.encoding() * sizeof(RegisterContent)`. // // Note that some of the routines listed above are JS-only, and do not support // SIMD registers. They are otherwise part of the same equivalence class. // Register spilling for e.g. OOL VM calls is implemented using // PushRegsInMask, and recovered on bailout using machineState. This requires // the same layout to be used in machineState, and therefore in all other code // that can spill registers that are recovered on bailout. Implementations of // JitRuntime::generate{Invalidator,BailoutHandler} should either call // PushRegsInMask, or check carefully to be sure that they generate the same // layout. // The size of the area used by PushRegsInMask. size_t PushRegsInMaskSizeInBytes(LiveRegisterSet set) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); void PushRegsInMask(LiveRegisterSet set) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); void PushRegsInMask(LiveGeneralRegisterSet set); // Like PushRegsInMask, but instead of pushing the registers, store them to // |dest|. |dest| should point to the end of the reserved space, so the // first register will be stored at |dest.offset - sizeof(register)|. It is // required that |dest.offset| is at least as large as the value computed by // PushRegsInMaskSizeInBytes for this |set|. In other words, |dest.base| // must point to either the lowest address in the save area, or some address // below that. void storeRegsInMask(LiveRegisterSet set, Address dest, Register scratch) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); void PopRegsInMask(LiveRegisterSet set); void PopRegsInMask(LiveGeneralRegisterSet set); void PopRegsInMaskIgnore(LiveRegisterSet set, LiveRegisterSet ignore) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); // =============================================================== // Stack manipulation functions -- single registers/values. void Push(const Operand op) DEFINED_ON(x86_shared); void Push(Register reg) PER_SHARED_ARCH; void Push(Register reg1, Register reg2, Register reg3, Register reg4) DEFINED_ON(arm64); void Push(const Imm32 imm) PER_SHARED_ARCH; void Push(const ImmWord imm) PER_SHARED_ARCH; void Push(const ImmPtr imm) PER_SHARED_ARCH; void Push(const ImmGCPtr ptr) PER_SHARED_ARCH; void Push(FloatRegister reg) PER_SHARED_ARCH; void PushBoxed(FloatRegister reg) PER_ARCH; void PushFlags() DEFINED_ON(x86_shared); void Push(PropertyKey key, Register scratchReg); void Push(const Address& addr); void Push(TypedOrValueRegister v); void Push(const ConstantOrRegister& v); void Push(const ValueOperand& val); void Push(const Value& val); void Push(JSValueType type, Register reg); void Push(const Register64 reg); void PushEmptyRooted(VMFunctionData::RootType rootType); inline CodeOffset PushWithPatch(ImmWord word); inline CodeOffset PushWithPatch(ImmPtr imm); void Pop(const Operand op) DEFINED_ON(x86_shared); void Pop(Register reg) PER_SHARED_ARCH; void Pop(FloatRegister t) PER_SHARED_ARCH; void Pop(const ValueOperand& val) PER_SHARED_ARCH; void PopFlags() DEFINED_ON(x86_shared); void PopStackPtr() DEFINED_ON(arm, mips_shared, x86_shared, loong64, wasm32); void popRooted(VMFunctionData::RootType rootType, Register cellReg, const ValueOperand& valueReg); // Move the stack pointer based on the requested amount. void adjustStack(int amount); void freeStack(uint32_t amount); // Warning: This method does not update the framePushed() counter. void freeStack(Register amount); private: // =============================================================== // Register allocation fields. #ifdef DEBUG friend AutoRegisterScope; friend AutoFloatRegisterScope; // Used to track register scopes for debug builds. // Manipulated by the AutoGenericRegisterScope class. AllocatableRegisterSet debugTrackedRegisters_; #endif // DEBUG public: // =============================================================== // Simple call functions. // The returned CodeOffset is the assembler offset for the instruction // immediately following the call; that is, for the return point. CodeOffset call(Register reg) PER_SHARED_ARCH; CodeOffset call(Label* label) PER_SHARED_ARCH; void call(const Address& addr) PER_SHARED_ARCH; void call(ImmWord imm) PER_SHARED_ARCH; // Call a target native function, which is neither traceable nor movable. void call(ImmPtr imm) PER_SHARED_ARCH; CodeOffset call(wasm::SymbolicAddress imm) PER_SHARED_ARCH; inline CodeOffset call(const wasm::CallSiteDesc& desc, wasm::SymbolicAddress imm); // Call a target JitCode, which must be traceable, and may be movable. void call(JitCode* c) PER_SHARED_ARCH; inline void call(TrampolinePtr code); inline CodeOffset call(const wasm::CallSiteDesc& desc, const Register reg); inline CodeOffset call(const wasm::CallSiteDesc& desc, uint32_t funcDefIndex); inline void call(const wasm::CallSiteDesc& desc, wasm::Trap trap); CodeOffset callWithPatch() PER_SHARED_ARCH; void patchCall(uint32_t callerOffset, uint32_t calleeOffset) PER_SHARED_ARCH; // Push the return address and make a call. On platforms where this function // is not defined, push the link register (pushReturnAddress) at the entry // point of the callee. void callAndPushReturnAddress(Register reg) DEFINED_ON(x86_shared); void callAndPushReturnAddress(Label* label) DEFINED_ON(x86_shared); // These do not adjust framePushed(). void pushReturnAddress() DEFINED_ON(mips_shared, arm, arm64, loong64, wasm32); void popReturnAddress() DEFINED_ON(mips_shared, arm, arm64, loong64, wasm32); // Useful for dealing with two-valued returns. void moveRegPair(Register src0, Register src1, Register dst0, Register dst1, MoveOp::Type type = MoveOp::GENERAL); public: // =============================================================== // Patchable near/far jumps. // "Far jumps" provide the ability to jump to any uint32_t offset from any // other uint32_t offset without using a constant pool (thus returning a // simple CodeOffset instead of a CodeOffsetJump). CodeOffset farJumpWithPatch() PER_SHARED_ARCH; void patchFarJump(CodeOffset farJump, uint32_t targetOffset) PER_SHARED_ARCH; // Emit a nop that can be patched to and from a nop and a call with int32 // relative displacement. CodeOffset nopPatchableToCall() PER_SHARED_ARCH; void nopPatchableToCall(const wasm::CallSiteDesc& desc); static void patchNopToCall(uint8_t* callsite, uint8_t* target) PER_SHARED_ARCH; static void patchCallToNop(uint8_t* callsite) PER_SHARED_ARCH; // These methods are like movWithPatch/PatchDataWithValueCheck but allow // using pc-relative addressing on certain platforms (RIP-relative LEA on x64, // ADR instruction on arm64). // // Note: "Near" applies to ARM64 where the target must be within 1 MB (this is // release-asserted). CodeOffset moveNearAddressWithPatch(Register dest) DEFINED_ON(x86, x64, arm, arm64, loong64, wasm32, mips_shared); static void patchNearAddressMove(CodeLocationLabel loc, CodeLocationLabel target) DEFINED_ON(x86, x64, arm, arm64, loong64, wasm32, mips_shared); public: // =============================================================== // [SMDOC] JIT-to-C++ Function Calls (callWithABI) // // callWithABI is used to make a call using the standard C/C++ system ABI. // // callWithABI is a low level interface for making calls, as such every call // made with callWithABI should be organized with 6 steps: spilling live // registers, aligning the stack, listing arguments of the called function, // calling a function pointer, extracting the returned value and restoring // live registers. // // A more detailed example of the six stages: // // 1) Saving of registers that are live. This will vary depending on which // SpiderMonkey compiler you are working on. Registers that shouldn't be // restored can be excluded. // // LiveRegisterSet volatileRegs(...); // volatileRegs.take(scratch); // masm.PushRegsInMask(volatileRegs); // // 2) Align the stack to perform the call with the correct stack alignment. // // When the stack pointer alignment is unknown and cannot be corrected // when generating the code, setupUnalignedABICall must be used to // dynamically align the stack pointer to the expectation of the ABI. // When the stack pointer is known at JIT compilation time, the stack can // be fixed manually and setupAlignedABICall and setupWasmABICall can be // used. // // setupWasmABICall is a special case of setupAlignedABICall as // SpiderMonkey's WebAssembly implementation mostly follow the system // ABI, except for float/double arguments, which always use floating // point registers, even if this is not supported by the system ABI. // // masm.setupUnalignedABICall(scratch); // // 3) Passing arguments. Arguments are passed left-to-right. // // masm.passABIArg(scratch); // masm.passABIArg(FloatOp0, MoveOp::Double); // // Note how float register arguments are annotated with MoveOp::Double. // // Concerning stack-relative address, see the note on passABIArg. // // 4) Make the call: // // using Fn = int32_t (*)(int32_t) // masm.callWithABI(); // // In the case where the call returns a double, that needs to be // indicated to the callWithABI like this: // // using Fn = double (*)(int32_t) // masm.callWithABI(MoveOp::DOUBLE); // // There are overloads to allow calls to registers and addresses. // // 5) Take care of the result // // masm.storeCallPointerResult(scratch1); // masm.storeCallBoolResult(scratch1); // masm.storeCallInt32Result(scratch1); // masm.storeCallFloatResult(scratch1); // // 6) Restore the potentially clobbered volatile registers // // masm.PopRegsInMask(volatileRegs); // // If expecting a returned value, this call should use // PopRegsInMaskIgnore to filter out the registers which are containing // the returned value. // // Unless an exit frame is pushed prior to the setupABICall, the callee // should not GC. To ensure this is the case callWithABI is instrumented to // make sure that in the default case callees are annotated with an // AutoUnsafeCallWithABI on the stack. // // A callWithABI can opt out of checking, if for example it is known there // is an exit frame, or the callee is known not to GC. // // If your callee needs to be able to GC, consider using a VMFunction, or // create a fake exit frame, and instrument the TraceJitExitFrame // accordingly. // Setup a call to C/C++ code, given the assumption that the framePushed // accurately defines the state of the stack, and that the top of the stack // was properly aligned. Note that this only supports cdecl. // // As a rule of thumb, this can be used in CodeGenerator but not in CacheIR or // Baseline code (because the stack is not aligned to ABIStackAlignment). void setupAlignedABICall(); // As setupAlignedABICall, but for WebAssembly native ABI calls, which pass // through a builtin thunk that uses the wasm ABI. All the wasm ABI calls // can be native, since we always know the stack alignment a priori. void setupWasmABICall(); // Setup an ABI call for when the alignment is not known. This may need a // scratch register. void setupUnalignedABICall(Register scratch) PER_ARCH; // Arguments must be assigned to a C/C++ call in order. They are moved // in parallel immediately before performing the call. This process may // temporarily use more stack, in which case esp-relative addresses will be // automatically adjusted. It is extremely important that esp-relative // addresses are computed *after* setupABICall(). Furthermore, no // operations should be emitted while setting arguments. void passABIArg(const MoveOperand& from, MoveOp::Type type); inline void passABIArg(Register reg); inline void passABIArg(FloatRegister reg, MoveOp::Type type); inline void callWithABI( DynFn fun, MoveOp::Type result = MoveOp::GENERAL, CheckUnsafeCallWithABI check = CheckUnsafeCallWithABI::Check); template inline void callWithABI( MoveOp::Type result = MoveOp::GENERAL, CheckUnsafeCallWithABI check = CheckUnsafeCallWithABI::Check); inline void callWithABI(Register fun, MoveOp::Type result = MoveOp::GENERAL); inline void callWithABI(const Address& fun, MoveOp::Type result = MoveOp::GENERAL); CodeOffset callWithABI(wasm::BytecodeOffset offset, wasm::SymbolicAddress fun, mozilla::Maybe instanceOffset, MoveOp::Type result = MoveOp::GENERAL); void callDebugWithABI(wasm::SymbolicAddress fun, MoveOp::Type result = MoveOp::GENERAL); private: // Reinitialize the variables which have to be cleared before making a call // with callWithABI. template void setupABICallHelper(); // Reinitialize the variables which have to be cleared before making a call // with native abi. void setupNativeABICall(); // Reserve the stack and resolve the arguments move. void callWithABIPre(uint32_t* stackAdjust, bool callFromWasm = false) PER_ARCH; // Emits a call to a C/C++ function, resolving all argument moves. void callWithABINoProfiler(void* fun, MoveOp::Type result, CheckUnsafeCallWithABI check); void callWithABINoProfiler(Register fun, MoveOp::Type result) PER_ARCH; void callWithABINoProfiler(const Address& fun, MoveOp::Type result) PER_ARCH; // Restore the stack to its state before the setup function call. void callWithABIPost(uint32_t stackAdjust, MoveOp::Type result, bool callFromWasm = false) PER_ARCH; // Create the signature to be able to decode the arguments of a native // function, when calling a function within the simulator. inline void appendSignatureType(MoveOp::Type type); inline ABIFunctionType signature() const; // Private variables used to handle moves between registers given as // arguments to passABIArg and the list of ABI registers expected for the // signature of the function. MoveResolver moveResolver_; // Architecture specific implementation which specify how registers & stack // offsets are used for calling a function. ABIArgGenerator abiArgs_; #ifdef DEBUG // Flag use to assert that we use ABI function in the right context. bool inCall_; #endif // If set by setupUnalignedABICall then callWithABI will pop the stack // register which is on the stack. bool dynamicAlignment_; #ifdef JS_SIMULATOR // The signature is used to accumulate all types of arguments which are used // by the caller. This is used by the simulators to decode the arguments // properly, and cast the function pointer to the right type. uint32_t signature_; #endif public: // =============================================================== // Jit Frames. // // These functions are used to build the content of the Jit frames. See // CommonFrameLayout class, and all its derivatives. The content should be // pushed in the opposite order as the fields of the structures, such that // the structures can be used to interpret the content of the stack. // Call the Jit function, and push the return address (or let the callee // push the return address). // // These functions return the offset of the return address, in order to use // the return address to index the safepoints, which are used to list all // live registers. inline uint32_t callJitNoProfiler(Register callee); inline uint32_t callJit(Register callee); inline uint32_t callJit(JitCode* code); inline uint32_t callJit(TrampolinePtr code); inline uint32_t callJit(ImmPtr callee); // The frame descriptor is the second field of all Jit frames, pushed before // calling the Jit function. See CommonFrameLayout::descriptor_. inline void pushFrameDescriptor(FrameType type); inline void PushFrameDescriptor(FrameType type); // For JitFrameLayout, the descriptor also stores the number of arguments // passed by the caller. See MakeFrameDescriptorForJitCall. inline void pushFrameDescriptorForJitCall(FrameType type, uint32_t argc); inline void pushFrameDescriptorForJitCall(FrameType type, Register argc, Register scratch); inline void PushFrameDescriptorForJitCall(FrameType type, uint32_t argc); inline void PushFrameDescriptorForJitCall(FrameType type, Register argc, Register scratch); // Load the number of actual arguments from the frame's JitFrameLayout. inline void loadNumActualArgs(Register framePtr, Register dest); // Push the callee token of a JSFunction which pointer is stored in the // |callee| register. The callee token is packed with a |constructing| flag // which correspond to the fact that the JS function is called with "new" or // not. inline void PushCalleeToken(Register callee, bool constructing); // Unpack a callee token located at the |token| address, and return the // JSFunction pointer in the |dest| register. inline void loadFunctionFromCalleeToken(Address token, Register dest); // This function emulates a call by pushing an exit frame on the stack, // except that the fake-function is inlined within the body of the caller. // // This function assumes that the current frame is an IonJS frame. // // This function returns the offset of the /fake/ return address, in order to // use the return address to index the safepoints, which are used to list all // live registers. // // This function should be balanced with a call to adjustStack, to pop the // exit frame and emulate the return statement of the inlined function. inline uint32_t buildFakeExitFrame(Register scratch); private: // This function is used by buildFakeExitFrame to push a fake return address // on the stack. This fake return address should never be used for resuming // any execution, and can even be an invalid pointer into the instruction // stream, as long as it does not alias any other. uint32_t pushFakeReturnAddress(Register scratch) PER_SHARED_ARCH; public: // =============================================================== // Exit frame footer. // // When calling outside the Jit we push an exit frame. To mark the stack // correctly, we have to push additional information, called the Exit frame // footer, which is used to identify how the stack is marked. // // See JitFrames.h, and TraceJitExitFrame in JitFrames.cpp. // Push stub code and the VMFunctionData pointer. inline void enterExitFrame(Register cxreg, Register scratch, const VMFunctionData* f); // Push an exit frame token to identify which fake exit frame this footer // corresponds to. inline void enterFakeExitFrame(Register cxreg, Register scratch, ExitFrameType type); // Push an exit frame token for a native call. inline void enterFakeExitFrameForNative(Register cxreg, Register scratch, bool isConstructing); // Pop ExitFrame footer in addition to the extra frame. inline void leaveExitFrame(size_t extraFrame = 0); private: // Save the top of the stack into JitActivation::packedExitFP of the // current thread, which should be the location of the latest exit frame. void linkExitFrame(Register cxreg, Register scratch); public: // =============================================================== // Move instructions inline void move64(Imm64 imm, Register64 dest) PER_ARCH; inline void move64(Register64 src, Register64 dest) PER_ARCH; inline void moveFloat32ToGPR(FloatRegister src, Register dest) PER_SHARED_ARCH; inline void moveGPRToFloat32(Register src, FloatRegister dest) PER_SHARED_ARCH; inline void moveDoubleToGPR64(FloatRegister src, Register64 dest) PER_ARCH; inline void moveGPR64ToDouble(Register64 src, FloatRegister dest) PER_ARCH; inline void move8SignExtend(Register src, Register dest) PER_SHARED_ARCH; inline void move16SignExtend(Register src, Register dest) PER_SHARED_ARCH; // move64To32 will clear the high bits of `dest` on 64-bit systems. inline void move64To32(Register64 src, Register dest) PER_ARCH; inline void move32To64ZeroExtend(Register src, Register64 dest) PER_ARCH; inline void move8To64SignExtend(Register src, Register64 dest) PER_ARCH; inline void move16To64SignExtend(Register src, Register64 dest) PER_ARCH; inline void move32To64SignExtend(Register src, Register64 dest) PER_ARCH; inline void move32SignExtendToPtr(Register src, Register dest) PER_ARCH; inline void move32ZeroExtendToPtr(Register src, Register dest) PER_ARCH; // Copy a constant, typed-register, or a ValueOperand into a ValueOperand // destination. inline void moveValue(const ConstantOrRegister& src, const ValueOperand& dest); void moveValue(const TypedOrValueRegister& src, const ValueOperand& dest) PER_ARCH; void moveValue(const ValueOperand& src, const ValueOperand& dest) PER_ARCH; void moveValue(const Value& src, const ValueOperand& dest) PER_ARCH; void movePropertyKey(PropertyKey key, Register dest); // =============================================================== // Load instructions inline void load32SignExtendToPtr(const Address& src, Register dest) PER_ARCH; inline void loadAbiReturnAddress(Register dest) PER_SHARED_ARCH; public: // =============================================================== // Logical instructions inline void not32(Register reg) PER_SHARED_ARCH; inline void notPtr(Register reg) PER_ARCH; inline void and32(Register src, Register dest) PER_SHARED_ARCH; inline void and32(Imm32 imm, Register dest) PER_SHARED_ARCH; inline void and32(Imm32 imm, Register src, Register dest) DEFINED_ON(arm64); inline void and32(Imm32 imm, const Address& dest) PER_SHARED_ARCH; inline void and32(const Address& src, Register dest) PER_SHARED_ARCH; inline void andPtr(Register src, Register dest) PER_ARCH; inline void andPtr(Imm32 imm, Register dest) PER_ARCH; inline void and64(Imm64 imm, Register64 dest) PER_ARCH; inline void or64(Imm64 imm, Register64 dest) PER_ARCH; inline void xor64(Imm64 imm, Register64 dest) PER_ARCH; inline void or32(Register src, Register dest) PER_SHARED_ARCH; inline void or32(Imm32 imm, Register dest) PER_SHARED_ARCH; inline void or32(Imm32 imm, const Address& dest) PER_SHARED_ARCH; inline void orPtr(Register src, Register dest) PER_ARCH; inline void orPtr(Imm32 imm, Register dest) PER_ARCH; inline void and64(Register64 src, Register64 dest) PER_ARCH; inline void or64(Register64 src, Register64 dest) PER_ARCH; inline void xor64(Register64 src, Register64 dest) PER_ARCH; inline void xor32(Register src, Register dest) PER_SHARED_ARCH; inline void xor32(Imm32 imm, Register dest) PER_SHARED_ARCH; inline void xor32(Imm32 imm, const Address& dest) PER_SHARED_ARCH; inline void xor32(const Address& src, Register dest) PER_SHARED_ARCH; inline void xorPtr(Register src, Register dest) PER_ARCH; inline void xorPtr(Imm32 imm, Register dest) PER_ARCH; inline void and64(const Operand& src, Register64 dest) DEFINED_ON(x64, mips64, loong64); inline void or64(const Operand& src, Register64 dest) DEFINED_ON(x64, mips64, loong64); inline void xor64(const Operand& src, Register64 dest) DEFINED_ON(x64, mips64, loong64); // =============================================================== // Swap instructions // Swap the two lower bytes and sign extend the result to 32-bit. inline void byteSwap16SignExtend(Register reg) PER_SHARED_ARCH; // Swap the two lower bytes and zero extend the result to 32-bit. inline void byteSwap16ZeroExtend(Register reg) PER_SHARED_ARCH; // Swap all four bytes in a 32-bit integer. inline void byteSwap32(Register reg) PER_SHARED_ARCH; // Swap all eight bytes in a 64-bit integer. inline void byteSwap64(Register64 reg) PER_ARCH; // =============================================================== // Arithmetic functions inline void add32(Register src, Register dest) PER_SHARED_ARCH; inline void add32(Imm32 imm, Register dest) PER_SHARED_ARCH; inline void add32(Imm32 imm, const Address& dest) PER_SHARED_ARCH; inline void add32(Imm32 imm, const AbsoluteAddress& dest) DEFINED_ON(x86_shared); inline void addPtr(Register src, Register dest) PER_ARCH; inline void addPtr(Register src1, Register src2, Register dest) DEFINED_ON(arm64); inline void addPtr(Imm32 imm, Register dest) PER_ARCH; inline void addPtr(Imm32 imm, Register src, Register dest) DEFINED_ON(arm64); inline void addPtr(ImmWord imm, Register dest) PER_ARCH; inline void addPtr(ImmPtr imm, Register dest); inline void addPtr(Imm32 imm, const Address& dest) DEFINED_ON(mips_shared, arm, arm64, x86, x64, loong64, wasm32); inline void addPtr(Imm32 imm, const AbsoluteAddress& dest) DEFINED_ON(x86, x64); inline void addPtr(const Address& src, Register dest) DEFINED_ON(mips_shared, arm, arm64, x86, x64, loong64, wasm32); inline void add64(Register64 src, Register64 dest) PER_ARCH; inline void add64(Imm32 imm, Register64 dest) PER_ARCH; inline void add64(Imm64 imm, Register64 dest) PER_ARCH; inline void add64(const Operand& src, Register64 dest) DEFINED_ON(x64, mips64, loong64); inline void addFloat32(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; // Compute dest=SP-imm where dest is a pointer registers and not SP. The // offset returned from sub32FromStackPtrWithPatch() must be passed to // patchSub32FromStackPtr(). inline CodeOffset sub32FromStackPtrWithPatch(Register dest) PER_ARCH; inline void patchSub32FromStackPtr(CodeOffset offset, Imm32 imm) PER_ARCH; inline void addDouble(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void addConstantDouble(double d, FloatRegister dest) DEFINED_ON(x86); inline void sub32(const Address& src, Register dest) PER_SHARED_ARCH; inline void sub32(Register src, Register dest) PER_SHARED_ARCH; inline void sub32(Imm32 imm, Register dest) PER_SHARED_ARCH; inline void subPtr(Register src, Register dest) PER_ARCH; inline void subPtr(Register src, const Address& dest) DEFINED_ON(mips_shared, arm, arm64, x86, x64, loong64, wasm32); inline void subPtr(Imm32 imm, Register dest) PER_ARCH; inline void subPtr(ImmWord imm, Register dest) DEFINED_ON(x64); inline void subPtr(const Address& addr, Register dest) DEFINED_ON(mips_shared, arm, arm64, x86, x64, loong64, wasm32); inline void sub64(Register64 src, Register64 dest) PER_ARCH; inline void sub64(Imm64 imm, Register64 dest) PER_ARCH; inline void sub64(const Operand& src, Register64 dest) DEFINED_ON(x64, mips64, loong64); inline void subFloat32(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void subDouble(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void mul32(Register rhs, Register srcDest) PER_SHARED_ARCH; inline void mul32(Imm32 imm, Register srcDest) PER_SHARED_ARCH; inline void mul32(Register src1, Register src2, Register dest, Label* onOver) DEFINED_ON(arm64); // Return the high word of the unsigned multiplication into |dest|. inline void mulHighUnsigned32(Imm32 imm, Register src, Register dest) PER_ARCH; inline void mulPtr(Register rhs, Register srcDest) PER_ARCH; inline void mul64(const Operand& src, const Register64& dest) DEFINED_ON(x64); inline void mul64(const Operand& src, const Register64& dest, const Register temp) DEFINED_ON(x64, mips64, loong64); inline void mul64(Imm64 imm, const Register64& dest) PER_ARCH; inline void mul64(Imm64 imm, const Register64& dest, const Register temp) DEFINED_ON(x86, x64, arm, mips32, mips64, loong64); inline void mul64(const Register64& src, const Register64& dest, const Register temp) PER_ARCH; inline void mul64(const Register64& src1, const Register64& src2, const Register64& dest) DEFINED_ON(arm64); inline void mul64(Imm64 src1, const Register64& src2, const Register64& dest) DEFINED_ON(arm64); inline void mulBy3(Register src, Register dest) PER_ARCH; inline void mulFloat32(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void mulDouble(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void mulDoublePtr(ImmPtr imm, Register temp, FloatRegister dest) DEFINED_ON(mips_shared, arm, arm64, x86, x64, loong64, wasm32); // Perform an integer division, returning the integer part rounded toward // zero. rhs must not be zero, and the division must not overflow. // // On ARM, the chip must have hardware division instructions. inline void quotient32(Register rhs, Register srcDest, bool isUnsigned) DEFINED_ON(mips_shared, arm, arm64, loong64, wasm32); // As above, but srcDest must be eax and tempEdx must be edx. inline void quotient32(Register rhs, Register srcDest, Register tempEdx, bool isUnsigned) DEFINED_ON(x86_shared); // Perform an integer division, returning the remainder part. // rhs must not be zero, and the division must not overflow. // // On ARM, the chip must have hardware division instructions. inline void remainder32(Register rhs, Register srcDest, bool isUnsigned) DEFINED_ON(mips_shared, arm, arm64, loong64, wasm32); // As above, but srcDest must be eax and tempEdx must be edx. inline void remainder32(Register rhs, Register srcDest, Register tempEdx, bool isUnsigned) DEFINED_ON(x86_shared); // Perform an integer division, returning the integer part rounded toward // zero. rhs must not be zero, and the division must not overflow. // // This variant preserves registers, and doesn't require hardware division // instructions on ARM (will call out to a runtime routine). // // rhs is preserved, srdDest is clobbered. void flexibleRemainder32(Register rhs, Register srcDest, bool isUnsigned, const LiveRegisterSet& volatileLiveRegs) DEFINED_ON(mips_shared, arm, arm64, x86_shared, loong64, wasm32); // Perform an integer division, returning the integer part rounded toward // zero. rhs must not be zero, and the division must not overflow. // // This variant preserves registers, and doesn't require hardware division // instructions on ARM (will call out to a runtime routine). // // rhs is preserved, srdDest is clobbered. void flexibleQuotient32(Register rhs, Register srcDest, bool isUnsigned, const LiveRegisterSet& volatileLiveRegs) DEFINED_ON(mips_shared, arm, arm64, x86_shared, loong64); // Perform an integer division, returning the integer part rounded toward // zero. rhs must not be zero, and the division must not overflow. The // remainder is stored into the third argument register here. // // This variant preserves registers, and doesn't require hardware division // instructions on ARM (will call out to a runtime routine). // // rhs is preserved, srdDest and remOutput are clobbered. void flexibleDivMod32(Register rhs, Register srcDest, Register remOutput, bool isUnsigned, const LiveRegisterSet& volatileLiveRegs) DEFINED_ON(mips_shared, arm, arm64, x86_shared, loong64, wasm32); inline void divFloat32(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void divDouble(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void inc64(AbsoluteAddress dest) PER_ARCH; inline void neg32(Register reg) PER_SHARED_ARCH; inline void neg64(Register64 reg) PER_ARCH; inline void negPtr(Register reg) PER_ARCH; inline void negateFloat(FloatRegister reg) PER_SHARED_ARCH; inline void negateDouble(FloatRegister reg) PER_SHARED_ARCH; inline void abs32(Register src, Register dest) PER_SHARED_ARCH; inline void absFloat32(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void absDouble(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void sqrtFloat32(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; inline void sqrtDouble(FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; void floorFloat32ToInt32(FloatRegister src, Register dest, Label* fail) PER_SHARED_ARCH; void floorDoubleToInt32(FloatRegister src, Register dest, Label* fail) PER_SHARED_ARCH; void ceilFloat32ToInt32(FloatRegister src, Register dest, Label* fail) PER_SHARED_ARCH; void ceilDoubleToInt32(FloatRegister src, Register dest, Label* fail) PER_SHARED_ARCH; void roundFloat32ToInt32(FloatRegister src, Register dest, FloatRegister temp, Label* fail) PER_SHARED_ARCH; void roundDoubleToInt32(FloatRegister src, Register dest, FloatRegister temp, Label* fail) PER_SHARED_ARCH; void truncFloat32ToInt32(FloatRegister src, Register dest, Label* fail) PER_SHARED_ARCH; void truncDoubleToInt32(FloatRegister src, Register dest, Label* fail) PER_SHARED_ARCH; void nearbyIntDouble(RoundingMode mode, FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; void nearbyIntFloat32(RoundingMode mode, FloatRegister src, FloatRegister dest) PER_SHARED_ARCH; void signInt32(Register input, Register output); void signDouble(FloatRegister input, FloatRegister output); void signDoubleToInt32(FloatRegister input, Register output, FloatRegister temp, Label* fail); void copySignDouble(FloatRegister lhs, FloatRegister rhs, FloatRegister output) PER_SHARED_ARCH; void copySignFloat32(FloatRegister lhs, FloatRegister rhs, FloatRegister output) DEFINED_ON(x86_shared, arm64); // Returns a random double in range [0, 1) in |dest|. The |rng| register must // hold a pointer to a mozilla::non_crypto::XorShift128PlusRNG. void randomDouble(Register rng, FloatRegister dest, Register64 temp0, Register64 temp1); // srcDest = {min,max}{Float32,Double}(srcDest, other) // For min and max, handle NaN specially if handleNaN is true. inline void minFloat32(FloatRegister other, FloatRegister srcDest, bool handleNaN) PER_SHARED_ARCH; inline void minDouble(FloatRegister other, FloatRegister srcDest, bool handleNaN) PER_SHARED_ARCH; inline void maxFloat32(FloatRegister other, FloatRegister srcDest, bool handleNaN) PER_SHARED_ARCH; inline void maxDouble(FloatRegister other, FloatRegister srcDest, bool handleNaN) PER_SHARED_ARCH; void minMaxArrayInt32(Register array, Register result, Register temp1, Register temp2, Register temp3, bool isMax, Label* fail); void minMaxArrayNumber(Register array, FloatRegister result, FloatRegister floatTemp, Register temp1, Register temp2, bool isMax, Label* fail); // Compute |pow(base, power)| and store the result in |dest|. If the result // exceeds the int32 range, jumps to |onOver|. // |base| and |power| are preserved, the other input registers are clobbered. void pow32(Register base, Register power, Register dest, Register temp1, Register temp2, Label* onOver); void sameValueDouble(FloatRegister left, FloatRegister right, FloatRegister temp, Register dest); void branchIfNotRegExpPrototypeOptimizable(Register proto, Register temp, Label* label); void branchIfNotRegExpInstanceOptimizable(Register regexp, Register temp, Label* label); // =============================================================== // Shift functions // For shift-by-register there may be platform-specific variations, for // example, x86 will perform the shift mod 32 but ARM will perform the shift // mod 256. // // For shift-by-immediate the platform assembler may restrict the immediate, // for example, the ARM assembler requires the count for 32-bit shifts to be // in the range [0,31]. inline void lshift32(Imm32 shift, Register srcDest) PER_SHARED_ARCH; inline void rshift32(Imm32 shift, Register srcDest) PER_SHARED_ARCH; inline void rshift32Arithmetic(Imm32 shift, Register srcDest) PER_SHARED_ARCH; inline void lshiftPtr(Imm32 imm, Register dest) PER_ARCH; inline void rshiftPtr(Imm32 imm, Register dest) PER_ARCH; inline void rshiftPtr(Imm32 imm, Register src, Register dest) DEFINED_ON(arm64); inline void rshiftPtrArithmetic(Imm32 imm, Register dest) PER_ARCH; inline void lshift64(Imm32 imm, Register64 dest) PER_ARCH; inline void rshift64(Imm32 imm, Register64 dest) PER_ARCH; inline void rshift64Arithmetic(Imm32 imm, Register64 dest) PER_ARCH; // On x86_shared these have the constraint that shift must be in CL. inline void lshift32(Register shift, Register srcDest) PER_SHARED_ARCH; inline void rshift32(Register shift, Register srcDest) PER_SHARED_ARCH; inline void rshift32Arithmetic(Register shift, Register srcDest) PER_SHARED_ARCH; inline void lshiftPtr(Register shift, Register srcDest) PER_ARCH; inline void rshiftPtr(Register shift, Register srcDest) PER_ARCH; // These variants do not have the above constraint, but may emit some extra // instructions on x86_shared. They also handle shift >= 32 consistently by // masking with 0x1F (either explicitly or relying on the hardware to do // that). inline void flexibleLshift32(Register shift, Register srcDest) PER_SHARED_ARCH; inline void flexibleRshift32(Register shift, Register srcDest) PER_SHARED_ARCH; inline void flexibleRshift32Arithmetic(Register shift, Register srcDest) PER_SHARED_ARCH; inline void lshift64(Register shift, Register64 srcDest) PER_ARCH; inline void rshift64(Register shift, Register64 srcDest) PER_ARCH; inline void rshift64Arithmetic(Register shift, Register64 srcDest) PER_ARCH; // =============================================================== // Rotation functions // Note: - on x86 and x64 the count register must be in CL. // - on x64 the temp register should be InvalidReg. inline void rotateLeft(Imm32 count, Register input, Register dest) PER_SHARED_ARCH; inline void rotateLeft(Register count, Register input, Register dest) PER_SHARED_ARCH; inline void rotateLeft64(Imm32 count, Register64 input, Register64 dest) DEFINED_ON(x64); inline void rotateLeft64(Register count, Register64 input, Register64 dest) DEFINED_ON(x64); inline void rotateLeft64(Imm32 count, Register64 input, Register64 dest, Register temp) PER_ARCH; inline void rotateLeft64(Register count, Register64 input, Register64 dest, Register temp) PER_ARCH; inline void rotateRight(Imm32 count, Register input, Register dest) PER_SHARED_ARCH; inline void rotateRight(Register count, Register input, Register dest) PER_SHARED_ARCH; inline void rotateRight64(Imm32 count, Register64 input, Register64 dest) DEFINED_ON(x64); inline void rotateRight64(Register count, Register64 input, Register64 dest) DEFINED_ON(x64); inline void rotateRight64(Imm32 count, Register64 input, Register64 dest, Register temp) PER_ARCH; inline void rotateRight64(Register count, Register64 input, Register64 dest, Register temp) PER_ARCH; // =============================================================== // Bit counting functions // knownNotZero may be true only if the src is known not to be zero. inline void clz32(Register src, Register dest, bool knownNotZero) PER_SHARED_ARCH; inline void ctz32(Register src, Register dest, bool knownNotZero) PER_SHARED_ARCH; inline void clz64(Register64 src, Register dest) PER_ARCH; inline void ctz64(Register64 src, Register dest) PER_ARCH; // On x86_shared, temp may be Invalid only if the chip has the POPCNT // instruction. On ARM, temp may never be Invalid. inline void popcnt32(Register src, Register dest, Register temp) PER_SHARED_ARCH; // temp may be invalid only if the chip has the POPCNT instruction. inline void popcnt64(Register64 src, Register64 dest, Register temp) PER_ARCH; // =============================================================== // Condition functions inline void cmp8Set(Condition cond, Address lhs, Imm32 rhs, Register dest) PER_SHARED_ARCH; inline void cmp16Set(Condition cond, Address lhs, Imm32 rhs, Register dest) PER_SHARED_ARCH; template inline void cmp32Set(Condition cond, T1 lhs, T2 rhs, Register dest) DEFINED_ON(x86_shared, arm, arm64, mips32, mips64, loong64, wasm32); // Only the NotEqual and Equal conditions are allowed. inline void cmp64Set(Condition cond, Address lhs, Imm64 rhs, Register dest) PER_ARCH; template inline void cmpPtrSet(Condition cond, T1 lhs, T2 rhs, Register dest) PER_ARCH; // =============================================================== // Branch functions inline void branch8(Condition cond, const Address& lhs, Imm32 rhs, Label* label) PER_SHARED_ARCH; // Compares the byte in |lhs| against |rhs| using a 8-bit comparison on // x86/x64 or a 32-bit comparison (all other platforms). The caller should // ensure |rhs| is a zero- resp. sign-extended byte value for cross-platform // compatible code. inline void branch8(Condition cond, const BaseIndex& lhs, Register rhs, Label* label) PER_SHARED_ARCH; inline void branch16(Condition cond, const Address& lhs, Imm32 rhs, Label* label) PER_SHARED_ARCH; template inline void branch32(Condition cond, Register lhs, Register rhs, L label) PER_SHARED_ARCH; template inline void branch32(Condition cond, Register lhs, Imm32 rhs, L label) PER_SHARED_ARCH; inline void branch32(Condition cond, Register lhs, const Address& rhs, Label* label) DEFINED_ON(arm64); inline void branch32(Condition cond, const Address& lhs, Register rhs, Label* label) PER_SHARED_ARCH; inline void branch32(Condition cond, const Address& lhs, Imm32 rhs, Label* label) PER_SHARED_ARCH; inline void branch32(Condition cond, const AbsoluteAddress& lhs, Register rhs, Label* label) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void branch32(Condition cond, const AbsoluteAddress& lhs, Imm32 rhs, Label* label) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void branch32(Condition cond, const BaseIndex& lhs, Register rhs, Label* label) DEFINED_ON(arm, x86_shared); inline void branch32(Condition cond, const BaseIndex& lhs, Imm32 rhs, Label* label) PER_SHARED_ARCH; inline void branch32(Condition cond, const Operand& lhs, Register rhs, Label* label) DEFINED_ON(x86_shared); inline void branch32(Condition cond, const Operand& lhs, Imm32 rhs, Label* label) DEFINED_ON(x86_shared); inline void branch32(Condition cond, wasm::SymbolicAddress lhs, Imm32 rhs, Label* label) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); // The supported condition are Equal, NotEqual, LessThan(orEqual), // GreaterThan(orEqual), Below(orEqual) and Above(orEqual). When a fail label // is not defined it will fall through to next instruction, else jump to the // fail label. inline void branch64(Condition cond, Register64 lhs, Imm64 val, Label* success, Label* fail = nullptr) PER_ARCH; inline void branch64(Condition cond, Register64 lhs, Register64 rhs, Label* success, Label* fail = nullptr) PER_ARCH; // Only the NotEqual and Equal conditions are allowed for the branch64 // variants with Address as lhs. inline void branch64(Condition cond, const Address& lhs, Imm64 val, Label* label) PER_ARCH; inline void branch64(Condition cond, const Address& lhs, Register64 rhs, Label* label) PER_ARCH; // Compare the value at |lhs| with the value at |rhs|. The scratch // register *must not* be the base of |lhs| or |rhs|. inline void branch64(Condition cond, const Address& lhs, const Address& rhs, Register scratch, Label* label) PER_ARCH; template inline void branchPtr(Condition cond, Register lhs, Register rhs, L label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, Register lhs, Imm32 rhs, Label* label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, Register lhs, ImmPtr rhs, Label* label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, Register lhs, ImmGCPtr rhs, Label* label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, Register lhs, ImmWord rhs, Label* label) PER_SHARED_ARCH; template inline void branchPtr(Condition cond, const Address& lhs, Register rhs, L label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, const Address& lhs, ImmPtr rhs, Label* label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, const Address& lhs, ImmGCPtr rhs, Label* label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, const Address& lhs, ImmWord rhs, Label* label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, const BaseIndex& lhs, ImmWord rhs, Label* label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, const BaseIndex& lhs, Register rhs, Label* label) PER_SHARED_ARCH; inline void branchPtr(Condition cond, const AbsoluteAddress& lhs, Register rhs, Label* label) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void branchPtr(Condition cond, const AbsoluteAddress& lhs, ImmWord rhs, Label* label) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void branchPtr(Condition cond, wasm::SymbolicAddress lhs, Register rhs, Label* label) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); // Given a pointer to a GC Cell, retrieve the StoreBuffer pointer from its // chunk header, or nullptr if it is in the tenured heap. void loadStoreBuffer(Register ptr, Register buffer) PER_ARCH; void branchPtrInNurseryChunk(Condition cond, Register ptr, Register temp, Label* label) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); void branchPtrInNurseryChunk(Condition cond, const Address& address, Register temp, Label* label) DEFINED_ON(x86); void branchValueIsNurseryCell(Condition cond, const Address& address, Register temp, Label* label) PER_ARCH; void branchValueIsNurseryCell(Condition cond, ValueOperand value, Register temp, Label* label) PER_ARCH; // This function compares a Value (lhs) which is having a private pointer // boxed inside a js::Value, with a raw pointer (rhs). inline void branchPrivatePtr(Condition cond, const Address& lhs, Register rhs, Label* label) PER_ARCH; inline void branchFloat(DoubleCondition cond, FloatRegister lhs, FloatRegister rhs, Label* label) PER_SHARED_ARCH; // Truncate a double/float32 to int32 and when it doesn't fit an int32 it will // jump to the failure label. This particular variant is allowed to return the // value module 2**32, which isn't implemented on all architectures. E.g. the // x64 variants will do this only in the int64_t range. inline void branchTruncateFloat32MaybeModUint32(FloatRegister src, Register dest, Label* fail) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void branchTruncateDoubleMaybeModUint32(FloatRegister src, Register dest, Label* fail) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); // Truncate a double/float32 to intptr and when it doesn't fit jump to the // failure label. inline void branchTruncateFloat32ToPtr(FloatRegister src, Register dest, Label* fail) DEFINED_ON(x86, x64); inline void branchTruncateDoubleToPtr(FloatRegister src, Register dest, Label* fail) DEFINED_ON(x86, x64); // Truncate a double/float32 to int32 and when it doesn't fit jump to the // failure label. inline void branchTruncateFloat32ToInt32(FloatRegister src, Register dest, Label* fail) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void branchTruncateDoubleToInt32(FloatRegister src, Register dest, Label* fail) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void branchDouble(DoubleCondition cond, FloatRegister lhs, FloatRegister rhs, Label* label) PER_SHARED_ARCH; inline void branchDoubleNotInInt64Range(Address src, Register temp, Label* fail); inline void branchDoubleNotInUInt64Range(Address src, Register temp, Label* fail); inline void branchFloat32NotInInt64Range(Address src, Register temp, Label* fail); inline void branchFloat32NotInUInt64Range(Address src, Register temp, Label* fail); template inline void branchAdd32(Condition cond, T src, Register dest, Label* label) PER_SHARED_ARCH; template inline void branchSub32(Condition cond, T src, Register dest, Label* label) PER_SHARED_ARCH; template inline void branchMul32(Condition cond, T src, Register dest, Label* label) PER_SHARED_ARCH; template inline void branchRshift32(Condition cond, T src, Register dest, Label* label) PER_SHARED_ARCH; inline void branchNeg32(Condition cond, Register reg, Label* label) PER_SHARED_ARCH; inline void branchAdd64(Condition cond, Imm64 imm, Register64 dest, Label* label) DEFINED_ON(x86, arm, wasm32); template inline void branchAddPtr(Condition cond, T src, Register dest, Label* label) PER_SHARED_ARCH; template inline void branchSubPtr(Condition cond, T src, Register dest, Label* label) PER_SHARED_ARCH; inline void branchMulPtr(Condition cond, Register src, Register dest, Label* label) PER_SHARED_ARCH; inline void decBranchPtr(Condition cond, Register lhs, Imm32 rhs, Label* label) PER_SHARED_ARCH; template inline void branchTest32(Condition cond, Register lhs, Register rhs, L label) PER_SHARED_ARCH; template inline void branchTest32(Condition cond, Register lhs, Imm32 rhs, L label) PER_SHARED_ARCH; inline void branchTest32(Condition cond, const Address& lhs, Imm32 rhh, Label* label) PER_SHARED_ARCH; inline void branchTest32(Condition cond, const AbsoluteAddress& lhs, Imm32 rhs, Label* label) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); template inline void branchTestPtr(Condition cond, Register lhs, Register rhs, L label) PER_SHARED_ARCH; inline void branchTestPtr(Condition cond, Register lhs, Imm32 rhs, Label* label) PER_SHARED_ARCH; inline void branchTestPtr(Condition cond, const Address& lhs, Imm32 rhs, Label* label) PER_SHARED_ARCH; template inline void branchTest64(Condition cond, Register64 lhs, Register64 rhs, Register temp, L label) PER_ARCH; // Branches to |label| if |reg| is false. |reg| should be a C++ bool. template inline void branchIfFalseBool(Register reg, L label); // Branches to |label| if |reg| is true. |reg| should be a C++ bool. inline void branchIfTrueBool(Register reg, Label* label); inline void branchIfRope(Register str, Label* label); inline void branchIfNotRope(Register str, Label* label); inline void branchLatin1String(Register string, Label* label); inline void branchTwoByteString(Register string, Label* label); inline void branchIfBigIntIsNegative(Register bigInt, Label* label); inline void branchIfBigIntIsNonNegative(Register bigInt, Label* label); inline void branchIfBigIntIsZero(Register bigInt, Label* label); inline void branchIfBigIntIsNonZero(Register bigInt, Label* label); inline void branchTestFunctionFlags(Register fun, uint32_t flags, Condition cond, Label* label); inline void branchIfNotFunctionIsNonBuiltinCtor(Register fun, Register scratch, Label* label); inline void branchIfFunctionHasNoJitEntry(Register fun, bool isConstructing, Label* label); inline void branchIfFunctionHasJitEntry(Register fun, bool isConstructing, Label* label); inline void branchIfScriptHasJitScript(Register script, Label* label); inline void branchIfScriptHasNoJitScript(Register script, Label* label); inline void loadJitScript(Register script, Register dest); // Loads the function's argument count. inline void loadFunctionArgCount(Register func, Register output); // Loads the function length. This handles interpreted, native, and bound // functions. The caller is responsible for checking that INTERPRETED_LAZY and // RESOLVED_LENGTH flags are not set. void loadFunctionLength(Register func, Register funFlagsAndArgCount, Register output, Label* slowPath); // Loads the function name. This handles interpreted, native, and bound // functions. void loadFunctionName(Register func, Register output, ImmGCPtr emptyString, Label* slowPath); void assertFunctionIsExtended(Register func); inline void branchFunctionKind(Condition cond, FunctionFlags::FunctionKind kind, Register fun, Register scratch, Label* label); inline void branchIfObjectEmulatesUndefined(Register objReg, Register scratch, Label* slowCheck, Label* label); // For all methods below: spectreRegToZero is a register that will be zeroed // on speculatively executed code paths (when the branch should be taken but // branch prediction speculates it isn't). Usually this will be the object // register but the caller may pass a different register. inline void branchTestObjClass(Condition cond, Register obj, const JSClass* clasp, Register scratch, Register spectreRegToZero, Label* label); inline void branchTestObjClassNoSpectreMitigations(Condition cond, Register obj, const JSClass* clasp, Register scratch, Label* label); inline void branchTestObjClass(Condition cond, Register obj, const Address& clasp, Register scratch, Register spectreRegToZero, Label* label); inline void branchTestObjClassNoSpectreMitigations(Condition cond, Register obj, const Address& clasp, Register scratch, Label* label); inline void branchTestObjClass(Condition cond, Register obj, Register clasp, Register scratch, Register spectreRegToZero, Label* label); inline void branchTestObjShape(Condition cond, Register obj, const Shape* shape, Register scratch, Register spectreRegToZero, Label* label); inline void branchTestObjShapeNoSpectreMitigations(Condition cond, Register obj, const Shape* shape, Label* label); void branchTestObjShapeList(Condition cond, Register obj, Register shapeElements, Register shapeScratch, Register endScratch, Register spectreScratch, Label* label); inline void branchTestClassIsFunction(Condition cond, Register clasp, Label* label); inline void branchTestObjIsFunction(Condition cond, Register obj, Register scratch, Register spectreRegToZero, Label* label); inline void branchTestObjIsFunctionNoSpectreMitigations(Condition cond, Register obj, Register scratch, Label* label); inline void branchTestObjShape(Condition cond, Register obj, Register shape, Register scratch, Register spectreRegToZero, Label* label); inline void branchTestObjShapeNoSpectreMitigations(Condition cond, Register obj, Register shape, Label* label); // TODO: audit/fix callers to be Spectre safe. inline void branchTestObjShapeUnsafe(Condition cond, Register obj, Register shape, Label* label); void branchTestObjCompartment(Condition cond, Register obj, const Address& compartment, Register scratch, Label* label); void branchTestObjCompartment(Condition cond, Register obj, const JS::Compartment* compartment, Register scratch, Label* label); void branchIfNonNativeObj(Register obj, Register scratch, Label* label); void branchIfObjectNotExtensible(Register obj, Register scratch, Label* label); inline void branchTestClassIsProxy(bool proxy, Register clasp, Label* label); inline void branchTestObjectIsProxy(bool proxy, Register object, Register scratch, Label* label); inline void branchTestProxyHandlerFamily(Condition cond, Register proxy, Register scratch, const void* handlerp, Label* label); inline void branchTestNeedsIncrementalBarrier(Condition cond, Label* label); inline void branchTestNeedsIncrementalBarrierAnyZone(Condition cond, Label* label, Register scratch); // Perform a type-test on a tag of a Value (32bits boxing), or the tagged // value (64bits boxing). inline void branchTestUndefined(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestInt32(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestDouble(Condition cond, Register tag, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestNumber(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestBoolean(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestString(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestSymbol(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestBigInt(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestNull(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestObject(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestPrimitive(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; inline void branchTestMagic(Condition cond, Register tag, Label* label) PER_SHARED_ARCH; void branchTestType(Condition cond, Register tag, JSValueType type, Label* label); // Perform a type-test on a Value, addressed by Address or BaseIndex, or // loaded into ValueOperand. // BaseIndex and ValueOperand variants clobber the ScratchReg on x64. // All Variants clobber the ScratchReg on arm64. inline void branchTestUndefined(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestUndefined(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestUndefined(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestInt32(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestInt32(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestInt32(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestDouble(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestDouble(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestDouble(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestNumber(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestBoolean(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestBoolean(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestBoolean(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestString(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestString(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestString(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestSymbol(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestSymbol(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestSymbol(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestBigInt(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestBigInt(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestBigInt(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestNull(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestNull(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestNull(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); // Clobbers the ScratchReg on x64. inline void branchTestObject(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestObject(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestObject(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestGCThing(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestGCThing(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; inline void branchTestGCThing(Condition cond, const ValueOperand& value, Label* label) PER_SHARED_ARCH; inline void branchTestPrimitive(Condition cond, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestMagic(Condition cond, const Address& address, Label* label) PER_SHARED_ARCH; inline void branchTestMagic(Condition cond, const BaseIndex& address, Label* label) PER_SHARED_ARCH; template inline void branchTestMagic(Condition cond, const ValueOperand& value, L label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestMagic(Condition cond, const Address& valaddr, JSWhyMagic why, Label* label) PER_ARCH; inline void branchTestMagicValue(Condition cond, const ValueOperand& val, JSWhyMagic why, Label* label); void branchTestValue(Condition cond, const ValueOperand& lhs, const Value& rhs, Label* label) PER_ARCH; inline void branchTestValue(Condition cond, const BaseIndex& lhs, const ValueOperand& rhs, Label* label) PER_ARCH; // Checks if given Value is evaluated to true or false in a condition. // The type of the value should match the type of the method. inline void branchTestInt32Truthy(bool truthy, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, x86_shared, wasm32); inline void branchTestDoubleTruthy(bool truthy, FloatRegister reg, Label* label) PER_SHARED_ARCH; inline void branchTestBooleanTruthy(bool truthy, const ValueOperand& value, Label* label) PER_ARCH; inline void branchTestStringTruthy(bool truthy, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); inline void branchTestBigIntTruthy(bool truthy, const ValueOperand& value, Label* label) DEFINED_ON(arm, arm64, mips32, mips64, loong64, wasm32, x86_shared); // Create an unconditional branch to the address given as argument. inline void branchToComputedAddress(const BaseIndex& address) PER_ARCH; private: template inline void branchPtrImpl(Condition cond, const T& lhs, const S& rhs, L label) DEFINED_ON(x86_shared); void branchPtrInNurseryChunkImpl(Condition cond, Register ptr, Label* label) DEFINED_ON(x86); template void branchValueIsNurseryCellImpl(Condition cond, const T& value, Register temp, Label* label) DEFINED_ON(arm64, x64, mips64, loong64); template inline void branchTestUndefinedImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestInt32Impl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestDoubleImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestNumberImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestBooleanImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestStringImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestSymbolImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestBigIntImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestNullImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestObjectImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestGCThingImpl(Condition cond, const T& t, Label* label) PER_SHARED_ARCH; template inline void branchTestPrimitiveImpl(Condition cond, const T& t, Label* label) DEFINED_ON(arm, arm64, x86_shared); template inline void branchTestMagicImpl(Condition cond, const T& t, L label) DEFINED_ON(arm, arm64, x86_shared); public: template inline void testNumberSet(Condition cond, const T& src, Register dest) PER_SHARED_ARCH; template inline void testBooleanSet(Condition cond, const T& src, Register dest) PER_SHARED_ARCH; template inline void testStringSet(Condition cond, const T& src, Register dest) PER_SHARED_ARCH; template inline void testSymbolSet(Condition cond, const T& src, Register dest) PER_SHARED_ARCH; template inline void testBigIntSet(Condition cond, const T& src, Register dest) PER_SHARED_ARCH; public: // The fallibleUnbox* methods below combine a Value type check with an unbox. // Especially on 64-bit platforms this can be implemented more efficiently // than a separate branch + unbox. // // |src| and |dest| can be the same register, but |dest| may hold garbage on // failure. inline void fallibleUnboxPtr(const ValueOperand& src, Register dest, JSValueType type, Label* fail) PER_ARCH; inline void fallibleUnboxPtr(const Address& src, Register dest, JSValueType type, Label* fail) PER_ARCH; inline void fallibleUnboxPtr(const BaseIndex& src, Register dest, JSValueType type, Label* fail) PER_ARCH; template inline void fallibleUnboxInt32(const T& src, Register dest, Label* fail); template inline void fallibleUnboxBoolean(const T& src, Register dest, Label* fail); template inline void fallibleUnboxObject(const T& src, Register dest, Label* fail); template inline void fallibleUnboxString(const T& src, Register dest, Label* fail); template inline void fallibleUnboxSymbol(const T& src, Register dest, Label* fail); template inline void fallibleUnboxBigInt(const T& src, Register dest, Label* fail); inline void cmp32Move32(Condition cond, Register lhs, Register rhs, Register src, Register dest) DEFINED_ON(arm, arm64, loong64, wasm32, mips_shared, x86_shared); inline void cmp32Move32(Condition cond, Register lhs, const Address& rhs, Register src, Register dest) DEFINED_ON(arm, arm64, loong64, wasm32, mips_shared, x86_shared); inline void cmpPtrMovePtr(Condition cond, Register lhs, Register rhs, Register src, Register dest) PER_ARCH; inline void cmpPtrMovePtr(Condition cond, Register lhs, const Address& rhs, Register src, Register dest) PER_ARCH; inline void cmp32Load32(Condition cond, Register lhs, const Address& rhs, const Address& src, Register dest) DEFINED_ON(arm, arm64, loong64, mips_shared, x86_shared); inline void cmp32Load32(Condition cond, Register lhs, Register rhs, const Address& src, Register dest) DEFINED_ON(arm, arm64, loong64, mips_shared, x86_shared); inline void cmp32LoadPtr(Condition cond, const Address& lhs, Imm32 rhs, const Address& src, Register dest) DEFINED_ON(arm, arm64, loong64, wasm32, mips_shared, x86, x64); inline void cmp32MovePtr(Condition cond, Register lhs, Imm32 rhs, Register src, Register dest) DEFINED_ON(arm, arm64, loong64, wasm32, mips_shared, x86, x64); inline void test32LoadPtr(Condition cond, const Address& addr, Imm32 mask, const Address& src, Register dest) DEFINED_ON(arm, arm64, loong64, wasm32, mips_shared, x86, x64); inline void test32MovePtr(Condition cond, const Address& addr, Imm32 mask, Register src, Register dest) DEFINED_ON(arm, arm64, loong64, wasm32, mips_shared, x86, x64); // Conditional move for Spectre mitigations. inline void spectreMovePtr(Condition cond, Register src, Register dest) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); // Zeroes dest if the condition is true. inline void spectreZeroRegister(Condition cond, Register scratch, Register dest) DEFINED_ON(arm, arm64, mips_shared, x86_shared, loong64, wasm32); // Performs a bounds check and zeroes the index register if out-of-bounds // (to mitigate Spectre). private: inline void spectreBoundsCheck32(Register index, const Operand& length, Register maybeScratch, Label* failure) DEFINED_ON(x86); public: inline void spectreBoundsCheck32(Register index, Register length, Register maybeScratch, Label* failure) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void spectreBoundsCheck32(Register index, const Address& length, Register maybeScratch, Label* failure) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void spectreBoundsCheckPtr(Register index, Register length, Register maybeScratch, Label* failure) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); inline void spectreBoundsCheckPtr(Register index, const Address& length, Register maybeScratch, Label* failure) DEFINED_ON(arm, arm64, mips_shared, x86, x64, loong64, wasm32); // ======================================================================== // Canonicalization primitives. inline void canonicalizeDouble(FloatRegister reg); inline void canonicalizeDoubleIfDeterministic(FloatRegister reg); inline void canonicalizeFloat(FloatRegister reg); inline void canonicalizeFloatIfDeterministic(FloatRegister reg); public: // ======================================================================== // Memory access primitives. inline void storeUncanonicalizedDouble(FloatRegister src, const Address& dest) DEFINED_ON(x86_shared, arm, arm64, mips32, mips64, loong64, wasm32); inline void storeUncanonicalizedDouble(FloatRegister src, const BaseIndex& dest) DEFINED_ON(x86_shared, arm, arm64, mips32, mips64, loong64, wasm32); inline void storeUncanonicalizedDouble(FloatRegister src, const Operand& dest) DEFINED_ON(x86_shared); template inline void storeDouble(FloatRegister src, const T& dest); template inline void boxDouble(FloatRegister src, const T& dest); using MacroAssemblerSpecific::boxDouble; inline void storeUncanonicalizedFloat32(FloatRegister src, const Address& dest) DEFINED_ON(x86_shared, arm, arm64, mips32, mips64, loong64, wasm32); inline void storeUncanonicalizedFloat32(FloatRegister src, const BaseIndex& dest) DEFINED_ON(x86_shared, arm, arm64, mips32, mips64, loong64, wasm32); inline void storeUncanonicalizedFloat32(FloatRegister src, const Operand& dest) DEFINED_ON(x86_shared); template inline void storeFloat32(FloatRegister src, const T& dest); template void storeUnboxedValue(const ConstantOrRegister& value, MIRType valueType, const T& dest) PER_ARCH; inline void memoryBarrier(MemoryBarrierBits barrier) PER_SHARED_ARCH; public: // ======================================================================== // Wasm SIMD // // Naming is "operationSimd128" when operate on the whole vector, otherwise // it's "operationx". // // For microarchitectural reasons we can in principle get a performance win by // using int or float specific instructions in the operationSimd128 case when // we know that subsequent operations on the result are int or float oriented. // In practice, we don't care about that yet. // // The order of operations here follows those in the SIMD overview document, // https://github.com/WebAssembly/simd/blob/master/proposals/simd/SIMD.md. // // Since we must target Intel SSE indefinitely and SSE is one-address or // two-address, the x86 porting interfaces are nearly all one-address or // two-address. Likewise there are two-address ARM64 interfaces to support // the baseline compiler. But there are also three-address ARM64 interfaces // as the ARM64 Ion back-end can use those. In the future, they may support // AVX2 or similar for x86. // // Conventions for argument order and naming and semantics: // - Condition codes come first. // - Other immediates (masks, shift counts) come next. // - Operands come next: // - For a binary two-address operator where the left-hand-side has the // same type as the result, one register parameter is normally named // `lhsDest` and is both the left-hand side and destination; the other // parameter is named `rhs` and is the right-hand side. `rhs` comes // first, `lhsDest` second. `rhs` and `lhsDest` may be the same register // (if rhs is a register). // - For a binary three-address operator the order is `lhs`, `rhs`, `dest`, // and generally these registers may be the same. // - For a unary operator, the input is named `src` and the output is named // `dest`. `src` comes first, `dest` second. `src` and `dest` may be // the same register (if `src` is a register). // - Temp registers follow operands and are named `temp` if there's only one, // otherwise `temp1`, `temp2`, etc regardless of type. GPR temps precede // FPU temps. If there are several temps then they must be distinct // registers, and they must be distinct from the operand registers unless // noted. // Moves inline void moveSimd128(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Constants inline void loadConstantSimd128(const SimdConstant& v, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Splat inline void splatX16(Register src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void splatX16(uint32_t srcLane, FloatRegister src, FloatRegister dest) DEFINED_ON(arm64); inline void splatX8(Register src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void splatX8(uint32_t srcLane, FloatRegister src, FloatRegister dest) DEFINED_ON(arm64); inline void splatX4(Register src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void splatX4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void splatX2(Register64 src, FloatRegister dest) DEFINED_ON(x86, x64, arm64); inline void splatX2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Extract lane as scalar. Float extraction does not canonicalize the value. inline void extractLaneInt8x16(uint32_t lane, FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtractLaneInt8x16(uint32_t lane, FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); inline void extractLaneInt16x8(uint32_t lane, FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtractLaneInt16x8(uint32_t lane, FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); inline void extractLaneInt32x4(uint32_t lane, FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); inline void extractLaneInt64x2(uint32_t lane, FloatRegister src, Register64 dest) DEFINED_ON(x86, x64, arm64); inline void extractLaneFloat32x4(uint32_t lane, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void extractLaneFloat64x2(uint32_t lane, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Replace lane value inline void replaceLaneInt8x16(unsigned lane, FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void replaceLaneInt8x16(unsigned lane, Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void replaceLaneInt16x8(unsigned lane, FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void replaceLaneInt16x8(unsigned lane, Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void replaceLaneInt32x4(unsigned lane, FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void replaceLaneInt32x4(unsigned lane, Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void replaceLaneInt64x2(unsigned lane, FloatRegister lhs, Register64 rhs, FloatRegister dest) DEFINED_ON(x86, x64); inline void replaceLaneInt64x2(unsigned lane, Register64 rhs, FloatRegister lhsDest) DEFINED_ON(x86, x64, arm64); inline void replaceLaneFloat32x4(unsigned lane, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void replaceLaneFloat32x4(unsigned lane, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void replaceLaneFloat64x2(unsigned lane, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void replaceLaneFloat64x2(unsigned lane, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); // Shuffle - blend and permute with immediate indices, and its many // specializations. Lane values other than those mentioned are illegal. // lane values 0..31 inline void shuffleInt8x16(const uint8_t lanes[16], FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void shuffleInt8x16(const uint8_t lanes[16], FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Lane values must be 0 (select from lhs) or FF (select from rhs). // The behavior is undefined for lane values that are neither 0 nor FF. // on x86_shared: it is required that lhs == dest. inline void blendInt8x16(const uint8_t lanes[16], FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp) DEFINED_ON(x86_shared); // Lane values must be 0 (select from lhs) or FF (select from rhs). // The behavior is undefined for lane values that are neither 0 nor FF. inline void blendInt8x16(const uint8_t lanes[16], FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(arm64); // Lane values must be 0 (select from lhs) or FFFF (select from rhs). // The behavior is undefined for lane values that are neither 0 nor FFFF. // on x86_shared: it is required that lhs == dest. inline void blendInt16x8(const uint16_t lanes[8], FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Mask lane values must be ~0 or 0. The former selects from lhs and the // latter from rhs. // The implementation works effectively for I8x16, I16x8, I32x4, and I64x2. inline void laneSelectSimd128(FloatRegister mask, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void interleaveHighInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void interleaveHighInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void interleaveHighInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void interleaveHighInt64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void interleaveLowInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void interleaveLowInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void interleaveLowInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void interleaveLowInt64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Permute - permute with immediate indices. // lane values 0..15 inline void permuteInt8x16(const uint8_t lanes[16], FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // lane values 0..7 inline void permuteInt16x8(const uint16_t lanes[8], FloatRegister src, FloatRegister dest) DEFINED_ON(arm64); // lane values 0..3 [sic]. inline void permuteHighInt16x8(const uint16_t lanes[4], FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared); // lane values 0..3. inline void permuteLowInt16x8(const uint16_t lanes[4], FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared); // lane values 0..3 inline void permuteInt32x4(const uint32_t lanes[4], FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Funnel shift by immediate count: // low_16_bytes_of((lhs ++ rhs) >> shift*8), shift must be < 16 inline void concatAndRightShiftSimd128(FloatRegister lhs, FloatRegister rhs, FloatRegister dest, uint32_t shift) DEFINED_ON(x86_shared, arm64); // Rotate right by immediate count: // low_16_bytes_of((src ++ src) >> shift*8), shift must be < 16 inline void rotateRightSimd128(FloatRegister src, FloatRegister dest, uint32_t shift) DEFINED_ON(arm64); // Shift bytes with immediate count, shifting in zeroes. Shift count 0..15. inline void leftShiftSimd128(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void rightShiftSimd128(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Reverse bytes in lanes. inline void reverseInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void reverseInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void reverseInt64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Swizzle - permute with variable indices. `rhs` holds the lanes parameter. inline void swizzleInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void swizzleInt8x16Relaxed(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Integer Add inline void addInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void addInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void addInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void addInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void addInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void addInt32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void addInt64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void addInt64x2(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // Integer Subtract inline void subInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void subInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void subInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void subInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void subInt32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void subInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void subInt64x2(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void subInt64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Integer Multiply inline void mulInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void mulInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void mulInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void mulInt32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // On x86_shared, it is required lhs == dest inline void mulInt64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp) DEFINED_ON(x86_shared); inline void mulInt64x2(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest, FloatRegister temp) DEFINED_ON(x86_shared); inline void mulInt64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp1, FloatRegister temp2) DEFINED_ON(arm64); // Note for the extMul opcodes, the NxM designation is for the input lanes; // the output lanes are twice as wide. inline void extMulLowInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void extMulHighInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtMulLowInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtMulHighInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void extMulLowInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void extMulHighInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtMulLowInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtMulHighInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void extMulLowInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void extMulHighInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtMulLowInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtMulHighInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void q15MulrSatInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Integer Negate inline void negInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void negInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void negInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void negInt64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Saturating integer add inline void addSatInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void addSatInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedAddSatInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedAddSatInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void addSatInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void addSatInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedAddSatInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedAddSatInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // Saturating integer subtract inline void subSatInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void subSatInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedSubSatInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedSubSatInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void subSatInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void subSatInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedSubSatInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedSubSatInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // Lane-wise integer minimum inline void minInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void minInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedMinInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedMinInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void minInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void minInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedMinInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedMinInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void minInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void minInt32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedMinInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedMinInt32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // Lane-wise integer maximum inline void maxInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void maxInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedMaxInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedMaxInt8x16(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void maxInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void maxInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedMaxInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedMaxInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void maxInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void maxInt32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedMaxInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedMaxInt32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // Lane-wise integer rounding average inline void unsignedAverageInt8x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedAverageInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Lane-wise integer absolute value inline void absInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void absInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void absInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void absInt64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Left shift by scalar. Immediates and variable shifts must have been // masked; shifts of zero will work but may or may not generate code. inline void leftShiftInt8x16(Register rhs, FloatRegister lhsDest, FloatRegister temp) DEFINED_ON(x86_shared); inline void leftShiftInt8x16(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void leftShiftInt8x16(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void leftShiftInt16x8(Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared); inline void leftShiftInt16x8(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void leftShiftInt16x8(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void leftShiftInt32x4(Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared); inline void leftShiftInt32x4(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void leftShiftInt32x4(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void leftShiftInt64x2(Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared); inline void leftShiftInt64x2(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void leftShiftInt64x2(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Right shift by scalar. Immediates and variable shifts must have been // masked; shifts of zero will work but may or may not generate code. inline void rightShiftInt8x16(Register rhs, FloatRegister lhsDest, FloatRegister temp) DEFINED_ON(x86_shared); inline void rightShiftInt8x16(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void rightShiftInt8x16(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedRightShiftInt8x16(Register rhs, FloatRegister lhsDest, FloatRegister temp) DEFINED_ON(x86_shared); inline void unsignedRightShiftInt8x16(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void unsignedRightShiftInt8x16(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void rightShiftInt16x8(Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared); inline void rightShiftInt16x8(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void rightShiftInt16x8(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedRightShiftInt16x8(Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared); inline void unsignedRightShiftInt16x8(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void unsignedRightShiftInt16x8(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void rightShiftInt32x4(Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared); inline void rightShiftInt32x4(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void rightShiftInt32x4(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedRightShiftInt32x4(Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared); inline void unsignedRightShiftInt32x4(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void unsignedRightShiftInt32x4(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void rightShiftInt64x2(Register rhs, FloatRegister lhsDest, FloatRegister temp) DEFINED_ON(x86_shared); inline void rightShiftInt64x2(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void rightShiftInt64x2(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void unsignedRightShiftInt64x2(Register rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared); inline void unsignedRightShiftInt64x2(FloatRegister lhs, Register rhs, FloatRegister dest) DEFINED_ON(arm64); inline void unsignedRightShiftInt64x2(Imm32 count, FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Sign replication operation inline void signReplicationInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared); inline void signReplicationInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared); inline void signReplicationInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared); inline void signReplicationInt64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared); // Bitwise and, or, xor, not inline void bitwiseAndSimd128(FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void bitwiseAndSimd128(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void bitwiseAndSimd128(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void bitwiseOrSimd128(FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void bitwiseOrSimd128(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void bitwiseOrSimd128(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void bitwiseXorSimd128(FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void bitwiseXorSimd128(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void bitwiseXorSimd128(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void bitwiseNotSimd128(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Bitwise AND with compliment: dest = lhs & ~rhs, note only arm64 can do it. inline void bitwiseAndNotSimd128(FloatRegister lhs, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(arm64); // Bitwise AND with complement: dest = ~lhs & rhs, note this is not what Wasm // wants but what the x86 hardware offers. Hence the name. inline void bitwiseNotAndSimd128(FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void bitwiseNotAndSimd128(FloatRegister lhs, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared); // Bitwise select inline void bitwiseSelectSimd128(FloatRegister mask, FloatRegister onTrue, FloatRegister onFalse, FloatRegister dest, FloatRegister temp) DEFINED_ON(x86_shared); inline void bitwiseSelectSimd128(FloatRegister onTrue, FloatRegister onFalse, FloatRegister maskDest) DEFINED_ON(arm64); // Population count inline void popcntInt8x16(FloatRegister src, FloatRegister dest, FloatRegister temp) DEFINED_ON(x86_shared); inline void popcntInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(arm64); // Any lane true, ie, any bit set inline void anyTrueSimd128(FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); // All lanes true inline void allTrueInt8x16(FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); inline void allTrueInt16x8(FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); inline void allTrueInt32x4(FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); inline void allTrueInt64x2(FloatRegister src, Register dest) DEFINED_ON(x86_shared, arm64); // Bitmask, ie extract and compress high bits of all lanes inline void bitmaskInt8x16(FloatRegister src, Register dest) DEFINED_ON(x86_shared); inline void bitmaskInt8x16(FloatRegister src, Register dest, FloatRegister temp) DEFINED_ON(arm64); inline void bitmaskInt16x8(FloatRegister src, Register dest) DEFINED_ON(x86_shared); inline void bitmaskInt16x8(FloatRegister src, Register dest, FloatRegister temp) DEFINED_ON(arm64); inline void bitmaskInt32x4(FloatRegister src, Register dest) DEFINED_ON(x86_shared); inline void bitmaskInt32x4(FloatRegister src, Register dest, FloatRegister temp) DEFINED_ON(arm64); inline void bitmaskInt64x2(FloatRegister src, Register dest) DEFINED_ON(x86_shared); inline void bitmaskInt64x2(FloatRegister src, Register dest, FloatRegister temp) DEFINED_ON(arm64); // Comparisons (integer and floating-point) inline void compareInt8x16(Assembler::Condition cond, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); // On x86_shared, limited to !=, ==, <=, > inline void compareInt8x16(Assembler::Condition cond, FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // On arm64, use any integer comparison condition. inline void compareInt8x16(Assembler::Condition cond, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void compareInt16x8(Assembler::Condition cond, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void compareInt16x8(Assembler::Condition cond, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // On x86_shared, limited to !=, ==, <=, > inline void compareInt16x8(Assembler::Condition cond, FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // On x86_shared, limited to !=, ==, <=, > inline void compareInt32x4(Assembler::Condition cond, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); inline void compareInt32x4(Assembler::Condition cond, FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // On arm64, use any integer comparison condition. inline void compareInt32x4(Assembler::Condition cond, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void compareForEqualityInt64x2(Assembler::Condition cond, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void compareForOrderingInt64x2(Assembler::Condition cond, FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp1, FloatRegister temp2) DEFINED_ON(x86_shared); inline void compareInt64x2(Assembler::Condition cond, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(arm64); inline void compareInt64x2(Assembler::Condition cond, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(arm64); inline void compareFloat32x4(Assembler::Condition cond, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); // On x86_shared, limited to ==, !=, <, <= inline void compareFloat32x4(Assembler::Condition cond, FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // On x86_shared, limited to ==, !=, <, <= // On arm64, use any float-point comparison condition. inline void compareFloat32x4(Assembler::Condition cond, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void compareFloat64x2(Assembler::Condition cond, FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(x86_shared, arm64); // On x86_shared, limited to ==, !=, <, <= inline void compareFloat64x2(Assembler::Condition cond, FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // On x86_shared, limited to ==, !=, <, <= // On arm64, use any float-point comparison condition. inline void compareFloat64x2(Assembler::Condition cond, FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Load inline void loadUnalignedSimd128(const Operand& src, FloatRegister dest) DEFINED_ON(x86_shared); inline void loadUnalignedSimd128(const Address& src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void loadUnalignedSimd128(const BaseIndex& src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Store inline void storeUnalignedSimd128(FloatRegister src, const Address& dest) DEFINED_ON(x86_shared, arm64); inline void storeUnalignedSimd128(FloatRegister src, const BaseIndex& dest) DEFINED_ON(x86_shared, arm64); // Floating point negation inline void negFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void negFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Floating point absolute value inline void absFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void absFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // NaN-propagating minimum inline void minFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp1, FloatRegister temp2) DEFINED_ON(x86_shared); inline void minFloat32x4(FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(arm64); inline void minFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(arm64); inline void minFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp1, FloatRegister temp2) DEFINED_ON(x86_shared); inline void minFloat64x2(FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(arm64); inline void minFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(arm64); // NaN-propagating maximum inline void maxFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp1, FloatRegister temp2) DEFINED_ON(x86_shared); inline void maxFloat32x4(FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(arm64); inline void maxFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(arm64); inline void maxFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp1, FloatRegister temp2) DEFINED_ON(x86_shared); inline void maxFloat64x2(FloatRegister rhs, FloatRegister lhsDest) DEFINED_ON(arm64); inline void maxFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(arm64); // Floating add inline void addFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void addFloat32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void addFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void addFloat64x2(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // Floating subtract inline void subFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void subFloat32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void subFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void subFloat64x2(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // Floating division inline void divFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void divFloat32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void divFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void divFloat64x2(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // Floating Multiply inline void mulFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void mulFloat32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void mulFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void mulFloat64x2(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); // Pairwise add inline void extAddPairwiseInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtAddPairwiseInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void extAddPairwiseInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedExtAddPairwiseInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Floating square root inline void sqrtFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void sqrtFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Integer to floating point with rounding inline void convertInt32x4ToFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedConvertInt32x4ToFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void convertInt32x4ToFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedConvertInt32x4ToFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Floating point to integer with saturation inline void truncSatFloat32x4ToInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedTruncSatFloat32x4ToInt32x4(FloatRegister src, FloatRegister dest, FloatRegister temp) DEFINED_ON(x86_shared); inline void unsignedTruncSatFloat32x4ToInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(arm64); inline void truncSatFloat64x2ToInt32x4(FloatRegister src, FloatRegister dest, FloatRegister temp) DEFINED_ON(x86_shared, arm64); inline void unsignedTruncSatFloat64x2ToInt32x4(FloatRegister src, FloatRegister dest, FloatRegister temp) DEFINED_ON(x86_shared, arm64); inline void truncSatFloat32x4ToInt32x4Relaxed(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedTruncSatFloat32x4ToInt32x4Relaxed(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void truncSatFloat64x2ToInt32x4Relaxed(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedTruncSatFloat64x2ToInt32x4Relaxed(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Floating point narrowing inline void convertFloat64x2ToFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Floating point widening inline void convertFloat32x4ToFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Integer to integer narrowing inline void narrowInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void narrowInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedNarrowInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedNarrowInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void narrowInt32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void narrowInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedNarrowInt32x4(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void unsignedNarrowInt32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Integer to integer widening inline void widenLowInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void widenHighInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedWidenLowInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedWidenHighInt8x16(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void widenLowInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void widenHighInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedWidenLowInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedWidenHighInt16x8(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void widenLowInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedWidenLowInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void widenHighInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void unsignedWidenHighInt32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Compare-based minimum/maximum // // On x86, the signature is (rhsDest, lhs); on arm64 it is (rhs, lhsDest). // // The masm preprocessor can't deal with multiple declarations with identical // signatures even if they are on different platforms, hence the weird // argument names. inline void pseudoMinFloat32x4(FloatRegister rhsOrRhsDest, FloatRegister lhsOrLhsDest) DEFINED_ON(x86_shared, arm64); inline void pseudoMinFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void pseudoMinFloat64x2(FloatRegister rhsOrRhsDest, FloatRegister lhsOrLhsDest) DEFINED_ON(x86_shared, arm64); inline void pseudoMinFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void pseudoMaxFloat32x4(FloatRegister rhsOrRhsDest, FloatRegister lhsOrLhsDest) DEFINED_ON(x86_shared, arm64); inline void pseudoMaxFloat32x4(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void pseudoMaxFloat64x2(FloatRegister rhsOrRhsDest, FloatRegister lhsOrLhsDest) DEFINED_ON(x86_shared, arm64); inline void pseudoMaxFloat64x2(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Widening/pairwise integer dot product inline void widenDotInt16x8(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void widenDotInt16x8(FloatRegister lhs, const SimdConstant& rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void dotInt8x16Int7x16(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void dotInt8x16Int7x16ThenAdd(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared); inline void dotInt8x16Int7x16ThenAdd(FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp) DEFINED_ON(arm64); inline void dotBFloat16x8ThenAdd(FloatRegister lhs, FloatRegister rhs, FloatRegister dest, FloatRegister temp) DEFINED_ON(x86_shared, arm64); // Floating point rounding inline void ceilFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void ceilFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void floorFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void floorFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void truncFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void truncFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void nearestFloat32x4(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void nearestFloat64x2(FloatRegister src, FloatRegister dest) DEFINED_ON(x86_shared, arm64); // Floating multiply-accumulate: srcDest [+-]= src1 * src2 inline void fmaFloat32x4(FloatRegister src1, FloatRegister src2, FloatRegister srcDest) DEFINED_ON(x86_shared, arm64); inline void fnmaFloat32x4(FloatRegister src1, FloatRegister src2, FloatRegister srcDest) DEFINED_ON(x86_shared, arm64); inline void fmaFloat64x2(FloatRegister src1, FloatRegister src2, FloatRegister srcDest) DEFINED_ON(x86_shared, arm64); inline void fnmaFloat64x2(FloatRegister src1, FloatRegister src2, FloatRegister srcDest) DEFINED_ON(x86_shared, arm64); inline void minFloat32x4Relaxed(FloatRegister src, FloatRegister srcDest) DEFINED_ON(x86_shared, arm64); inline void minFloat32x4Relaxed(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void maxFloat32x4Relaxed(FloatRegister src, FloatRegister srcDest) DEFINED_ON(x86_shared, arm64); inline void maxFloat32x4Relaxed(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void minFloat64x2Relaxed(FloatRegister src, FloatRegister srcDest) DEFINED_ON(x86_shared, arm64); inline void minFloat64x2Relaxed(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void maxFloat64x2Relaxed(FloatRegister src, FloatRegister srcDest) DEFINED_ON(x86_shared, arm64); inline void maxFloat64x2Relaxed(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); inline void q15MulrInt16x8Relaxed(FloatRegister lhs, FloatRegister rhs, FloatRegister dest) DEFINED_ON(x86_shared, arm64); public: // ======================================================================== // Truncate floating point. // Undefined behaviour when truncation is outside Int64 range. // Needs a temp register if SSE3 is not present. inline void truncateFloat32ToInt64(Address src, Address dest, Register temp) DEFINED_ON(x86_shared); inline void truncateFloat32ToUInt64(Address src, Address dest, Register temp, FloatRegister floatTemp) DEFINED_ON(x86, x64); inline void truncateDoubleToInt64(Address src, Address dest, Register temp) DEFINED_ON(x86_shared); inline void truncateDoubleToUInt64(Address src, Address dest, Register temp, FloatRegister floatTemp) DEFINED_ON(x86, x64); public: // ======================================================================== // Convert floating point. // temp required on x86 and x64; must be undefined on mips64 and loong64. void convertUInt64ToFloat32(Register64 src, FloatRegister dest, Register temp) DEFINED_ON(arm64, mips64, loong64, wasm32, x64, x86); void convertInt64ToFloat32(Register64 src, FloatRegister dest) DEFINED_ON(arm64, mips64, loong64, wasm32, x64, x86); bool convertUInt64ToDoubleNeedsTemp() PER_ARCH; // temp required when convertUInt64ToDoubleNeedsTemp() returns true. void convertUInt64ToDouble(Register64 src, FloatRegister dest, Register temp) PER_ARCH; void convertInt64ToDouble(Register64 src, FloatRegister dest) PER_ARCH; void convertIntPtrToDouble(Register src, FloatRegister dest) PER_ARCH; public: // ======================================================================== // wasm support CodeOffset wasmTrapInstruction() PER_SHARED_ARCH; void wasmTrap(wasm::Trap trap, wasm::BytecodeOffset bytecodeOffset); // Load all pinned regs via InstanceReg. If the trapOffset is something, // give the first load a trap descriptor with type IndirectCallToNull, so that // a null instance will cause a trap. void loadWasmPinnedRegsFromInstance( mozilla::Maybe trapOffset = mozilla::Nothing()); // Returns a pair: the offset of the undefined (trapping) instruction, and // the number of extra bytes of stack allocated prior to the trap // instruction proper. std::pair wasmReserveStackChecked( uint32_t amount, wasm::BytecodeOffset trapOffset); // Emit a bounds check against the wasm heap limit, jumping to 'ok' if 'cond' // holds; this can be the label either of the access or of the trap. The // label should name a code position greater than the position of the bounds // check. // // If JitOptions.spectreMaskIndex is true, a no-op speculation barrier is // emitted in the code stream after the check to prevent an OOB access from // being executed speculatively. (On current tier-1 platforms the barrier is // a conditional saturation of 'index' to 'boundsCheckLimit', using the same // condition as the check.) If the condition is such that the bounds check // branches out of line to the trap, the barrier will actually be executed // when the bounds check passes. // // On 32-bit systems for both wasm and asm.js, and on 64-bit systems for // asm.js, heap lengths are limited to 2GB. On 64-bit systems for wasm, // 32-bit heap lengths are limited to 4GB, and 64-bit heap lengths will be // limited to something much larger. void wasmBoundsCheck32(Condition cond, Register index, Register boundsCheckLimit, Label* ok) DEFINED_ON(arm, arm64, mips32, mips64, x86_shared, loong64, wasm32); void wasmBoundsCheck32(Condition cond, Register index, Address boundsCheckLimit, Label* ok) DEFINED_ON(arm, arm64, mips32, mips64, x86_shared, loong64, wasm32); void wasmBoundsCheck64(Condition cond, Register64 index, Register64 boundsCheckLimit, Label* ok) DEFINED_ON(arm64, mips64, x64, x86, arm, loong64, wasm32); void wasmBoundsCheck64(Condition cond, Register64 index, Address boundsCheckLimit, Label* ok) DEFINED_ON(arm64, mips64, x64, x86, arm, loong64, wasm32); // Each wasm load/store instruction appends its own wasm::Trap::OutOfBounds. void wasmLoad(const wasm::MemoryAccessDesc& access, Operand srcAddr, AnyRegister out) DEFINED_ON(x86, x64); void wasmLoadI64(const wasm::MemoryAccessDesc& access, Operand srcAddr, Register64 out) DEFINED_ON(x86, x64); void wasmStore(const wasm::MemoryAccessDesc& access, AnyRegister value, Operand dstAddr) DEFINED_ON(x86, x64); void wasmStoreI64(const wasm::MemoryAccessDesc& access, Register64 value, Operand dstAddr) DEFINED_ON(x86); // For all the ARM/MIPS/LOONG64 wasmLoad and wasmStore functions below, `ptr` // MUST equal `ptrScratch`, and that register will be updated based on // conditions listed below (where it is only mentioned as `ptr`). // `ptr` will be updated if access.offset() != 0 or access.type() == // Scalar::Int64. void wasmLoad(const wasm::MemoryAccessDesc& access, Register memoryBase, Register ptr, Register ptrScratch, AnyRegister output) DEFINED_ON(arm, loong64, mips_shared); void wasmLoadI64(const wasm::MemoryAccessDesc& access, Register memoryBase, Register ptr, Register ptrScratch, Register64 output) DEFINED_ON(arm, mips32, mips64, loong64); void wasmStore(const wasm::MemoryAccessDesc& access, AnyRegister value, Register memoryBase, Register ptr, Register ptrScratch) DEFINED_ON(arm, loong64, mips_shared); void wasmStoreI64(const wasm::MemoryAccessDesc& access, Register64 value, Register memoryBase, Register ptr, Register ptrScratch) DEFINED_ON(arm, mips32, mips64, loong64); // These accept general memoryBase + ptr + offset (in `access`); the offset is // always smaller than the guard region. They will insert an additional add // if the offset is nonzero, and of course that add may require a temporary // register for the offset if the offset is large, and instructions to set it // up. void wasmLoad(const wasm::MemoryAccessDesc& access, Register memoryBase, Register ptr, AnyRegister output) DEFINED_ON(arm64); void wasmLoadI64(const wasm::MemoryAccessDesc& access, Register memoryBase, Register ptr, Register64 output) DEFINED_ON(arm64); void wasmStore(const wasm::MemoryAccessDesc& access, AnyRegister value, Register memoryBase, Register ptr) DEFINED_ON(arm64); void wasmStoreI64(const wasm::MemoryAccessDesc& access, Register64 value, Register memoryBase, Register ptr) DEFINED_ON(arm64); // `ptr` will always be updated. void wasmUnalignedLoad(const wasm::MemoryAccessDesc& access, Register memoryBase, Register ptr, Register ptrScratch, Register output, Register tmp) DEFINED_ON(mips32, mips64); // MIPS: `ptr` will always be updated. void wasmUnalignedLoadFP(const wasm::MemoryAccessDesc& access, Register memoryBase, Register ptr, Register ptrScratch, FloatRegister output, Register tmp1) DEFINED_ON(mips32, mips64); // `ptr` will always be updated. void wasmUnalignedLoadI64(const wasm::MemoryAccessDesc& access, Register memoryBase, Register ptr, Register ptrScratch, Register64 output, Register tmp) DEFINED_ON(mips32, mips64); // MIPS: `ptr` will always be updated. void wasmUnalignedStore(const wasm::MemoryAccessDesc& access, Register value, Register memoryBase, Register ptr, Register ptrScratch, Register tmp) DEFINED_ON(mips32, mips64); // `ptr` will always be updated. void wasmUnalignedStoreFP(const wasm::MemoryAccessDesc& access, FloatRegister floatValue, Register memoryBase, Register ptr, Register ptrScratch, Register tmp) DEFINED_ON(mips32, mips64); // `ptr` will always be updated. void wasmUnalignedStoreI64(const wasm::MemoryAccessDesc& access, Register64 value, Register memoryBase, Register ptr, Register ptrScratch, Register tmp) DEFINED_ON(mips32, mips64); // wasm specific methods, used in both the wasm baseline compiler and ion. // The truncate-to-int32 methods do not bind the rejoin label; clients must // do so if oolWasmTruncateCheckF64ToI32() can jump to it. void wasmTruncateDoubleToUInt32(FloatRegister input, Register output, bool isSaturating, Label* oolEntry) PER_ARCH; void wasmTruncateDoubleToInt32(FloatRegister input, Register output, bool isSaturating, Label* oolEntry) PER_SHARED_ARCH; void oolWasmTruncateCheckF64ToI32(FloatRegister input, Register output, TruncFlags flags, wasm::BytecodeOffset off, Label* rejoin) DEFINED_ON(arm, arm64, x86_shared, mips_shared, loong64, wasm32); void wasmTruncateFloat32ToUInt32(FloatRegister input, Register output, bool isSaturating, Label* oolEntry) PER_ARCH; void wasmTruncateFloat32ToInt32(FloatRegister input, Register output, bool isSaturating, Label* oolEntry) PER_SHARED_ARCH; void oolWasmTruncateCheckF32ToI32(FloatRegister input, Register output, TruncFlags flags, wasm::BytecodeOffset off, Label* rejoin) DEFINED_ON(arm, arm64, x86_shared, mips_shared, loong64, wasm32); // The truncate-to-int64 methods will always bind the `oolRejoin` label // after the last emitted instruction. void wasmTruncateDoubleToInt64(FloatRegister input, Register64 output, bool isSaturating, Label* oolEntry, Label* oolRejoin, FloatRegister tempDouble) DEFINED_ON(arm64, x86, x64, mips64, loong64, wasm32); void wasmTruncateDoubleToUInt64(FloatRegister input, Register64 output, bool isSaturating, Label* oolEntry, Label* oolRejoin, FloatRegister tempDouble) DEFINED_ON(arm64, x86, x64, mips64, loong64, wasm32); void oolWasmTruncateCheckF64ToI64(FloatRegister input, Register64 output, TruncFlags flags, wasm::BytecodeOffset off, Label* rejoin) DEFINED_ON(arm, arm64, x86_shared, mips_shared, loong64, wasm32); void wasmTruncateFloat32ToInt64(FloatRegister input, Register64 output, bool isSaturating, Label* oolEntry, Label* oolRejoin, FloatRegister tempDouble) DEFINED_ON(arm64, x86, x64, mips64, loong64, wasm32); void wasmTruncateFloat32ToUInt64(FloatRegister input, Register64 output, bool isSaturating, Label* oolEntry, Label* oolRejoin, FloatRegister tempDouble) DEFINED_ON(arm64, x86, x64, mips64, loong64, wasm32); void oolWasmTruncateCheckF32ToI64(FloatRegister input, Register64 output, TruncFlags flags, wasm::BytecodeOffset off, Label* rejoin) DEFINED_ON(arm, arm64, x86_shared, mips_shared, loong64, wasm32); void loadWasmGlobalPtr(uint32_t globalDataOffset, Register dest); // This function takes care of loading the callee's instance and pinned regs // but it is the caller's responsibility to save/restore instance or pinned // regs. CodeOffset wasmCallImport(const wasm::CallSiteDesc& desc, const wasm::CalleeDesc& callee); // WasmTableCallIndexReg must contain the index of the indirect call. This is // for wasm calls only. // // Indirect calls use a dual-path mechanism where a run-time test determines // whether a context switch is needed (slow path) or not (fast path). This // gives rise to two call instructions, both of which need safe points. As // per normal, the call offsets are the code offsets at the end of the call // instructions (the return points). // // `boundsCheckFailedLabel` is non-null iff a bounds check is required. // `nullCheckFailedLabel` is non-null only on platforms that can't fold the // null check into the rest of the call instructions. void wasmCallIndirect(const wasm::CallSiteDesc& desc, const wasm::CalleeDesc& callee, Label* boundsCheckFailedLabel, Label* nullCheckFailedLabel, mozilla::Maybe tableSize, CodeOffset* fastCallOffset, CodeOffset* slowCallOffset); // This function takes care of loading the callee's instance and address from // pinned reg. void wasmCallRef(const wasm::CallSiteDesc& desc, const wasm::CalleeDesc& callee, CodeOffset* fastCallOffset, CodeOffset* slowCallOffset); // WasmTableCallIndexReg must contain the index of the indirect call. // This is for asm.js calls only. CodeOffset asmCallIndirect(const wasm::CallSiteDesc& desc, const wasm::CalleeDesc& callee); // This function takes care of loading the pointer to the current instance // as the implicit first argument. It preserves instance and pinned registers. // (instance & pinned regs are non-volatile registers in the system ABI). CodeOffset wasmCallBuiltinInstanceMethod(const wasm::CallSiteDesc& desc, const ABIArg& instanceArg, wasm::SymbolicAddress builtin, wasm::FailureMode failureMode); // Perform a subtype check that `subTypeDef` is a subtype of `superTypeDef` // branching to label depending on `onSuccess`. This method is a // specialization of the general `wasm::TypeDef::isSubTypeOf` method for the // case where the `superTypeDef` is statically known, which is the case for // all wasm instructions. // // `scratch` is required iff the `subTypeDepth` is >= // wasm::MinSuperTypeVectorLength. `subTypeDef` is clobbered by this method. // `superTypeDef` is preserved. void branchWasmTypeDefIsSubtype(Register subTypeDef, Register superTypeDef, Register scratch, uint32_t subTypeDepth, Label* label, bool onSuccess); // Compute ptr += (indexTemp32 << shift) where shift can be any value < 32. // May destroy indexTemp32. The value of indexTemp32 must be positive, and it // is implementation-defined what happens if bits are lost or the value // becomes negative through the shift. On 64-bit systems, the high 32 bits of // indexTemp32 must be zero, not garbage. void shiftIndex32AndAdd(Register indexTemp32, int shift, Register pointer) PER_SHARED_ARCH; // The System ABI frequently states that the high bits of a 64-bit register // that holds a 32-bit return value are unpredictable, and C++ compilers will // indeed generate code that leaves garbage in the upper bits. // // Adjust the contents of the 64-bit register `r` to conform to our internal // convention, which requires predictable high bits. In practice, this means // that the 32-bit value will be zero-extended or sign-extended to 64 bits as // appropriate for the platform. void widenInt32(Register r) DEFINED_ON(arm64, x64, mips64, loong64); // As enterFakeExitFrame(), but using register conventions appropriate for // wasm stubs. void enterFakeExitFrameForWasm(Register cxreg, Register scratch, ExitFrameType type) PER_SHARED_ARCH; public: // ======================================================================== // Barrier functions. void emitPreBarrierFastPath(JSRuntime* rt, MIRType type, Register temp1, Register temp2, Register temp3, Label* noBarrier); public: // ======================================================================== // Clamping functions. inline void clampIntToUint8(Register reg) PER_SHARED_ARCH; public: // ======================================================================== // Primitive atomic operations. // // If the access is from JS and the eventual destination of the result is a // js::Value, it's probably best to use the JS-specific versions of these, // see further below. // // Temp registers must be defined unless otherwise noted in the per-function // constraints. // 8-bit, 16-bit, and 32-bit wide operations. // // The 8-bit and 16-bit operations zero-extend or sign-extend the result to // 32 bits, according to `type`. On 64-bit systems, the upper 32 bits of the // result will be zero on some platforms (eg, on x64) and will be the sign // extension of the lower bits on other platforms (eg, MIPS). // CompareExchange with memory. Return the value that was in memory, // whether we wrote or not. // // x86-shared: `output` must be eax. // MIPS: `valueTemp`, `offsetTemp` and `maskTemp` must be defined for 8-bit // and 16-bit wide operations. void compareExchange(Scalar::Type type, const Synchronization& sync, const Address& mem, Register expected, Register replacement, Register output) DEFINED_ON(arm, arm64, x86_shared); void compareExchange(Scalar::Type type, const Synchronization& sync, const BaseIndex& mem, Register expected, Register replacement, Register output) DEFINED_ON(arm, arm64, x86_shared); void compareExchange(Scalar::Type type, const Synchronization& sync, const Address& mem, Register expected, Register replacement, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); void compareExchange(Scalar::Type type, const Synchronization& sync, const BaseIndex& mem, Register expected, Register replacement, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); // x86: `expected` and `output` must be edx:eax; `replacement` is ecx:ebx. // x64: `output` must be rax. // ARM: Registers must be distinct; `replacement` and `output` must be // (even,odd) pairs. void compareExchange64(const Synchronization& sync, const Address& mem, Register64 expected, Register64 replacement, Register64 output) DEFINED_ON(arm, arm64, x64, x86, mips64, loong64); void compareExchange64(const Synchronization& sync, const BaseIndex& mem, Register64 expected, Register64 replacement, Register64 output) DEFINED_ON(arm, arm64, x64, x86, mips64, loong64); // Exchange with memory. Return the value initially in memory. // MIPS: `valueTemp`, `offsetTemp` and `maskTemp` must be defined for 8-bit // and 16-bit wide operations. void atomicExchange(Scalar::Type type, const Synchronization& sync, const Address& mem, Register value, Register output) DEFINED_ON(arm, arm64, x86_shared); void atomicExchange(Scalar::Type type, const Synchronization& sync, const BaseIndex& mem, Register value, Register output) DEFINED_ON(arm, arm64, x86_shared); void atomicExchange(Scalar::Type type, const Synchronization& sync, const Address& mem, Register value, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); void atomicExchange(Scalar::Type type, const Synchronization& sync, const BaseIndex& mem, Register value, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); // x86: `value` must be ecx:ebx; `output` must be edx:eax. // ARM: `value` and `output` must be distinct and (even,odd) pairs. // ARM64: `value` and `output` must be distinct. void atomicExchange64(const Synchronization& sync, const Address& mem, Register64 value, Register64 output) DEFINED_ON(arm, arm64, x64, x86, mips64, loong64); void atomicExchange64(const Synchronization& sync, const BaseIndex& mem, Register64 value, Register64 output) DEFINED_ON(arm, arm64, x64, x86, mips64, loong64); // Read-modify-write with memory. Return the value in memory before the // operation. // // x86-shared: // For 8-bit operations, `value` and `output` must have a byte subregister. // For Add and Sub, `temp` must be invalid. // For And, Or, and Xor, `output` must be eax and `temp` must have a byte // subregister. // // ARM: Registers `value` and `output` must differ. // MIPS: `valueTemp`, `offsetTemp` and `maskTemp` must be defined for 8-bit // and 16-bit wide operations; `value` and `output` must differ. void atomicFetchOp(Scalar::Type type, const Synchronization& sync, AtomicOp op, Register value, const Address& mem, Register temp, Register output) DEFINED_ON(arm, arm64, x86_shared); void atomicFetchOp(Scalar::Type type, const Synchronization& sync, AtomicOp op, Imm32 value, const Address& mem, Register temp, Register output) DEFINED_ON(x86_shared); void atomicFetchOp(Scalar::Type type, const Synchronization& sync, AtomicOp op, Register value, const BaseIndex& mem, Register temp, Register output) DEFINED_ON(arm, arm64, x86_shared); void atomicFetchOp(Scalar::Type type, const Synchronization& sync, AtomicOp op, Imm32 value, const BaseIndex& mem, Register temp, Register output) DEFINED_ON(x86_shared); void atomicFetchOp(Scalar::Type type, const Synchronization& sync, AtomicOp op, Register value, const Address& mem, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); void atomicFetchOp(Scalar::Type type, const Synchronization& sync, AtomicOp op, Register value, const BaseIndex& mem, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); // x86: // `temp` must be ecx:ebx; `output` must be edx:eax. // x64: // For Add and Sub, `temp` is ignored. // For And, Or, and Xor, `output` must be rax. // ARM: // `temp` and `output` must be (even,odd) pairs and distinct from `value`. // ARM64: // Registers `value`, `temp`, and `output` must all differ. void atomicFetchOp64(const Synchronization& sync, AtomicOp op, Register64 value, const Address& mem, Register64 temp, Register64 output) DEFINED_ON(arm, arm64, x64, mips64, loong64); void atomicFetchOp64(const Synchronization& sync, AtomicOp op, const Address& value, const Address& mem, Register64 temp, Register64 output) DEFINED_ON(x86); void atomicFetchOp64(const Synchronization& sync, AtomicOp op, Register64 value, const BaseIndex& mem, Register64 temp, Register64 output) DEFINED_ON(arm, arm64, x64, mips64, loong64); void atomicFetchOp64(const Synchronization& sync, AtomicOp op, const Address& value, const BaseIndex& mem, Register64 temp, Register64 output) DEFINED_ON(x86); // x64: // `value` can be any register. // ARM: // `temp` must be an (even,odd) pair and distinct from `value`. // ARM64: // Registers `value` and `temp` must differ. void atomicEffectOp64(const Synchronization& sync, AtomicOp op, Register64 value, const Address& mem) DEFINED_ON(x64); void atomicEffectOp64(const Synchronization& sync, AtomicOp op, Register64 value, const Address& mem, Register64 temp) DEFINED_ON(arm, arm64, mips64, loong64); void atomicEffectOp64(const Synchronization& sync, AtomicOp op, Register64 value, const BaseIndex& mem) DEFINED_ON(x64); void atomicEffectOp64(const Synchronization& sync, AtomicOp op, Register64 value, const BaseIndex& mem, Register64 temp) DEFINED_ON(arm, arm64, mips64, loong64); // 64-bit atomic load. On 64-bit systems, use regular load with // Synchronization::Load, not this method. // // x86: `temp` must be ecx:ebx; `output` must be edx:eax. // ARM: `output` must be (even,odd) pair. void atomicLoad64(const Synchronization& sync, const Address& mem, Register64 temp, Register64 output) DEFINED_ON(x86); void atomicLoad64(const Synchronization& sync, const BaseIndex& mem, Register64 temp, Register64 output) DEFINED_ON(x86); void atomicLoad64(const Synchronization& sync, const Address& mem, Register64 output) DEFINED_ON(arm); void atomicLoad64(const Synchronization& sync, const BaseIndex& mem, Register64 output) DEFINED_ON(arm); // 64-bit atomic store. On 64-bit systems, use regular store with // Synchronization::Store, not this method. // // x86: `value` must be ecx:ebx; `temp` must be edx:eax. // ARM: `value` and `temp` must be (even,odd) pairs. void atomicStore64(const Synchronization& sync, const Address& mem, Register64 value, Register64 temp) DEFINED_ON(x86, arm); void atomicStore64(const Synchronization& sync, const BaseIndex& mem, Register64 value, Register64 temp) DEFINED_ON(x86, arm); // ======================================================================== // Wasm atomic operations. // // Constraints, when omitted, are exactly as for the primitive operations // above. void wasmCompareExchange(const wasm::MemoryAccessDesc& access, const Address& mem, Register expected, Register replacement, Register output) DEFINED_ON(arm, arm64, x86_shared); void wasmCompareExchange(const wasm::MemoryAccessDesc& access, const BaseIndex& mem, Register expected, Register replacement, Register output) DEFINED_ON(arm, arm64, x86_shared); void wasmCompareExchange(const wasm::MemoryAccessDesc& access, const Address& mem, Register expected, Register replacement, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); void wasmCompareExchange(const wasm::MemoryAccessDesc& access, const BaseIndex& mem, Register expected, Register replacement, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); void wasmAtomicExchange(const wasm::MemoryAccessDesc& access, const Address& mem, Register value, Register output) DEFINED_ON(arm, arm64, x86_shared); void wasmAtomicExchange(const wasm::MemoryAccessDesc& access, const BaseIndex& mem, Register value, Register output) DEFINED_ON(arm, arm64, x86_shared); void wasmAtomicExchange(const wasm::MemoryAccessDesc& access, const Address& mem, Register value, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); void wasmAtomicExchange(const wasm::MemoryAccessDesc& access, const BaseIndex& mem, Register value, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); void wasmAtomicFetchOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Register value, const Address& mem, Register temp, Register output) DEFINED_ON(arm, arm64, x86_shared); void wasmAtomicFetchOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Imm32 value, const Address& mem, Register temp, Register output) DEFINED_ON(x86_shared); void wasmAtomicFetchOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Register value, const BaseIndex& mem, Register temp, Register output) DEFINED_ON(arm, arm64, x86_shared); void wasmAtomicFetchOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Imm32 value, const BaseIndex& mem, Register temp, Register output) DEFINED_ON(x86_shared); void wasmAtomicFetchOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Register value, const Address& mem, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); void wasmAtomicFetchOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Register value, const BaseIndex& mem, Register valueTemp, Register offsetTemp, Register maskTemp, Register output) DEFINED_ON(mips_shared, loong64); // Read-modify-write with memory. Return no value. // // MIPS: `valueTemp`, `offsetTemp` and `maskTemp` must be defined for 8-bit // and 16-bit wide operations. void wasmAtomicEffectOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Register value, const Address& mem, Register temp) DEFINED_ON(arm, arm64, x86_shared); void wasmAtomicEffectOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Imm32 value, const Address& mem, Register temp) DEFINED_ON(x86_shared); void wasmAtomicEffectOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Register value, const BaseIndex& mem, Register temp) DEFINED_ON(arm, arm64, x86_shared); void wasmAtomicEffectOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Imm32 value, const BaseIndex& mem, Register temp) DEFINED_ON(x86_shared); void wasmAtomicEffectOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Register value, const Address& mem, Register valueTemp, Register offsetTemp, Register maskTemp) DEFINED_ON(mips_shared, loong64); void wasmAtomicEffectOp(const wasm::MemoryAccessDesc& access, AtomicOp op, Register value, const BaseIndex& mem, Register valueTemp, Register offsetTemp, Register maskTemp) DEFINED_ON(mips_shared, loong64); // 64-bit wide operations. // 64-bit atomic load. On 64-bit systems, use regular wasm load with // Synchronization::Load, not this method. // // x86: `temp` must be ecx:ebx; `output` must be edx:eax. // ARM: `temp` should be invalid; `output` must be (even,odd) pair. // MIPS32: `temp` should be invalid. void wasmAtomicLoad64(const wasm::MemoryAccessDesc& access, const Address& mem, Register64 temp, Register64 output) DEFINED_ON(arm, mips32, x86, wasm32); void wasmAtomicLoad64(const wasm::MemoryAccessDesc& access, const BaseIndex& mem, Register64 temp, Register64 output) DEFINED_ON(arm, mips32, x86, wasm32); // x86: `expected` must be the same as `output`, and must be edx:eax. // x86: `replacement` must be ecx:ebx. // x64: `output` must be rax. // ARM: Registers must be distinct; `replacement` and `output` must be // (even,odd) pairs. // ARM64: The base register in `mem` must not overlap `output`. // MIPS: Registers must be distinct. void wasmCompareExchange64(const wasm::MemoryAccessDesc& access, const Address& mem, Register64 expected, Register64 replacement, Register64 output) PER_ARCH; void wasmCompareExchange64(const wasm::MemoryAccessDesc& access, const BaseIndex& mem, Register64 expected, Register64 replacement, Register64 output) PER_ARCH; // x86: `value` must be ecx:ebx; `output` must be edx:eax. // ARM: Registers must be distinct; `value` and `output` must be (even,odd) // pairs. // MIPS: Registers must be distinct. void wasmAtomicExchange64(const wasm::MemoryAccessDesc& access, const Address& mem, Register64 value, Register64 output) PER_ARCH; void wasmAtomicExchange64(const wasm::MemoryAccessDesc& access, const BaseIndex& mem, Register64 value, Register64 output) PER_ARCH; // x86: `output` must be edx:eax, `temp` must be ecx:ebx. // x64: For And, Or, and Xor `output` must be rax. // ARM: Registers must be distinct; `temp` and `output` must be (even,odd) // pairs. // MIPS: Registers must be distinct. // MIPS32: `temp` should be invalid. void wasmAtomicFetchOp64(const wasm::MemoryAccessDesc& access, AtomicOp op, Register64 value, const Address& mem, Register64 temp, Register64 output) DEFINED_ON(arm, arm64, mips32, mips64, loong64, x64); void wasmAtomicFetchOp64(const wasm::MemoryAccessDesc& access, AtomicOp op, Register64 value, const BaseIndex& mem, Register64 temp, Register64 output) DEFINED_ON(arm, arm64, mips32, mips64, loong64, x64); void wasmAtomicFetchOp64(const wasm::MemoryAccessDesc& access, AtomicOp op, const Address& value, const Address& mem, Register64 temp, Register64 output) DEFINED_ON(x86); void wasmAtomicFetchOp64(const wasm::MemoryAccessDesc& access, AtomicOp op, const Address& value, const BaseIndex& mem, Register64 temp, Register64 output) DEFINED_ON(x86); // Here `value` can be any register. void wasmAtomicEffectOp64(const wasm::MemoryAccessDesc& access, AtomicOp op, Register64 value, const BaseIndex& mem) DEFINED_ON(x64); void wasmAtomicEffectOp64(const wasm::MemoryAccessDesc& access, AtomicOp op, Register64 value, const BaseIndex& mem, Register64 temp) DEFINED_ON(arm64); // ======================================================================== // JS atomic operations. // // Here the arrayType must be a type that is valid for JS. As of 2017 that // is an 8-bit, 16-bit, or 32-bit integer type. // // If arrayType is Scalar::Uint32 then: // // - `output` must be a float register // - if the operation takes one temp register then `temp` must be defined // - if the operation takes two temp registers then `temp2` must be defined. // // Otherwise `output` must be a GPR and `temp`/`temp2` should be InvalidReg. // (`temp1` must always be valid.) // // For additional register constraints, see the primitive 32-bit operations // and/or wasm operations above. void compareExchangeJS(Scalar::Type arrayType, const Synchronization& sync, const Address& mem, Register expected, Register replacement, Register temp, AnyRegister output) DEFINED_ON(arm, arm64, x86_shared); void compareExchangeJS(Scalar::Type arrayType, const Synchronization& sync, const BaseIndex& mem, Register expected, Register replacement, Register temp, AnyRegister output) DEFINED_ON(arm, arm64, x86_shared); void compareExchangeJS(Scalar::Type arrayType, const Synchronization& sync, const Address& mem, Register expected, Register replacement, Register valueTemp, Register offsetTemp, Register maskTemp, Register temp, AnyRegister output) DEFINED_ON(mips_shared, loong64); void compareExchangeJS(Scalar::Type arrayType, const Synchronization& sync, const BaseIndex& mem, Register expected, Register replacement, Register valueTemp, Register offsetTemp, Register maskTemp, Register temp, AnyRegister output) DEFINED_ON(mips_shared, loong64); void atomicExchangeJS(Scalar::Type arrayType, const Synchronization& sync, const Address& mem, Register value, Register temp, AnyRegister output) DEFINED_ON(arm, arm64, x86_shared); void atomicExchangeJS(Scalar::Type arrayType, const Synchronization& sync, const BaseIndex& mem, Register value, Register temp, AnyRegister output) DEFINED_ON(arm, arm64, x86_shared); void atomicExchangeJS(Scalar::Type arrayType, const Synchronization& sync, const Address& mem, Register value, Register valueTemp, Register offsetTemp, Register maskTemp, Register temp, AnyRegister output) DEFINED_ON(mips_shared, loong64); void atomicExchangeJS(Scalar::Type arrayType, const Synchronization& sync, const BaseIndex& mem, Register value, Register valueTemp, Register offsetTemp, Register maskTemp, Register temp, AnyRegister output) DEFINED_ON(mips_shared, loong64); void atomicFetchOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Register value, const Address& mem, Register temp1, Register temp2, AnyRegister output) DEFINED_ON(arm, arm64, x86_shared); void atomicFetchOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Register value, const BaseIndex& mem, Register temp1, Register temp2, AnyRegister output) DEFINED_ON(arm, arm64, x86_shared); void atomicFetchOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Imm32 value, const Address& mem, Register temp1, Register temp2, AnyRegister output) DEFINED_ON(x86_shared); void atomicFetchOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Imm32 value, const BaseIndex& mem, Register temp1, Register temp2, AnyRegister output) DEFINED_ON(x86_shared); void atomicFetchOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Register value, const Address& mem, Register valueTemp, Register offsetTemp, Register maskTemp, Register temp, AnyRegister output) DEFINED_ON(mips_shared, loong64); void atomicFetchOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Register value, const BaseIndex& mem, Register valueTemp, Register offsetTemp, Register maskTemp, Register temp, AnyRegister output) DEFINED_ON(mips_shared, loong64); void atomicEffectOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Register value, const Address& mem, Register temp) DEFINED_ON(arm, arm64, x86_shared); void atomicEffectOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Register value, const BaseIndex& mem, Register temp) DEFINED_ON(arm, arm64, x86_shared); void atomicEffectOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Imm32 value, const Address& mem, Register temp) DEFINED_ON(x86_shared); void atomicEffectOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Imm32 value, const BaseIndex& mem, Register temp) DEFINED_ON(x86_shared); void atomicEffectOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Register value, const Address& mem, Register valueTemp, Register offsetTemp, Register maskTemp) DEFINED_ON(mips_shared, loong64); void atomicEffectOpJS(Scalar::Type arrayType, const Synchronization& sync, AtomicOp op, Register value, const BaseIndex& mem, Register valueTemp, Register offsetTemp, Register maskTemp) DEFINED_ON(mips_shared, loong64); void atomicIsLockFreeJS(Register value, Register output); // ======================================================================== // Spectre Mitigations. // // Spectre attacks are side-channel attacks based on cache pollution or // slow-execution of some instructions. We have multiple spectre mitigations // possible: // // - Stop speculative executions, with memory barriers. Memory barriers // force all branches depending on loads to be resolved, and thus // resolve all miss-speculated paths. // // - Use conditional move instructions. Some CPUs have a branch predictor, // and not a flag predictor. In such cases, using a conditional move // instruction to zero some pointer/index is enough to add a // data-dependency which prevents any futher executions until the load is // resolved. void spectreMaskIndex32(Register index, Register length, Register output); void spectreMaskIndex32(Register index, const Address& length, Register output); void spectreMaskIndexPtr(Register index, Register length, Register output); void spectreMaskIndexPtr(Register index, const Address& length, Register output); // The length must be a power of two. Performs a bounds check and Spectre // index masking. void boundsCheck32PowerOfTwo(Register index, uint32_t length, Label* failure); void speculationBarrier() PER_SHARED_ARCH; //}}} check_macroassembler_decl_style public: // Unsafe here means the caller is responsible for Spectre mitigations if // needed. Prefer branchTestObjClass or one of the other masm helpers! inline void loadObjClassUnsafe(Register obj, Register dest); template inline void storeObjShape(Register shape, Register obj, EmitPreBarrier emitPreBarrier); template inline void storeObjShape(Shape* shape, Register obj, EmitPreBarrier emitPreBarrier); inline void loadObjProto(Register obj, Register dest); inline void loadStringLength(Register str, Register dest); void loadStringChars(Register str, Register dest, CharEncoding encoding); void loadNonInlineStringChars(Register str, Register dest, CharEncoding encoding); void loadNonInlineStringCharsForStore(Register str, Register dest); void storeNonInlineStringChars(Register chars, Register str); void loadInlineStringChars(Register str, Register dest, CharEncoding encoding); void loadInlineStringCharsForStore(Register str, Register dest); private: void loadRopeChild(Register str, Register index, Register output, Label* isLinear); public: void branchIfCanLoadStringChar(Register str, Register index, Register scratch, Label* label); void branchIfNotCanLoadStringChar(Register str, Register index, Register scratch, Label* label); void loadStringChar(Register str, Register index, Register output, Register scratch1, Register scratch2, Label* fail); void loadRopeLeftChild(Register str, Register dest); void loadRopeRightChild(Register str, Register dest); void storeRopeChildren(Register left, Register right, Register str); void loadDependentStringBase(Register str, Register dest); void storeDependentStringBase(Register base, Register str); void loadStringIndexValue(Register str, Register dest, Label* fail); /** * Store the character in |src| to |dest|. */ template void storeChar(const T& src, Address dest, CharEncoding encoding) { if (encoding == CharEncoding::Latin1) { store8(src, dest); } else { store16(src, dest); } } /** * Load the character at |src| into |dest|. */ template void loadChar(const T& src, Register dest, CharEncoding encoding) { if (encoding == CharEncoding::Latin1) { load8ZeroExtend(src, dest); } else { load16ZeroExtend(src, dest); } } /** * Load the character at |chars[index + offset]| into |dest|. The optional * offset argument is not scaled to the character encoding. */ void loadChar(Register chars, Register index, Register dest, CharEncoding encoding, int32_t offset = 0); /** * Add |index| to |chars| so that |chars| now points at |chars[index]|. */ void addToCharPtr(Register chars, Register index, CharEncoding encoding); private: void loadStringFromUnit(Register unit, Register dest, const StaticStrings& staticStrings); void loadLengthTwoString(Register c1, Register c2, Register dest, const StaticStrings& staticStrings); public: /** * Load the string representation of |input| in base |base|. Jumps to |fail| * when the string representation needs to be allocated dynamically. */ void loadInt32ToStringWithBase(Register input, Register base, Register dest, Register scratch1, Register scratch2, const StaticStrings& staticStrings, const LiveRegisterSet& volatileRegs, Label* fail); void loadInt32ToStringWithBase(Register input, int32_t base, Register dest, Register scratch1, Register scratch2, const StaticStrings& staticStrings, Label* fail); /** * Load the BigInt digits from |bigInt| into |digits|. */ void loadBigIntDigits(Register bigInt, Register digits); /** * Load the first [u]int64 value from |bigInt| into |dest|. */ void loadBigInt64(Register bigInt, Register64 dest); /** * Load the first digit from |bigInt| into |dest|. Handles the case when the * BigInt digits length is zero. * * Note: A BigInt digit is a pointer-sized value. */ void loadFirstBigIntDigitOrZero(Register bigInt, Register dest); /** * Load the number stored in |bigInt| into |dest|. Handles the case when the * BigInt digits length is zero. Jumps to |fail| when the number can't be * saved into a single pointer-sized register. */ void loadBigInt(Register bigInt, Register dest, Label* fail); /** * Load the number stored in |bigInt| into |dest|. Doesn't handle the case * when the BigInt digits length is zero. Jumps to |fail| when the number * can't be saved into a single pointer-sized register. */ void loadBigIntNonZero(Register bigInt, Register dest, Label* fail); /** * Load the absolute number stored in |bigInt| into |dest|. Handles the case * when the BigInt digits length is zero. Jumps to |fail| when the number * can't be saved into a single pointer-sized register. */ void loadBigIntAbsolute(Register bigInt, Register dest, Label* fail); /** * In-place modifies the BigInt digit to a signed pointer-sized value. Jumps * to |fail| when the digit exceeds the representable range. */ void bigIntDigitToSignedPtr(Register bigInt, Register digit, Label* fail); /** * Initialize a BigInt from |val|. Clobbers |val|! */ void initializeBigInt64(Scalar::Type type, Register bigInt, Register64 val); /** * Initialize a BigInt from the signed, pointer-sized register |val|. * Clobbers |val|! */ void initializeBigInt(Register bigInt, Register val); /** * Initialize a BigInt from the pointer-sized register |val|. */ void initializeBigIntAbsolute(Register bigInt, Register val); /** * Copy a BigInt. Jumps to |fail| on allocation failure or when the BigInt * digits need to be heap allocated. */ void copyBigIntWithInlineDigits(Register src, Register dest, Register temp, gc::InitialHeap initialHeap, Label* fail); /** * Compare a BigInt and an Int32 value. Falls through to the false case. */ void compareBigIntAndInt32(JSOp op, Register bigInt, Register int32, Register scratch1, Register scratch2, Label* ifTrue, Label* ifFalse); /** * Compare two BigInts for equality. Falls through if both BigInts are equal * to each other. * * - When we jump to |notSameLength|, |temp1| holds the length of the right * operand. * - When we jump to |notSameDigit|, |temp2| points to the current digit of * the left operand and |temp4| holds the current digit of the right * operand. */ void equalBigInts(Register left, Register right, Register temp1, Register temp2, Register temp3, Register temp4, Label* notSameSign, Label* notSameLength, Label* notSameDigit); void loadJSContext(Register dest); void switchToRealm(Register realm); void switchToRealm(const void* realm, Register scratch); void switchToObjectRealm(Register obj, Register scratch); void switchToBaselineFrameRealm(Register scratch); void switchToWasmInstanceRealm(Register scratch1, Register scratch2); void debugAssertContextRealm(const void* realm, Register scratch); void loadJitActivation(Register dest); void guardSpecificAtom(Register str, JSAtom* atom, Register scratch, const LiveRegisterSet& volatileRegs, Label* fail); void guardStringToInt32(Register str, Register output, Register scratch, LiveRegisterSet volatileRegs, Label* fail); template void loadTypedOrValue(const T& src, TypedOrValueRegister dest) { if (dest.hasValue()) { loadValue(src, dest.valueReg()); } else { loadUnboxedValue(src, dest.type(), dest.typedReg()); } } template void storeTypedOrValue(TypedOrValueRegister src, const T& dest) { if (src.hasValue()) { storeValue(src.valueReg(), dest); } else if (IsFloatingPointType(src.type())) { FloatRegister reg = src.typedReg().fpu(); if (src.type() == MIRType::Float32) { ScratchDoubleScope fpscratch(*this); convertFloat32ToDouble(reg, fpscratch); boxDouble(fpscratch, dest); } else { boxDouble(reg, dest); } } else { storeValue(ValueTypeFromMIRType(src.type()), src.typedReg().gpr(), dest); } } template void storeConstantOrRegister(const ConstantOrRegister& src, const T& dest) { if (src.constant()) { storeValue(src.value(), dest); } else { storeTypedOrValue(src.reg(), dest); } } void storeCallPointerResult(Register reg) { if (reg != ReturnReg) { mov(ReturnReg, reg); } } inline void storeCallBoolResult(Register reg); inline void storeCallInt32Result(Register reg); void storeCallFloatResult(FloatRegister reg) { if (reg != ReturnDoubleReg) { moveDouble(ReturnDoubleReg, reg); } } inline void storeCallResultValue(AnyRegister dest, JSValueType type); void storeCallResultValue(ValueOperand dest) { #if defined(JS_NUNBOX32) // reshuffle the return registers used for a call result to store into // dest, using ReturnReg as a scratch register if necessary. This must // only be called after returning from a call, at a point when the // return register is not live. XXX would be better to allow wrappers // to store the return value to different places. if (dest.typeReg() == JSReturnReg_Data) { if (dest.payloadReg() == JSReturnReg_Type) { // swap the two registers. mov(JSReturnReg_Type, ReturnReg); mov(JSReturnReg_Data, JSReturnReg_Type); mov(ReturnReg, JSReturnReg_Data); } else { mov(JSReturnReg_Data, dest.payloadReg()); mov(JSReturnReg_Type, dest.typeReg()); } } else { mov(JSReturnReg_Type, dest.typeReg()); mov(JSReturnReg_Data, dest.payloadReg()); } #elif defined(JS_PUNBOX64) if (dest.valueReg() != JSReturnReg) { mov(JSReturnReg, dest.valueReg()); } #else # error "Bad architecture" #endif } inline void storeCallResultValue(TypedOrValueRegister dest); private: TrampolinePtr preBarrierTrampoline(MIRType type); template void unguardedCallPreBarrier(const T& address, MIRType type) { Label done; if (type == MIRType::Value) { branchTestGCThing(Assembler::NotEqual, address, &done); } else if (type == MIRType::Object || type == MIRType::String) { branchPtr(Assembler::Equal, address, ImmWord(0), &done); } Push(PreBarrierReg); computeEffectiveAddress(address, PreBarrierReg); TrampolinePtr preBarrier = preBarrierTrampoline(type); call(preBarrier); Pop(PreBarrierReg); // On arm64, SP may be < PSP now (that's OK). // eg testcase: tests/auto-regress/bug702915.js bind(&done); } public: template void guardedCallPreBarrier(const T& address, MIRType type) { Label done; branchTestNeedsIncrementalBarrier(Assembler::Zero, &done); unguardedCallPreBarrier(address, type); bind(&done); } // Like guardedCallPreBarrier, but unlike guardedCallPreBarrier this can be // called from runtime-wide trampolines because it loads cx->zone (instead of // baking in the current Zone) if JitContext::realm is nullptr. template void guardedCallPreBarrierAnyZone(const T& address, MIRType type, Register scratch) { Label done; branchTestNeedsIncrementalBarrierAnyZone(Assembler::Zero, &done, scratch); unguardedCallPreBarrier(address, type); bind(&done); } enum class Uint32Mode { FailOnDouble, ForceDouble }; void boxUint32(Register source, ValueOperand dest, Uint32Mode uint32Mode, Label* fail); template void loadFromTypedArray(Scalar::Type arrayType, const T& src, AnyRegister dest, Register temp, Label* fail); template void loadFromTypedArray(Scalar::Type arrayType, const T& src, const ValueOperand& dest, Uint32Mode uint32Mode, Register temp, Label* fail); template void loadFromTypedBigIntArray(Scalar::Type arrayType, const T& src, Register bigInt, Register64 temp); template void storeToTypedIntArray(Scalar::Type arrayType, const S& value, const T& dest) { switch (arrayType) { case Scalar::Int8: case Scalar::Uint8: case Scalar::Uint8Clamped: store8(value, dest); break; case Scalar::Int16: case Scalar::Uint16: store16(value, dest); break; case Scalar::Int32: case Scalar::Uint32: store32(value, dest); break; default: MOZ_CRASH("Invalid typed array type"); } } void storeToTypedFloatArray(Scalar::Type arrayType, FloatRegister value, const BaseIndex& dest); void storeToTypedFloatArray(Scalar::Type arrayType, FloatRegister value, const Address& dest); void storeToTypedBigIntArray(Scalar::Type arrayType, Register64 value, const BaseIndex& dest); void storeToTypedBigIntArray(Scalar::Type arrayType, Register64 value, const Address& dest); void memoryBarrierBefore(const Synchronization& sync); void memoryBarrierAfter(const Synchronization& sync); void debugAssertIsObject(const ValueOperand& val); void debugAssertObjHasFixedSlots(Register obj, Register scratch); void debugAssertObjectHasClass(Register obj, Register scratch, const JSClass* clasp); void branchArrayIsNotPacked(Register array, Register temp1, Register temp2, Label* label); void setIsPackedArray(Register obj, Register output, Register temp); void packedArrayPop(Register array, ValueOperand output, Register temp1, Register temp2, Label* fail); void packedArrayShift(Register array, ValueOperand output, Register temp1, Register temp2, LiveRegisterSet volatileRegs, Label* fail); void loadArgumentsObjectElement(Register obj, Register index, ValueOperand output, Register temp, Label* fail); void loadArgumentsObjectElementHole(Register obj, Register index, ValueOperand output, Register temp, Label* fail); void loadArgumentsObjectElementExists(Register obj, Register index, Register output, Register temp, Label* fail); void loadArgumentsObjectLength(Register obj, Register output, Label* fail); void branchTestArgumentsObjectFlags(Register obj, Register temp, uint32_t flags, Condition cond, Label* label); void typedArrayElementSize(Register obj, Register output); void branchIfClassIsNotTypedArray(Register clasp, Label* notTypedArray); void branchIfHasDetachedArrayBuffer(Register obj, Register temp, Label* label); void branchIfNativeIteratorNotReusable(Register ni, Label* notReusable); void maybeLoadIteratorFromShape(Register obj, Register dest, Register temp, Register temp2, Register temp3, Label* failure); void iteratorMore(Register obj, ValueOperand output, Register temp); void iteratorClose(Register obj, Register temp1, Register temp2, Register temp3); void registerIterator(Register enumeratorsList, Register iter, Register temp); void toHashableNonGCThing(ValueOperand value, ValueOperand result, FloatRegister tempFloat); void toHashableValue(ValueOperand value, ValueOperand result, FloatRegister tempFloat, Label* atomizeString, Label* tagString); private: void scrambleHashCode(Register result); public: void prepareHashNonGCThing(ValueOperand value, Register result, Register temp); void prepareHashString(Register str, Register result, Register temp); void prepareHashSymbol(Register sym, Register result); void prepareHashBigInt(Register bigInt, Register result, Register temp1, Register temp2, Register temp3); void prepareHashObject(Register setObj, ValueOperand value, Register result, Register temp1, Register temp2, Register temp3, Register temp4); void prepareHashValue(Register setObj, ValueOperand value, Register result, Register temp1, Register temp2, Register temp3, Register temp4); private: enum class IsBigInt { No, Yes, Maybe }; /** * Search for a value in a OrderedHashTable. * * When we jump to |found|, |entryTemp| holds the found hashtable entry. */ template void orderedHashTableLookup(Register setOrMapObj, ValueOperand value, Register hash, Register entryTemp, Register temp1, Register temp3, Register temp4, Register temp5, Label* found, IsBigInt isBigInt); void setObjectHas(Register setObj, ValueOperand value, Register hash, Register result, Register temp1, Register temp2, Register temp3, Register temp4, IsBigInt isBigInt); void mapObjectHas(Register mapObj, ValueOperand value, Register hash, Register result, Register temp1, Register temp2, Register temp3, Register temp4, IsBigInt isBigInt); void mapObjectGet(Register mapObj, ValueOperand value, Register hash, ValueOperand result, Register temp1, Register temp2, Register temp3, Register temp4, Register temp5, IsBigInt isBigInt); public: void setObjectHasNonBigInt(Register setObj, ValueOperand value, Register hash, Register result, Register temp1, Register temp2) { return setObjectHas(setObj, value, hash, result, temp1, temp2, InvalidReg, InvalidReg, IsBigInt::No); } void setObjectHasBigInt(Register setObj, ValueOperand value, Register hash, Register result, Register temp1, Register temp2, Register temp3, Register temp4) { return setObjectHas(setObj, value, hash, result, temp1, temp2, temp3, temp4, IsBigInt::Yes); } void setObjectHasValue(Register setObj, ValueOperand value, Register hash, Register result, Register temp1, Register temp2, Register temp3, Register temp4) { return setObjectHas(setObj, value, hash, result, temp1, temp2, temp3, temp4, IsBigInt::Maybe); } void mapObjectHasNonBigInt(Register mapObj, ValueOperand value, Register hash, Register result, Register temp1, Register temp2) { return mapObjectHas(mapObj, value, hash, result, temp1, temp2, InvalidReg, InvalidReg, IsBigInt::No); } void mapObjectHasBigInt(Register mapObj, ValueOperand value, Register hash, Register result, Register temp1, Register temp2, Register temp3, Register temp4) { return mapObjectHas(mapObj, value, hash, result, temp1, temp2, temp3, temp4, IsBigInt::Yes); } void mapObjectHasValue(Register mapObj, ValueOperand value, Register hash, Register result, Register temp1, Register temp2, Register temp3, Register temp4) { return mapObjectHas(mapObj, value, hash, result, temp1, temp2, temp3, temp4, IsBigInt::Maybe); } void mapObjectGetNonBigInt(Register mapObj, ValueOperand value, Register hash, ValueOperand result, Register temp1, Register temp2, Register temp3) { return mapObjectGet(mapObj, value, hash, result, temp1, temp2, temp3, InvalidReg, InvalidReg, IsBigInt::No); } void mapObjectGetBigInt(Register mapObj, ValueOperand value, Register hash, ValueOperand result, Register temp1, Register temp2, Register temp3, Register temp4, Register temp5) { return mapObjectGet(mapObj, value, hash, result, temp1, temp2, temp3, temp4, temp5, IsBigInt::Yes); } void mapObjectGetValue(Register mapObj, ValueOperand value, Register hash, ValueOperand result, Register temp1, Register temp2, Register temp3, Register temp4, Register temp5) { return mapObjectGet(mapObj, value, hash, result, temp1, temp2, temp3, temp4, temp5, IsBigInt::Maybe); } private: template void loadOrderedHashTableCount(Register setOrMapObj, Register result); public: void loadSetObjectSize(Register setObj, Register result); void loadMapObjectSize(Register mapObj, Register result); // Inline version of js_TypedArray_uint8_clamp_double. // This function clobbers the input register. void clampDoubleToUint8(FloatRegister input, Register output) PER_ARCH; using MacroAssemblerSpecific::ensureDouble; template void ensureDouble(const S& source, FloatRegister dest, Label* failure) { Label isDouble, done; branchTestDouble(Assembler::Equal, source, &isDouble); branchTestInt32(Assembler::NotEqual, source, failure); convertInt32ToDouble(source, dest); jump(&done); bind(&isDouble); unboxDouble(source, dest); bind(&done); } // Inline allocation. private: void checkAllocatorState(Label* fail); bool shouldNurseryAllocate(gc::AllocKind allocKind, gc::InitialHeap initialHeap); void nurseryAllocateObject( Register result, Register temp, gc::AllocKind allocKind, size_t nDynamicSlots, Label* fail, const AllocSiteInput& allocSite = AllocSiteInput()); void bumpPointerAllocate(Register result, Register temp, Label* fail, CompileZone* zone, void* posAddr, const void* curEddAddr, JS::TraceKind traceKind, uint32_t size, const AllocSiteInput& allocSite = AllocSiteInput()); void updateAllocSite(Register temp, Register result, CompileZone* zone, Register site); void freeListAllocate(Register result, Register temp, gc::AllocKind allocKind, Label* fail); void allocateObject(Register result, Register temp, gc::AllocKind allocKind, uint32_t nDynamicSlots, gc::InitialHeap initialHeap, Label* fail, const AllocSiteInput& allocSite = AllocSiteInput()); void nurseryAllocateString(Register result, Register temp, gc::AllocKind allocKind, Label* fail); void allocateString(Register result, Register temp, gc::AllocKind allocKind, gc::InitialHeap initialHeap, Label* fail); void nurseryAllocateBigInt(Register result, Register temp, Label* fail); void copySlotsFromTemplate(Register obj, const TemplateNativeObject& templateObj, uint32_t start, uint32_t end); void fillSlotsWithConstantValue(Address addr, Register temp, uint32_t start, uint32_t end, const Value& v); void fillSlotsWithUndefined(Address addr, Register temp, uint32_t start, uint32_t end); void fillSlotsWithUninitialized(Address addr, Register temp, uint32_t start, uint32_t end); void initGCSlots(Register obj, Register temp, const TemplateNativeObject& templateObj); public: void callFreeStub(Register slots); void createGCObject(Register result, Register temp, const TemplateObject& templateObj, gc::InitialHeap initialHeap, Label* fail, bool initContents = true); void createPlainGCObject(Register result, Register shape, Register temp, Register temp2, uint32_t numFixedSlots, uint32_t numDynamicSlots, gc::AllocKind allocKind, gc::InitialHeap initialHeap, Label* fail, const AllocSiteInput& allocSite, bool initContents = true); void createArrayWithFixedElements( Register result, Register shape, Register temp, uint32_t arrayLength, uint32_t arrayCapacity, gc::AllocKind allocKind, gc::InitialHeap initialHeap, Label* fail, const AllocSiteInput& allocSite = AllocSiteInput()); void initGCThing(Register obj, Register temp, const TemplateObject& templateObj, bool initContents = true); enum class TypedArrayLength { Fixed, Dynamic }; void initTypedArraySlots(Register obj, Register temp, Register lengthReg, LiveRegisterSet liveRegs, Label* fail, TypedArrayObject* templateObj, TypedArrayLength lengthKind); void newGCString(Register result, Register temp, gc::InitialHeap initialHeap, Label* fail); void newGCFatInlineString(Register result, Register temp, gc::InitialHeap initialHeap, Label* fail); void newGCBigInt(Register result, Register temp, gc::InitialHeap initialHeap, Label* fail); // Compares two strings for equality based on the JSOP. // This checks for identical pointers, atoms and length and fails for // everything else. void compareStrings(JSOp op, Register left, Register right, Register result, Label* fail); // Result of the typeof operation. Falls back to slow-path for proxies. void typeOfObject(Register objReg, Register scratch, Label* slow, Label* isObject, Label* isCallable, Label* isUndefined); // Implementation of IsCallable. Doesn't handle proxies. void isCallable(Register obj, Register output, Label* isProxy) { isCallableOrConstructor(true, obj, output, isProxy); } void isConstructor(Register obj, Register output, Label* isProxy) { isCallableOrConstructor(false, obj, output, isProxy); } void setIsCrossRealmArrayConstructor(Register obj, Register output); void setIsDefinitelyTypedArrayConstructor(Register obj, Register output); void loadMegamorphicCache(Register dest); void loadStringToAtomCacheLastLookups(Register dest); void loadAtomOrSymbolAndHash(ValueOperand value, Register outId, Register outHash, Label* cacheMiss); void emitExtractValueFromMegamorphicCacheEntry( Register obj, Register entry, Register scratch1, Register scratch2, ValueOperand output, Label* cacheHit, Label* cacheMiss); void emitMegamorphicCacheLookupByValueCommon(ValueOperand id, Register obj, Register scratch1, Register scratch2, Register outEntryPtr, Label* cacheMiss); void emitMegamorphicCacheLookup(PropertyKey id, Register obj, Register scratch1, Register scratch2, Register scratch3, ValueOperand output, Label* cacheHit); void emitMegamorphicCacheLookupByValue(ValueOperand id, Register obj, Register scratch1, Register scratch2, Register scratch3, ValueOperand output, Label* cacheHit); void emitMegamorphicCacheLookupExists(ValueOperand id, Register obj, Register scratch1, Register scratch2, Register scratch3, Register output, Label* cacheHit, bool hasOwn); void loadDOMExpandoValueGuardGeneration( Register obj, ValueOperand output, JS::ExpandoAndGeneration* expandoAndGeneration, uint64_t generation, Label* fail); void guardNonNegativeIntPtrToInt32(Register reg, Label* fail); void loadArrayBufferByteLengthIntPtr(Register obj, Register output); void loadArrayBufferViewByteOffsetIntPtr(Register obj, Register output); void loadArrayBufferViewLengthIntPtr(Register obj, Register output); private: void isCallableOrConstructor(bool isCallable, Register obj, Register output, Label* isProxy); public: // Generates code used to complete a bailout. void generateBailoutTail(Register scratch, Register bailoutInfo); public: #ifndef JS_CODEGEN_ARM64 // StackPointer manipulation functions. // On ARM64, the StackPointer is implemented as two synchronized registers. // Code shared across platforms must use these functions to be valid. template inline void addToStackPtr(T t); template inline void addStackPtrTo(T t); void subFromStackPtr(Imm32 imm32) DEFINED_ON(mips32, mips64, loong64, wasm32, arm, x86, x64); void subFromStackPtr(Register reg); template void subStackPtrFrom(T t) { subPtr(getStackPointer(), t); } template void andToStackPtr(T t) { andPtr(t, getStackPointer()); } template void moveToStackPtr(T t) { movePtr(t, getStackPointer()); } template void moveStackPtrTo(T t) { movePtr(getStackPointer(), t); } template void loadStackPtr(T t) { loadPtr(t, getStackPointer()); } template void storeStackPtr(T t) { storePtr(getStackPointer(), t); } // StackPointer testing functions. // On ARM64, sp can function as the zero register depending on context. // Code shared across platforms must use these functions to be valid. template inline void branchTestStackPtr(Condition cond, T t, Label* label); template inline void branchStackPtr(Condition cond, T rhs, Label* label); template inline void branchStackPtrRhs(Condition cond, T lhs, Label* label); // Move the stack pointer based on the requested amount. inline void reserveStack(uint32_t amount); #else // !JS_CODEGEN_ARM64 void reserveStack(uint32_t amount); #endif public: void enableProfilingInstrumentation() { emitProfilingInstrumentation_ = true; } private: // This class is used to surround call sites throughout the assembler. This // is used by callWithABI, and callJit functions, except if suffixed by // NoProfiler. class MOZ_RAII AutoProfilerCallInstrumentation { public: explicit AutoProfilerCallInstrumentation(MacroAssembler& masm); ~AutoProfilerCallInstrumentation() = default; }; friend class AutoProfilerCallInstrumentation; void appendProfilerCallSite(CodeOffset label) { propagateOOM(profilerCallSites_.append(label)); } // Fix up the code pointers to be written for locations where profilerCallSite // emitted moves of RIP to a register. void linkProfilerCallSites(JitCode* code); // This field is used to manage profiling instrumentation output. If // provided and enabled, then instrumentation will be emitted around call // sites. bool emitProfilingInstrumentation_; // Record locations of the call sites. Vector profilerCallSites_; public: void loadJitCodeRaw(Register func, Register dest); void loadBaselineJitCodeRaw(Register func, Register dest, Label* failure = nullptr); void storeICScriptInJSContext(Register icScript); void loadBaselineFramePtr(Register framePtr, Register dest); void pushBaselineFramePtr(Register framePtr, Register scratch) { loadBaselineFramePtr(framePtr, scratch); push(scratch); } void PushBaselineFramePtr(Register framePtr, Register scratch) { loadBaselineFramePtr(framePtr, scratch); Push(scratch); } using MacroAssemblerSpecific::movePtr; void movePtr(TrampolinePtr ptr, Register dest) { movePtr(ImmPtr(ptr.value), dest); } private: void handleFailure(); public: Label* exceptionLabel() { // Exceptions are currently handled the same way as sequential failures. return &failureLabel_; } Label* failureLabel() { return &failureLabel_; } void finish(); void link(JitCode* code); void assumeUnreachable(const char* output); void printf(const char* output); void printf(const char* output, Register value); #define DISPATCH_FLOATING_POINT_OP(method, type, arg1d, arg1f, arg2) \ MOZ_ASSERT(IsFloatingPointType(type)); \ if (type == MIRType::Double) \ method##Double(arg1d, arg2); \ else \ method##Float32(arg1f, arg2); void loadConstantFloatingPoint(double d, float f, FloatRegister dest, MIRType destType) { DISPATCH_FLOATING_POINT_OP(loadConstant, destType, d, f, dest); } void boolValueToFloatingPoint(ValueOperand value, FloatRegister dest, MIRType destType) { DISPATCH_FLOATING_POINT_OP(boolValueTo, destType, value, value, dest); } void int32ValueToFloatingPoint(ValueOperand value, FloatRegister dest, MIRType destType) { DISPATCH_FLOATING_POINT_OP(int32ValueTo, destType, value, value, dest); } void convertInt32ToFloatingPoint(Register src, FloatRegister dest, MIRType destType) { DISPATCH_FLOATING_POINT_OP(convertInt32To, destType, src, src, dest); } #undef DISPATCH_FLOATING_POINT_OP void convertValueToFloatingPoint(ValueOperand value, FloatRegister output, Label* fail, MIRType outputType); void outOfLineTruncateSlow(FloatRegister src, Register dest, bool widenFloatToDouble, bool compilingWasm, wasm::BytecodeOffset callOffset); void convertInt32ValueToDouble(ValueOperand val); void convertValueToDouble(ValueOperand value, FloatRegister output, Label* fail) { convertValueToFloatingPoint(value, output, fail, MIRType::Double); } void convertValueToFloat(ValueOperand value, FloatRegister output, Label* fail) { convertValueToFloatingPoint(value, output, fail, MIRType::Float32); } // // Functions for converting values to int. // void convertDoubleToInt(FloatRegister src, Register output, FloatRegister temp, Label* truncateFail, Label* fail, IntConversionBehavior behavior); // Strings may be handled by providing labels to jump to when the behavior // is truncation or clamping. The subroutine, usually an OOL call, is // passed the unboxed string in |stringReg| and should convert it to a // double store into |temp|. void convertValueToInt( ValueOperand value, Label* handleStringEntry, Label* handleStringRejoin, Label* truncateDoubleSlow, Register stringReg, FloatRegister temp, Register output, Label* fail, IntConversionBehavior behavior, IntConversionInputKind conversion = IntConversionInputKind::Any); // This carries over the MToNumberInt32 operation on the ValueOperand // input; see comment at the top of this class. void convertValueToInt32( ValueOperand value, FloatRegister temp, Register output, Label* fail, bool negativeZeroCheck, IntConversionInputKind conversion = IntConversionInputKind::Any) { convertValueToInt( value, nullptr, nullptr, nullptr, InvalidReg, temp, output, fail, negativeZeroCheck ? IntConversionBehavior::NegativeZeroCheck : IntConversionBehavior::Normal, conversion); } // This carries over the MTruncateToInt32 operation on the ValueOperand // input; see the comment at the top of this class. void truncateValueToInt32(ValueOperand value, Label* handleStringEntry, Label* handleStringRejoin, Label* truncateDoubleSlow, Register stringReg, FloatRegister temp, Register output, Label* fail) { convertValueToInt(value, handleStringEntry, handleStringRejoin, truncateDoubleSlow, stringReg, temp, output, fail, IntConversionBehavior::Truncate); } void truncateValueToInt32(ValueOperand value, FloatRegister temp, Register output, Label* fail) { truncateValueToInt32(value, nullptr, nullptr, nullptr, InvalidReg, temp, output, fail); } // Truncates, i.e. removes any fractional parts, but doesn't wrap around to // the int32 range. void truncateNoWrapValueToInt32(ValueOperand value, FloatRegister temp, Register output, Label* truncateDoubleSlow, Label* fail) { convertValueToInt(value, nullptr, nullptr, truncateDoubleSlow, InvalidReg, temp, output, fail, IntConversionBehavior::TruncateNoWrap); } // Convenience functions for clamping values to uint8. void clampValueToUint8(ValueOperand value, Label* handleStringEntry, Label* handleStringRejoin, Register stringReg, FloatRegister temp, Register output, Label* fail) { convertValueToInt(value, handleStringEntry, handleStringRejoin, nullptr, stringReg, temp, output, fail, IntConversionBehavior::ClampToUint8); } [[nodiscard]] bool icBuildOOLFakeExitFrame(void* fakeReturnAddr, AutoSaveLiveRegisters& save); // Align the stack pointer based on the number of arguments which are pushed // on the stack, such that the JitFrameLayout would be correctly aligned on // the JitStackAlignment. void alignJitStackBasedOnNArgs(Register nargs, bool countIncludesThis); void alignJitStackBasedOnNArgs(uint32_t argc, bool countIncludesThis); inline void assertStackAlignment(uint32_t alignment, int32_t offset = 0); void touchFrameValues(Register numStackValues, Register scratch1, Register scratch2); #ifdef JS_64BIT // See comment block "64-bit GPRs carrying 32-bit values" above. This asserts // that the high bits of the register are appropriate for the architecture and // the value in the low bits. void debugAssertCanonicalInt32(Register r); #endif }; // StackMacroAssembler checks no GC will happen while it's on the stack. class MOZ_RAII StackMacroAssembler : public MacroAssembler { JS::AutoCheckCannotGC nogc; public: StackMacroAssembler(JSContext* cx, TempAllocator& alloc); }; // WasmMacroAssembler does not contain GC pointers, so it doesn't need the no-GC // checking StackMacroAssembler has. class MOZ_RAII WasmMacroAssembler : public MacroAssembler { public: explicit WasmMacroAssembler(TempAllocator& alloc, bool limitedSize = true); explicit WasmMacroAssembler(TempAllocator& alloc, const wasm::ModuleEnvironment& env, bool limitedSize = true); ~WasmMacroAssembler() { assertNoGCThings(); } }; // Heap-allocated MacroAssembler used for Ion off-thread code generation. // GC cancels off-thread compilations. class IonHeapMacroAssembler : public MacroAssembler { public: IonHeapMacroAssembler(TempAllocator& alloc, CompileRealm* realm); }; //{{{ check_macroassembler_style inline uint32_t MacroAssembler::framePushed() const { return framePushed_; } inline void MacroAssembler::setFramePushed(uint32_t framePushed) { framePushed_ = framePushed; } inline void MacroAssembler::adjustFrame(int32_t value) { MOZ_ASSERT_IF(value < 0, framePushed_ >= uint32_t(-value)); setFramePushed(framePushed_ + value); } inline void MacroAssembler::implicitPop(uint32_t bytes) { MOZ_ASSERT(bytes % sizeof(intptr_t) == 0); MOZ_ASSERT(bytes <= INT32_MAX); adjustFrame(-int32_t(bytes)); } //}}} check_macroassembler_style static inline Assembler::DoubleCondition JSOpToDoubleCondition(JSOp op) { switch (op) { case JSOp::Eq: case JSOp::StrictEq: return Assembler::DoubleEqual; case JSOp::Ne: case JSOp::StrictNe: return Assembler::DoubleNotEqualOrUnordered; case JSOp::Lt: return Assembler::DoubleLessThan; case JSOp::Le: return Assembler::DoubleLessThanOrEqual; case JSOp::Gt: return Assembler::DoubleGreaterThan; case JSOp::Ge: return Assembler::DoubleGreaterThanOrEqual; default: MOZ_CRASH("Unexpected comparison operation"); } } // Note: the op may have been inverted during lowering (to put constants in a // position where they can be immediates), so it is important to use the // lir->jsop() instead of the mir->jsop() when it is present. static inline Assembler::Condition JSOpToCondition(JSOp op, bool isSigned) { if (isSigned) { switch (op) { case JSOp::Eq: case JSOp::StrictEq: return Assembler::Equal; case JSOp::Ne: case JSOp::StrictNe: return Assembler::NotEqual; case JSOp::Lt: return Assembler::LessThan; case JSOp::Le: return Assembler::LessThanOrEqual; case JSOp::Gt: return Assembler::GreaterThan; case JSOp::Ge: return Assembler::GreaterThanOrEqual; default: MOZ_CRASH("Unrecognized comparison operation"); } } else { switch (op) { case JSOp::Eq: case JSOp::StrictEq: return Assembler::Equal; case JSOp::Ne: case JSOp::StrictNe: return Assembler::NotEqual; case JSOp::Lt: return Assembler::Below; case JSOp::Le: return Assembler::BelowOrEqual; case JSOp::Gt: return Assembler::Above; case JSOp::Ge: return Assembler::AboveOrEqual; default: MOZ_CRASH("Unrecognized comparison operation"); } } } static inline size_t StackDecrementForCall(uint32_t alignment, size_t bytesAlreadyPushed, size_t bytesToPush) { return bytesToPush + ComputeByteAlignment(bytesAlreadyPushed + bytesToPush, alignment); } // Helper for generatePreBarrier. inline DynFn JitPreWriteBarrier(MIRType type); } // namespace jit } // namespace js #endif /* jit_MacroAssembler_h */