// Copyright 2013 the V8 project authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #if V8_TARGET_ARCH_ARM64 #include "src/assembler.h" #include "src/base/bits.h" #include "src/base/division-by-constant.h" #include "src/bootstrapper.h" #include "src/callable.h" #include "src/code-factory.h" #include "src/code-stubs.h" #include "src/debug/debug.h" #include "src/external-reference-table.h" #include "src/frame-constants.h" #include "src/frames-inl.h" #include "src/heap/heap-inl.h" #include "src/instruction-stream.h" #include "src/register-configuration.h" #include "src/runtime/runtime.h" #include "src/snapshot/snapshot.h" #include "src/wasm/wasm-code-manager.h" #include "src/arm64/macro-assembler-arm64-inl.h" #include "src/arm64/macro-assembler-arm64.h" // Cannot be the first include namespace v8 { namespace internal { MacroAssembler::MacroAssembler(Isolate* isolate, const AssemblerOptions& options, void* buffer, int size, CodeObjectRequired create_code_object) : TurboAssembler(isolate, options, buffer, size, create_code_object) { if (create_code_object == CodeObjectRequired::kYes) { // Unlike TurboAssembler, which can be used off the main thread and may not // allocate, macro assembler creates its own copy of the self-reference // marker in order to disambiguate between self-references during nested // code generation (e.g.: codegen of the current object triggers stub // compilation through CodeStub::GetCode()). code_object_ = Handle::New( *isolate->factory()->NewSelfReferenceMarker(), isolate); } } CPURegList TurboAssembler::DefaultTmpList() { return CPURegList(ip0, ip1); } CPURegList TurboAssembler::DefaultFPTmpList() { return CPURegList(fp_scratch1, fp_scratch2); } int TurboAssembler::RequiredStackSizeForCallerSaved(SaveFPRegsMode fp_mode, Register exclusion) const { int bytes = 0; auto list = kCallerSaved; DCHECK_EQ(list.Count() % 2, 0); // We only allow one exclusion register, so if the list is of even length // before exclusions, it must still be afterwards, to maintain alignment. // Therefore, we can ignore the exclusion register in the computation. // However, we leave it in the argument list to mirror the prototype for // Push/PopCallerSaved(). USE(exclusion); bytes += list.Count() * kXRegSizeInBits / 8; if (fp_mode == kSaveFPRegs) { DCHECK_EQ(kCallerSavedV.Count() % 2, 0); bytes += kCallerSavedV.Count() * kDRegSizeInBits / 8; } return bytes; } int TurboAssembler::PushCallerSaved(SaveFPRegsMode fp_mode, Register exclusion) { int bytes = 0; auto list = kCallerSaved; DCHECK_EQ(list.Count() % 2, 0); if (!exclusion.Is(no_reg)) { // Replace the excluded register with padding to maintain alignment. list.Remove(exclusion); list.Combine(padreg); } PushCPURegList(list); bytes += list.Count() * kXRegSizeInBits / 8; if (fp_mode == kSaveFPRegs) { DCHECK_EQ(kCallerSavedV.Count() % 2, 0); PushCPURegList(kCallerSavedV); bytes += kCallerSavedV.Count() * kDRegSizeInBits / 8; } return bytes; } int TurboAssembler::PopCallerSaved(SaveFPRegsMode fp_mode, Register exclusion) { int bytes = 0; if (fp_mode == kSaveFPRegs) { DCHECK_EQ(kCallerSavedV.Count() % 2, 0); PopCPURegList(kCallerSavedV); bytes += kCallerSavedV.Count() * kDRegSizeInBits / 8; } auto list = kCallerSaved; DCHECK_EQ(list.Count() % 2, 0); if (!exclusion.Is(no_reg)) { // Replace the excluded register with padding to maintain alignment. list.Remove(exclusion); list.Combine(padreg); } PopCPURegList(list); bytes += list.Count() * kXRegSizeInBits / 8; return bytes; } void TurboAssembler::LogicalMacro(const Register& rd, const Register& rn, const Operand& operand, LogicalOp op) { UseScratchRegisterScope temps(this); if (operand.NeedsRelocation(this)) { Register temp = temps.AcquireX(); Ldr(temp, operand.immediate()); Logical(rd, rn, temp, op); } else if (operand.IsImmediate()) { int64_t immediate = operand.ImmediateValue(); unsigned reg_size = rd.SizeInBits(); // If the operation is NOT, invert the operation and immediate. if ((op & NOT) == NOT) { op = static_cast(op & ~NOT); immediate = ~immediate; } // Ignore the top 32 bits of an immediate if we're moving to a W register. if (rd.Is32Bits()) { // Check that the top 32 bits are consistent. DCHECK(((immediate >> kWRegSizeInBits) == 0) || ((immediate >> kWRegSizeInBits) == -1)); immediate &= kWRegMask; } DCHECK(rd.Is64Bits() || is_uint32(immediate)); // Special cases for all set or all clear immediates. if (immediate == 0) { switch (op) { case AND: Mov(rd, 0); return; case ORR: // Fall through. case EOR: Mov(rd, rn); return; case ANDS: // Fall through. case BICS: break; default: UNREACHABLE(); } } else if ((rd.Is64Bits() && (immediate == -1L)) || (rd.Is32Bits() && (immediate == 0xFFFFFFFFL))) { switch (op) { case AND: Mov(rd, rn); return; case ORR: Mov(rd, immediate); return; case EOR: Mvn(rd, rn); return; case ANDS: // Fall through. case BICS: break; default: UNREACHABLE(); } } unsigned n, imm_s, imm_r; if (IsImmLogical(immediate, reg_size, &n, &imm_s, &imm_r)) { // Immediate can be encoded in the instruction. LogicalImmediate(rd, rn, n, imm_s, imm_r, op); } else { // Immediate can't be encoded: synthesize using move immediate. Register temp = temps.AcquireSameSizeAs(rn); // If the left-hand input is the stack pointer, we can't pre-shift the // immediate, as the encoding won't allow the subsequent post shift. PreShiftImmMode mode = rn.Is(sp) ? kNoShift : kAnyShift; Operand imm_operand = MoveImmediateForShiftedOp(temp, immediate, mode); if (rd.IsSP()) { // If rd is the stack pointer we cannot use it as the destination // register so we use the temp register as an intermediate again. Logical(temp, rn, imm_operand, op); Mov(sp, temp); } else { Logical(rd, rn, imm_operand, op); } } } else if (operand.IsExtendedRegister()) { DCHECK(operand.reg().SizeInBits() <= rd.SizeInBits()); // Add/sub extended supports shift <= 4. We want to support exactly the // same modes here. DCHECK_LE(operand.shift_amount(), 4); DCHECK(operand.reg().Is64Bits() || ((operand.extend() != UXTX) && (operand.extend() != SXTX))); Register temp = temps.AcquireSameSizeAs(rn); EmitExtendShift(temp, operand.reg(), operand.extend(), operand.shift_amount()); Logical(rd, rn, temp, op); } else { // The operand can be encoded in the instruction. DCHECK(operand.IsShiftedRegister()); Logical(rd, rn, operand, op); } } void TurboAssembler::Mov(const Register& rd, uint64_t imm) { DCHECK(allow_macro_instructions()); DCHECK(is_uint32(imm) || is_int32(imm) || rd.Is64Bits()); DCHECK(!rd.IsZero()); // TODO(all) extend to support more immediates. // // Immediates on Aarch64 can be produced using an initial value, and zero to // three move keep operations. // // Initial values can be generated with: // 1. 64-bit move zero (movz). // 2. 32-bit move inverted (movn). // 3. 64-bit move inverted. // 4. 32-bit orr immediate. // 5. 64-bit orr immediate. // Move-keep may then be used to modify each of the 16-bit half-words. // // The code below supports all five initial value generators, and // applying move-keep operations to move-zero and move-inverted initial // values. // Try to move the immediate in one instruction, and if that fails, switch to // using multiple instructions. if (!TryOneInstrMoveImmediate(rd, imm)) { unsigned reg_size = rd.SizeInBits(); // Generic immediate case. Imm will be represented by // [imm3, imm2, imm1, imm0], where each imm is 16 bits. // A move-zero or move-inverted is generated for the first non-zero or // non-0xFFFF immX, and a move-keep for subsequent non-zero immX. uint64_t ignored_halfword = 0; bool invert_move = false; // If the number of 0xFFFF halfwords is greater than the number of 0x0000 // halfwords, it's more efficient to use move-inverted. if (CountClearHalfWords(~imm, reg_size) > CountClearHalfWords(imm, reg_size)) { ignored_halfword = 0xFFFFL; invert_move = true; } // Mov instructions can't move immediate values into the stack pointer, so // set up a temporary register, if needed. UseScratchRegisterScope temps(this); Register temp = rd.IsSP() ? temps.AcquireSameSizeAs(rd) : rd; // Iterate through the halfwords. Use movn/movz for the first non-ignored // halfword, and movk for subsequent halfwords. DCHECK_EQ(reg_size % 16, 0); bool first_mov_done = false; for (int i = 0; i < (rd.SizeInBits() / 16); i++) { uint64_t imm16 = (imm >> (16 * i)) & 0xFFFFL; if (imm16 != ignored_halfword) { if (!first_mov_done) { if (invert_move) { movn(temp, (~imm16) & 0xFFFFL, 16 * i); } else { movz(temp, imm16, 16 * i); } first_mov_done = true; } else { // Construct a wider constant. movk(temp, imm16, 16 * i); } } } DCHECK(first_mov_done); // Move the temporary if the original destination register was the stack // pointer. if (rd.IsSP()) { mov(rd, temp); } } } void TurboAssembler::Mov(const Register& rd, const Operand& operand, DiscardMoveMode discard_mode) { DCHECK(allow_macro_instructions()); DCHECK(!rd.IsZero()); // Provide a swap register for instructions that need to write into the // system stack pointer (and can't do this inherently). UseScratchRegisterScope temps(this); Register dst = (rd.IsSP()) ? temps.AcquireSameSizeAs(rd) : rd; if (operand.NeedsRelocation(this)) { if (FLAG_embedded_builtins) { if (root_array_available_ && options().isolate_independent_code) { if (operand.ImmediateRMode() == RelocInfo::EXTERNAL_REFERENCE) { Address addr = static_cast

(operand.ImmediateValue()); ExternalReference reference = bit_cast(addr); IndirectLoadExternalReference(rd, reference); return; } else if (operand.ImmediateRMode() == RelocInfo::EMBEDDED_OBJECT) { Handle x( reinterpret_cast(operand.ImmediateValue())); IndirectLoadConstant(rd, x); return; } } } Ldr(dst, operand); } else if (operand.IsImmediate()) { // Call the macro assembler for generic immediates. Mov(dst, operand.ImmediateValue()); } else if (operand.IsShiftedRegister() && (operand.shift_amount() != 0)) { // Emit a shift instruction if moving a shifted register. This operation // could also be achieved using an orr instruction (like orn used by Mvn), // but using a shift instruction makes the disassembly clearer. EmitShift(dst, operand.reg(), operand.shift(), operand.shift_amount()); } else if (operand.IsExtendedRegister()) { // Emit an extend instruction if moving an extended register. This handles // extend with post-shift operations, too. EmitExtendShift(dst, operand.reg(), operand.extend(), operand.shift_amount()); } else { // Otherwise, emit a register move only if the registers are distinct, or // if they are not X registers. // // Note that mov(w0, w0) is not a no-op because it clears the top word of // x0. A flag is provided (kDiscardForSameWReg) if a move between the same W // registers is not required to clear the top word of the X register. In // this case, the instruction is discarded. // // If sp is an operand, add #0 is emitted, otherwise, orr #0. if (!rd.Is(operand.reg()) || (rd.Is32Bits() && (discard_mode == kDontDiscardForSameWReg))) { Assembler::mov(rd, operand.reg()); } // This case can handle writes into the system stack pointer directly. dst = rd; } // Copy the result to the system stack pointer. if (!dst.Is(rd)) { DCHECK(rd.IsSP()); Assembler::mov(rd, dst); } } void TurboAssembler::Movi16bitHelper(const VRegister& vd, uint64_t imm) { DCHECK(is_uint16(imm)); int byte1 = (imm & 0xFF); int byte2 = ((imm >> 8) & 0xFF); if (byte1 == byte2) { movi(vd.Is64Bits() ? vd.V8B() : vd.V16B(), byte1); } else if (byte1 == 0) { movi(vd, byte2, LSL, 8); } else if (byte2 == 0) { movi(vd, byte1); } else if (byte1 == 0xFF) { mvni(vd, ~byte2 & 0xFF, LSL, 8); } else if (byte2 == 0xFF) { mvni(vd, ~byte1 & 0xFF); } else { UseScratchRegisterScope temps(this); Register temp = temps.AcquireW(); movz(temp, imm); dup(vd, temp); } } void TurboAssembler::Movi32bitHelper(const VRegister& vd, uint64_t imm) { DCHECK(is_uint32(imm)); uint8_t bytes[sizeof(imm)]; memcpy(bytes, &imm, sizeof(imm)); // All bytes are either 0x00 or 0xFF. { bool all0orff = true; for (int i = 0; i < 4; ++i) { if ((bytes[i] != 0) && (bytes[i] != 0xFF)) { all0orff = false; break; } } if (all0orff == true) { movi(vd.Is64Bits() ? vd.V1D() : vd.V2D(), ((imm << 32) | imm)); return; } } // Of the 4 bytes, only one byte is non-zero. for (int i = 0; i < 4; i++) { if ((imm & (0xFF << (i * 8))) == imm) { movi(vd, bytes[i], LSL, i * 8); return; } } // Of the 4 bytes, only one byte is not 0xFF. for (int i = 0; i < 4; i++) { uint32_t mask = ~(0xFF << (i * 8)); if ((imm & mask) == mask) { mvni(vd, ~bytes[i] & 0xFF, LSL, i * 8); return; } } // Immediate is of the form 0x00MMFFFF. if ((imm & 0xFF00FFFF) == 0x0000FFFF) { movi(vd, bytes[2], MSL, 16); return; } // Immediate is of the form 0x0000MMFF. if ((imm & 0xFFFF00FF) == 0x000000FF) { movi(vd, bytes[1], MSL, 8); return; } // Immediate is of the form 0xFFMM0000. if ((imm & 0xFF00FFFF) == 0xFF000000) { mvni(vd, ~bytes[2] & 0xFF, MSL, 16); return; } // Immediate is of the form 0xFFFFMM00. if ((imm & 0xFFFF00FF) == 0xFFFF0000) { mvni(vd, ~bytes[1] & 0xFF, MSL, 8); return; } // Top and bottom 16-bits are equal. if (((imm >> 16) & 0xFFFF) == (imm & 0xFFFF)) { Movi16bitHelper(vd.Is64Bits() ? vd.V4H() : vd.V8H(), imm & 0xFFFF); return; } // Default case. { UseScratchRegisterScope temps(this); Register temp = temps.AcquireW(); Mov(temp, imm); dup(vd, temp); } } void TurboAssembler::Movi64bitHelper(const VRegister& vd, uint64_t imm) { // All bytes are either 0x00 or 0xFF. { bool all0orff = true; for (int i = 0; i < 8; ++i) { int byteval = (imm >> (i * 8)) & 0xFF; if (byteval != 0 && byteval != 0xFF) { all0orff = false; break; } } if (all0orff == true) { movi(vd, imm); return; } } // Top and bottom 32-bits are equal. if (((imm >> 32) & 0xFFFFFFFF) == (imm & 0xFFFFFFFF)) { Movi32bitHelper(vd.Is64Bits() ? vd.V2S() : vd.V4S(), imm & 0xFFFFFFFF); return; } // Default case. { UseScratchRegisterScope temps(this); Register temp = temps.AcquireX(); Mov(temp, imm); if (vd.Is1D()) { mov(vd.D(), 0, temp); } else { dup(vd.V2D(), temp); } } } void TurboAssembler::Movi(const VRegister& vd, uint64_t imm, Shift shift, int shift_amount) { DCHECK(allow_macro_instructions()); if (shift_amount != 0 || shift != LSL) { movi(vd, imm, shift, shift_amount); } else if (vd.Is8B() || vd.Is16B()) { // 8-bit immediate. DCHECK(is_uint8(imm)); movi(vd, imm); } else if (vd.Is4H() || vd.Is8H()) { // 16-bit immediate. Movi16bitHelper(vd, imm); } else if (vd.Is2S() || vd.Is4S()) { // 32-bit immediate. Movi32bitHelper(vd, imm); } else { // 64-bit immediate. Movi64bitHelper(vd, imm); } } void TurboAssembler::Movi(const VRegister& vd, uint64_t hi, uint64_t lo) { // TODO(all): Move 128-bit values in a more efficient way. DCHECK(vd.Is128Bits()); UseScratchRegisterScope temps(this); Movi(vd.V2D(), lo); Register temp = temps.AcquireX(); Mov(temp, hi); Ins(vd.V2D(), 1, temp); } void TurboAssembler::Mvn(const Register& rd, const Operand& operand) { DCHECK(allow_macro_instructions()); if (operand.NeedsRelocation(this)) { Ldr(rd, operand.immediate()); mvn(rd, rd); } else if (operand.IsImmediate()) { // Call the macro assembler for generic immediates. Mov(rd, ~operand.ImmediateValue()); } else if (operand.IsExtendedRegister()) { // Emit two instructions for the extend case. This differs from Mov, as // the extend and invert can't be achieved in one instruction. EmitExtendShift(rd, operand.reg(), operand.extend(), operand.shift_amount()); mvn(rd, rd); } else { mvn(rd, operand); } } unsigned TurboAssembler::CountClearHalfWords(uint64_t imm, unsigned reg_size) { DCHECK_EQ(reg_size % 8, 0); int count = 0; for (unsigned i = 0; i < (reg_size / 16); i++) { if ((imm & 0xFFFF) == 0) { count++; } imm >>= 16; } return count; } // The movz instruction can generate immediates containing an arbitrary 16-bit // half-word, with remaining bits clear, eg. 0x00001234, 0x0000123400000000. bool TurboAssembler::IsImmMovz(uint64_t imm, unsigned reg_size) { DCHECK((reg_size == kXRegSizeInBits) || (reg_size == kWRegSizeInBits)); return CountClearHalfWords(imm, reg_size) >= ((reg_size / 16) - 1); } // The movn instruction can generate immediates containing an arbitrary 16-bit // half-word, with remaining bits set, eg. 0xFFFF1234, 0xFFFF1234FFFFFFFF. bool TurboAssembler::IsImmMovn(uint64_t imm, unsigned reg_size) { return IsImmMovz(~imm, reg_size); } void TurboAssembler::ConditionalCompareMacro(const Register& rn, const Operand& operand, StatusFlags nzcv, Condition cond, ConditionalCompareOp op) { DCHECK((cond != al) && (cond != nv)); if (operand.NeedsRelocation(this)) { UseScratchRegisterScope temps(this); Register temp = temps.AcquireX(); Ldr(temp, operand.immediate()); ConditionalCompareMacro(rn, temp, nzcv, cond, op); } else if ((operand.IsShiftedRegister() && (operand.shift_amount() == 0)) || (operand.IsImmediate() && IsImmConditionalCompare(operand.ImmediateValue()))) { // The immediate can be encoded in the instruction, or the operand is an // unshifted register: call the assembler. ConditionalCompare(rn, operand, nzcv, cond, op); } else { // The operand isn't directly supported by the instruction: perform the // operation on a temporary register. UseScratchRegisterScope temps(this); Register temp = temps.AcquireSameSizeAs(rn); Mov(temp, operand); ConditionalCompare(rn, temp, nzcv, cond, op); } } void TurboAssembler::Csel(const Register& rd, const Register& rn, const Operand& operand, Condition cond) { DCHECK(allow_macro_instructions()); DCHECK(!rd.IsZero()); DCHECK((cond != al) && (cond != nv)); if (operand.IsImmediate()) { // Immediate argument. Handle special cases of 0, 1 and -1 using zero // register. int64_t imm = operand.ImmediateValue(); Register zr = AppropriateZeroRegFor(rn); if (imm == 0) { csel(rd, rn, zr, cond); } else if (imm == 1) { csinc(rd, rn, zr, cond); } else if (imm == -1) { csinv(rd, rn, zr, cond); } else { UseScratchRegisterScope temps(this); Register temp = temps.AcquireSameSizeAs(rn); Mov(temp, imm); csel(rd, rn, temp, cond); } } else if (operand.IsShiftedRegister() && (operand.shift_amount() == 0)) { // Unshifted register argument. csel(rd, rn, operand.reg(), cond); } else { // All other arguments. UseScratchRegisterScope temps(this); Register temp = temps.AcquireSameSizeAs(rn); Mov(temp, operand); csel(rd, rn, temp, cond); } } bool TurboAssembler::TryOneInstrMoveImmediate(const Register& dst, int64_t imm) { unsigned n, imm_s, imm_r; int reg_size = dst.SizeInBits(); if (IsImmMovz(imm, reg_size) && !dst.IsSP()) { // Immediate can be represented in a move zero instruction. Movz can't write // to the stack pointer. movz(dst, imm); return true; } else if (IsImmMovn(imm, reg_size) && !dst.IsSP()) { // Immediate can be represented in a move not instruction. Movn can't write // to the stack pointer. movn(dst, dst.Is64Bits() ? ~imm : (~imm & kWRegMask)); return true; } else if (IsImmLogical(imm, reg_size, &n, &imm_s, &imm_r)) { // Immediate can be represented in a logical orr instruction. LogicalImmediate(dst, AppropriateZeroRegFor(dst), n, imm_s, imm_r, ORR); return true; } return false; } Operand TurboAssembler::MoveImmediateForShiftedOp(const Register& dst, int64_t imm, PreShiftImmMode mode) { int reg_size = dst.SizeInBits(); // Encode the immediate in a single move instruction, if possible. if (TryOneInstrMoveImmediate(dst, imm)) { // The move was successful; nothing to do here. } else { // Pre-shift the immediate to the least-significant bits of the register. int shift_low = CountTrailingZeros(imm, reg_size); if (mode == kLimitShiftForSP) { // When applied to the stack pointer, the subsequent arithmetic operation // can use the extend form to shift left by a maximum of four bits. Right // shifts are not allowed, so we filter them out later before the new // immediate is tested. shift_low = std::min(shift_low, 4); } int64_t imm_low = imm >> shift_low; // Pre-shift the immediate to the most-significant bits of the register. We // insert set bits in the least-significant bits, as this creates a // different immediate that may be encodable using movn or orr-immediate. // If this new immediate is encodable, the set bits will be eliminated by // the post shift on the following instruction. int shift_high = CountLeadingZeros(imm, reg_size); int64_t imm_high = (imm << shift_high) | ((INT64_C(1) << shift_high) - 1); if ((mode != kNoShift) && TryOneInstrMoveImmediate(dst, imm_low)) { // The new immediate has been moved into the destination's low bits: // return a new leftward-shifting operand. return Operand(dst, LSL, shift_low); } else if ((mode == kAnyShift) && TryOneInstrMoveImmediate(dst, imm_high)) { // The new immediate has been moved into the destination's high bits: // return a new rightward-shifting operand. return Operand(dst, LSR, shift_high); } else { // Use the generic move operation to set up the immediate. Mov(dst, imm); } } return Operand(dst); } void TurboAssembler::AddSubMacro(const Register& rd, const Register& rn, const Operand& operand, FlagsUpdate S, AddSubOp op) { if (operand.IsZero() && rd.Is(rn) && rd.Is64Bits() && rn.Is64Bits() && !operand.NeedsRelocation(this) && (S == LeaveFlags)) { // The instruction would be a nop. Avoid generating useless code. return; } if (operand.NeedsRelocation(this)) { UseScratchRegisterScope temps(this); Register temp = temps.AcquireX(); Ldr(temp, operand.immediate()); AddSubMacro(rd, rn, temp, S, op); } else if ((operand.IsImmediate() && !IsImmAddSub(operand.ImmediateValue())) || (rn.IsZero() && !operand.IsShiftedRegister()) || (operand.IsShiftedRegister() && (operand.shift() == ROR))) { UseScratchRegisterScope temps(this); Register temp = temps.AcquireSameSizeAs(rn); if (operand.IsImmediate()) { PreShiftImmMode mode = kAnyShift; // If the destination or source register is the stack pointer, we can // only pre-shift the immediate right by values supported in the add/sub // extend encoding. if (rd.Is(sp)) { // If the destination is SP and flags will be set, we can't pre-shift // the immediate at all. mode = (S == SetFlags) ? kNoShift : kLimitShiftForSP; } else if (rn.Is(sp)) { mode = kLimitShiftForSP; } Operand imm_operand = MoveImmediateForShiftedOp(temp, operand.ImmediateValue(), mode); AddSub(rd, rn, imm_operand, S, op); } else { Mov(temp, operand); AddSub(rd, rn, temp, S, op); } } else { AddSub(rd, rn, operand, S, op); } } void TurboAssembler::AddSubWithCarryMacro(const Register& rd, const Register& rn, const Operand& operand, FlagsUpdate S, AddSubWithCarryOp op) { DCHECK(rd.SizeInBits() == rn.SizeInBits()); UseScratchRegisterScope temps(this); if (operand.NeedsRelocation(this)) { Register temp = temps.AcquireX(); Ldr(temp, operand.immediate()); AddSubWithCarryMacro(rd, rn, temp, S, op); } else if (operand.IsImmediate() || (operand.IsShiftedRegister() && (operand.shift() == ROR))) { // Add/sub with carry (immediate or ROR shifted register.) Register temp = temps.AcquireSameSizeAs(rn); Mov(temp, operand); AddSubWithCarry(rd, rn, temp, S, op); } else if (operand.IsShiftedRegister() && (operand.shift_amount() != 0)) { // Add/sub with carry (shifted register). DCHECK(operand.reg().SizeInBits() == rd.SizeInBits()); DCHECK(operand.shift() != ROR); DCHECK(is_uintn(operand.shift_amount(), rd.SizeInBits() == kXRegSizeInBits ? kXRegSizeInBitsLog2 : kWRegSizeInBitsLog2)); Register temp = temps.AcquireSameSizeAs(rn); EmitShift(temp, operand.reg(), operand.shift(), operand.shift_amount()); AddSubWithCarry(rd, rn, temp, S, op); } else if (operand.IsExtendedRegister()) { // Add/sub with carry (extended register). DCHECK(operand.reg().SizeInBits() <= rd.SizeInBits()); // Add/sub extended supports a shift <= 4. We want to support exactly the // same modes. DCHECK_LE(operand.shift_amount(), 4); DCHECK(operand.reg().Is64Bits() || ((operand.extend() != UXTX) && (operand.extend() != SXTX))); Register temp = temps.AcquireSameSizeAs(rn); EmitExtendShift(temp, operand.reg(), operand.extend(), operand.shift_amount()); AddSubWithCarry(rd, rn, temp, S, op); } else { // The addressing mode is directly supported by the instruction. AddSubWithCarry(rd, rn, operand, S, op); } } void TurboAssembler::LoadStoreMacro(const CPURegister& rt, const MemOperand& addr, LoadStoreOp op) { int64_t offset = addr.offset(); unsigned size = CalcLSDataSize(op); // Check if an immediate offset fits in the immediate field of the // appropriate instruction. If not, emit two instructions to perform // the operation. if (addr.IsImmediateOffset() && !IsImmLSScaled(offset, size) && !IsImmLSUnscaled(offset)) { // Immediate offset that can't be encoded using unsigned or unscaled // addressing modes. UseScratchRegisterScope temps(this); Register temp = temps.AcquireSameSizeAs(addr.base()); Mov(temp, addr.offset()); LoadStore(rt, MemOperand(addr.base(), temp), op); } else if (addr.IsPostIndex() && !IsImmLSUnscaled(offset)) { // Post-index beyond unscaled addressing range. LoadStore(rt, MemOperand(addr.base()), op); add(addr.base(), addr.base(), offset); } else if (addr.IsPreIndex() && !IsImmLSUnscaled(offset)) { // Pre-index beyond unscaled addressing range. add(addr.base(), addr.base(), offset); LoadStore(rt, MemOperand(addr.base()), op); } else { // Encodable in one load/store instruction. LoadStore(rt, addr, op); } } void TurboAssembler::LoadStorePairMacro(const CPURegister& rt, const CPURegister& rt2, const MemOperand& addr, LoadStorePairOp op) { // TODO(all): Should we support register offset for load-store-pair? DCHECK(!addr.IsRegisterOffset()); int64_t offset = addr.offset(); unsigned size = CalcLSPairDataSize(op); // Check if the offset fits in the immediate field of the appropriate // instruction. If not, emit two instructions to perform the operation. if (IsImmLSPair(offset, size)) { // Encodable in one load/store pair instruction. LoadStorePair(rt, rt2, addr, op); } else { Register base = addr.base(); if (addr.IsImmediateOffset()) { UseScratchRegisterScope temps(this); Register temp = temps.AcquireSameSizeAs(base); Add(temp, base, offset); LoadStorePair(rt, rt2, MemOperand(temp), op); } else if (addr.IsPostIndex()) { LoadStorePair(rt, rt2, MemOperand(base), op); Add(base, base, offset); } else { DCHECK(addr.IsPreIndex()); Add(base, base, offset); LoadStorePair(rt, rt2, MemOperand(base), op); } } } bool TurboAssembler::NeedExtraInstructionsOrRegisterBranch( Label* label, ImmBranchType b_type) { bool need_longer_range = false; // There are two situations in which we care about the offset being out of // range: // - The label is bound but too far away. // - The label is not bound but linked, and the previous branch // instruction in the chain is too far away. if (label->is_bound() || label->is_linked()) { need_longer_range = !Instruction::IsValidImmPCOffset(b_type, label->pos() - pc_offset()); } if (!need_longer_range && !label->is_bound()) { int max_reachable_pc = pc_offset() + Instruction::ImmBranchRange(b_type); unresolved_branches_.insert( std::pair(max_reachable_pc, FarBranchInfo(pc_offset(), label))); // Also maintain the next pool check. next_veneer_pool_check_ = Min(next_veneer_pool_check_, max_reachable_pc - kVeneerDistanceCheckMargin); } return need_longer_range; } void TurboAssembler::Adr(const Register& rd, Label* label, AdrHint hint) { DCHECK(allow_macro_instructions()); DCHECK(!rd.IsZero()); if (hint == kAdrNear) { adr(rd, label); return; } DCHECK_EQ(hint, kAdrFar); if (label->is_bound()) { int label_offset = label->pos() - pc_offset(); if (Instruction::IsValidPCRelOffset(label_offset)) { adr(rd, label); } else { DCHECK_LE(label_offset, 0); int min_adr_offset = -(1 << (Instruction::ImmPCRelRangeBitwidth - 1)); adr(rd, min_adr_offset); Add(rd, rd, label_offset - min_adr_offset); } } else { UseScratchRegisterScope temps(this); Register scratch = temps.AcquireX(); InstructionAccurateScope scope( this, PatchingAssembler::kAdrFarPatchableNInstrs); adr(rd, label); for (int i = 0; i < PatchingAssembler::kAdrFarPatchableNNops; ++i) { nop(ADR_FAR_NOP); } movz(scratch, 0); } } void TurboAssembler::B(Label* label, BranchType type, Register reg, int bit) { DCHECK((reg.Is(NoReg) || type >= kBranchTypeFirstUsingReg) && (bit == -1 || type >= kBranchTypeFirstUsingBit)); if (kBranchTypeFirstCondition <= type && type <= kBranchTypeLastCondition) { B(static_cast(type), label); } else { switch (type) { case always: B(label); break; case never: break; case reg_zero: Cbz(reg, label); break; case reg_not_zero: Cbnz(reg, label); break; case reg_bit_clear: Tbz(reg, bit, label); break; case reg_bit_set: Tbnz(reg, bit, label); break; default: UNREACHABLE(); } } } void TurboAssembler::B(Label* label, Condition cond) { DCHECK(allow_macro_instructions()); DCHECK((cond != al) && (cond != nv)); Label done; bool need_extra_instructions = NeedExtraInstructionsOrRegisterBranch(label, CondBranchType); if (need_extra_instructions) { b(&done, NegateCondition(cond)); B(label); } else { b(label, cond); } bind(&done); } void TurboAssembler::Tbnz(const Register& rt, unsigned bit_pos, Label* label) { DCHECK(allow_macro_instructions()); Label done; bool need_extra_instructions = NeedExtraInstructionsOrRegisterBranch(label, TestBranchType); if (need_extra_instructions) { tbz(rt, bit_pos, &done); B(label); } else { tbnz(rt, bit_pos, label); } bind(&done); } void TurboAssembler::Tbz(const Register& rt, unsigned bit_pos, Label* label) { DCHECK(allow_macro_instructions()); Label done; bool need_extra_instructions = NeedExtraInstructionsOrRegisterBranch(label, TestBranchType); if (need_extra_instructions) { tbnz(rt, bit_pos, &done); B(label); } else { tbz(rt, bit_pos, label); } bind(&done); } void TurboAssembler::Cbnz(const Register& rt, Label* label) { DCHECK(allow_macro_instructions()); Label done; bool need_extra_instructions = NeedExtraInstructionsOrRegisterBranch(label, CompareBranchType); if (need_extra_instructions) { cbz(rt, &done); B(label); } else { cbnz(rt, label); } bind(&done); } void TurboAssembler::Cbz(const Register& rt, Label* label) { DCHECK(allow_macro_instructions()); Label done; bool need_extra_instructions = NeedExtraInstructionsOrRegisterBranch(label, CompareBranchType); if (need_extra_instructions) { cbnz(rt, &done); B(label); } else { cbz(rt, label); } bind(&done); } // Pseudo-instructions. void TurboAssembler::Abs(const Register& rd, const Register& rm, Label* is_not_representable, Label* is_representable) { DCHECK(allow_macro_instructions()); DCHECK(AreSameSizeAndType(rd, rm)); Cmp(rm, 1); Cneg(rd, rm, lt); // If the comparison sets the v flag, the input was the smallest value // representable by rm, and the mathematical result of abs(rm) is not // representable using two's complement. if ((is_not_representable != nullptr) && (is_representable != nullptr)) { B(is_not_representable, vs); B(is_representable); } else if (is_not_representable != nullptr) { B(is_not_representable, vs); } else if (is_representable != nullptr) { B(is_representable, vc); } } // Abstracted stack operations. void TurboAssembler::Push(const CPURegister& src0, const CPURegister& src1, const CPURegister& src2, const CPURegister& src3) { DCHECK(AreSameSizeAndType(src0, src1, src2, src3)); int count = 1 + src1.IsValid() + src2.IsValid() + src3.IsValid(); int size = src0.SizeInBytes(); DCHECK_EQ(0, (size * count) % 16); PushHelper(count, size, src0, src1, src2, src3); } void TurboAssembler::Push(const CPURegister& src0, const CPURegister& src1, const CPURegister& src2, const CPURegister& src3, const CPURegister& src4, const CPURegister& src5, const CPURegister& src6, const CPURegister& src7) { DCHECK(AreSameSizeAndType(src0, src1, src2, src3, src4, src5, src6, src7)); int count = 5 + src5.IsValid() + src6.IsValid() + src6.IsValid(); int size = src0.SizeInBytes(); DCHECK_EQ(0, (size * count) % 16); PushHelper(4, size, src0, src1, src2, src3); PushHelper(count - 4, size, src4, src5, src6, src7); } void TurboAssembler::Pop(const CPURegister& dst0, const CPURegister& dst1, const CPURegister& dst2, const CPURegister& dst3) { // It is not valid to pop into the same register more than once in one // instruction, not even into the zero register. DCHECK(!AreAliased(dst0, dst1, dst2, dst3)); DCHECK(AreSameSizeAndType(dst0, dst1, dst2, dst3)); DCHECK(dst0.IsValid()); int count = 1 + dst1.IsValid() + dst2.IsValid() + dst3.IsValid(); int size = dst0.SizeInBytes(); DCHECK_EQ(0, (size * count) % 16); PopHelper(count, size, dst0, dst1, dst2, dst3); } void TurboAssembler::Pop(const CPURegister& dst0, const CPURegister& dst1, const CPURegister& dst2, const CPURegister& dst3, const CPURegister& dst4, const CPURegister& dst5, const CPURegister& dst6, const CPURegister& dst7) { // It is not valid to pop into the same register more than once in one // instruction, not even into the zero register. DCHECK(!AreAliased(dst0, dst1, dst2, dst3, dst4, dst5, dst6, dst7)); DCHECK(AreSameSizeAndType(dst0, dst1, dst2, dst3, dst4, dst5, dst6, dst7)); DCHECK(dst0.IsValid()); int count = 5 + dst5.IsValid() + dst6.IsValid() + dst7.IsValid(); int size = dst0.SizeInBytes(); DCHECK_EQ(0, (size * count) % 16); PopHelper(4, size, dst0, dst1, dst2, dst3); PopHelper(count - 4, size, dst4, dst5, dst6, dst7); } void TurboAssembler::Push(const Register& src0, const VRegister& src1) { int size = src0.SizeInBytes() + src1.SizeInBytes(); DCHECK_EQ(0, size % 16); // Reserve room for src0 and push src1. str(src1, MemOperand(sp, -size, PreIndex)); // Fill the gap with src0. str(src0, MemOperand(sp, src1.SizeInBytes())); } void MacroAssembler::PushPopQueue::PushQueued() { DCHECK_EQ(0, size_ % 16); if (queued_.empty()) return; size_t count = queued_.size(); size_t index = 0; while (index < count) { // PushHelper can only handle registers with the same size and type, and it // can handle only four at a time. Batch them up accordingly. CPURegister batch[4] = {NoReg, NoReg, NoReg, NoReg}; int batch_index = 0; do { batch[batch_index++] = queued_[index++]; } while ((batch_index < 4) && (index < count) && batch[0].IsSameSizeAndType(queued_[index])); masm_->PushHelper(batch_index, batch[0].SizeInBytes(), batch[0], batch[1], batch[2], batch[3]); } queued_.clear(); } void MacroAssembler::PushPopQueue::PopQueued() { DCHECK_EQ(0, size_ % 16); if (queued_.empty()) return; size_t count = queued_.size(); size_t index = 0; while (index < count) { // PopHelper can only handle registers with the same size and type, and it // can handle only four at a time. Batch them up accordingly. CPURegister batch[4] = {NoReg, NoReg, NoReg, NoReg}; int batch_index = 0; do { batch[batch_index++] = queued_[index++]; } while ((batch_index < 4) && (index < count) && batch[0].IsSameSizeAndType(queued_[index])); masm_->PopHelper(batch_index, batch[0].SizeInBytes(), batch[0], batch[1], batch[2], batch[3]); } queued_.clear(); } void TurboAssembler::PushCPURegList(CPURegList registers) { int size = registers.RegisterSizeInBytes(); DCHECK_EQ(0, (size * registers.Count()) % 16); // Push up to four registers at a time. while (!registers.IsEmpty()) { int count_before = registers.Count(); const CPURegister& src0 = registers.PopHighestIndex(); const CPURegister& src1 = registers.PopHighestIndex(); const CPURegister& src2 = registers.PopHighestIndex(); const CPURegister& src3 = registers.PopHighestIndex(); int count = count_before - registers.Count(); PushHelper(count, size, src0, src1, src2, src3); } } void TurboAssembler::PopCPURegList(CPURegList registers) { int size = registers.RegisterSizeInBytes(); DCHECK_EQ(0, (size * registers.Count()) % 16); // Pop up to four registers at a time. while (!registers.IsEmpty()) { int count_before = registers.Count(); const CPURegister& dst0 = registers.PopLowestIndex(); const CPURegister& dst1 = registers.PopLowestIndex(); const CPURegister& dst2 = registers.PopLowestIndex(); const CPURegister& dst3 = registers.PopLowestIndex(); int count = count_before - registers.Count(); PopHelper(count, size, dst0, dst1, dst2, dst3); } } void MacroAssembler::PushMultipleTimes(CPURegister src, Register count) { UseScratchRegisterScope temps(this); Register temp = temps.AcquireSameSizeAs(count); if (FLAG_optimize_for_size) { Label loop, done; Subs(temp, count, 1); B(mi, &done); // Push all registers individually, to save code size. Bind(&loop); Subs(temp, temp, 1); PushHelper(1, src.SizeInBytes(), src, NoReg, NoReg, NoReg); B(pl, &loop); Bind(&done); } else { Label loop, leftover2, leftover1, done; Subs(temp, count, 4); B(mi, &leftover2); // Push groups of four first. Bind(&loop); Subs(temp, temp, 4); PushHelper(4, src.SizeInBytes(), src, src, src, src); B(pl, &loop); // Push groups of two. Bind(&leftover2); Tbz(count, 1, &leftover1); PushHelper(2, src.SizeInBytes(), src, src, NoReg, NoReg); // Push the last one (if required). Bind(&leftover1); Tbz(count, 0, &done); PushHelper(1, src.SizeInBytes(), src, NoReg, NoReg, NoReg); Bind(&done); } } void TurboAssembler::PushHelper(int count, int size, const CPURegister& src0, const CPURegister& src1, const CPURegister& src2, const CPURegister& src3) { // Ensure that we don't unintentially modify scratch or debug registers. InstructionAccurateScope scope(this); DCHECK(AreSameSizeAndType(src0, src1, src2, src3)); DCHECK(size == src0.SizeInBytes()); // When pushing multiple registers, the store order is chosen such that // Push(a, b) is equivalent to Push(a) followed by Push(b). switch (count) { case 1: DCHECK(src1.IsNone() && src2.IsNone() && src3.IsNone()); str(src0, MemOperand(sp, -1 * size, PreIndex)); break; case 2: DCHECK(src2.IsNone() && src3.IsNone()); stp(src1, src0, MemOperand(sp, -2 * size, PreIndex)); break; case 3: DCHECK(src3.IsNone()); stp(src2, src1, MemOperand(sp, -3 * size, PreIndex)); str(src0, MemOperand(sp, 2 * size)); break; case 4: // Skip over 4 * size, then fill in the gap. This allows four W registers // to be pushed using sp, whilst maintaining 16-byte alignment for sp // at all times. stp(src3, src2, MemOperand(sp, -4 * size, PreIndex)); stp(src1, src0, MemOperand(sp, 2 * size)); break; default: UNREACHABLE(); } } void TurboAssembler::PopHelper(int count, int size, const CPURegister& dst0, const CPURegister& dst1, const CPURegister& dst2, const CPURegister& dst3) { // Ensure that we don't unintentially modify scratch or debug registers. InstructionAccurateScope scope(this); DCHECK(AreSameSizeAndType(dst0, dst1, dst2, dst3)); DCHECK(size == dst0.SizeInBytes()); // When popping multiple registers, the load order is chosen such that // Pop(a, b) is equivalent to Pop(a) followed by Pop(b). switch (count) { case 1: DCHECK(dst1.IsNone() && dst2.IsNone() && dst3.IsNone()); ldr(dst0, MemOperand(sp, 1 * size, PostIndex)); break; case 2: DCHECK(dst2.IsNone() && dst3.IsNone()); ldp(dst0, dst1, MemOperand(sp, 2 * size, PostIndex)); break; case 3: DCHECK(dst3.IsNone()); ldr(dst2, MemOperand(sp, 2 * size)); ldp(dst0, dst1, MemOperand(sp, 3 * size, PostIndex)); break; case 4: // Load the higher addresses first, then load the lower addresses and // skip the whole block in the second instruction. This allows four W // registers to be popped using sp, whilst maintaining 16-byte alignment // for sp at all times. ldp(dst2, dst3, MemOperand(sp, 2 * size)); ldp(dst0, dst1, MemOperand(sp, 4 * size, PostIndex)); break; default: UNREACHABLE(); } } void TurboAssembler::Poke(const CPURegister& src, const Operand& offset) { if (offset.IsImmediate()) { DCHECK_GE(offset.ImmediateValue(), 0); } else if (emit_debug_code()) { Cmp(xzr, offset); Check(le, AbortReason::kStackAccessBelowStackPointer); } Str(src, MemOperand(sp, offset)); } void TurboAssembler::Peek(const CPURegister& dst, const Operand& offset) { if (offset.IsImmediate()) { DCHECK_GE(offset.ImmediateValue(), 0); } else if (emit_debug_code()) { Cmp(xzr, offset); Check(le, AbortReason::kStackAccessBelowStackPointer); } Ldr(dst, MemOperand(sp, offset)); } void TurboAssembler::PokePair(const CPURegister& src1, const CPURegister& src2, int offset) { DCHECK(AreSameSizeAndType(src1, src2)); DCHECK((offset >= 0) && ((offset % src1.SizeInBytes()) == 0)); Stp(src1, src2, MemOperand(sp, offset)); } void MacroAssembler::PeekPair(const CPURegister& dst1, const CPURegister& dst2, int offset) { DCHECK(AreSameSizeAndType(dst1, dst2)); DCHECK((offset >= 0) && ((offset % dst1.SizeInBytes()) == 0)); Ldp(dst1, dst2, MemOperand(sp, offset)); } void MacroAssembler::PushCalleeSavedRegisters() { // Ensure that the macro-assembler doesn't use any scratch registers. InstructionAccurateScope scope(this); MemOperand tos(sp, -2 * static_cast(kXRegSize), PreIndex); stp(d14, d15, tos); stp(d12, d13, tos); stp(d10, d11, tos); stp(d8, d9, tos); stp(x29, x30, tos); stp(x27, x28, tos); stp(x25, x26, tos); stp(x23, x24, tos); stp(x21, x22, tos); stp(x19, x20, tos); } void MacroAssembler::PopCalleeSavedRegisters() { // Ensure that the macro-assembler doesn't use any scratch registers. InstructionAccurateScope scope(this); MemOperand tos(sp, 2 * kXRegSize, PostIndex); ldp(x19, x20, tos); ldp(x21, x22, tos); ldp(x23, x24, tos); ldp(x25, x26, tos); ldp(x27, x28, tos); ldp(x29, x30, tos); ldp(d8, d9, tos); ldp(d10, d11, tos); ldp(d12, d13, tos); ldp(d14, d15, tos); } void TurboAssembler::AssertSpAligned() { if (emit_debug_code()) { HardAbortScope hard_abort(this); // Avoid calls to Abort. // Arm64 requires the stack pointer to be 16-byte aligned prior to address // calculation. UseScratchRegisterScope scope(this); Register temp = scope.AcquireX(); Mov(temp, sp); Tst(temp, 15); Check(eq, AbortReason::kUnexpectedStackPointer); } } void TurboAssembler::CopySlots(int dst, Register src, Register slot_count) { DCHECK(!src.IsZero()); UseScratchRegisterScope scope(this); Register dst_reg = scope.AcquireX(); SlotAddress(dst_reg, dst); SlotAddress(src, src); CopyDoubleWords(dst_reg, src, slot_count); } void TurboAssembler::CopySlots(Register dst, Register src, Register slot_count) { DCHECK(!dst.IsZero() && !src.IsZero()); SlotAddress(dst, dst); SlotAddress(src, src); CopyDoubleWords(dst, src, slot_count); } void TurboAssembler::CopyDoubleWords(Register dst, Register src, Register count, CopyDoubleWordsMode mode) { DCHECK(!AreAliased(dst, src, count)); if (emit_debug_code()) { Register pointer1 = dst; Register pointer2 = src; if (mode == kSrcLessThanDst) { pointer1 = src; pointer2 = dst; } // Copy requires pointer1 < pointer2 || (pointer1 - pointer2) >= count. Label pointer1_below_pointer2; Subs(pointer1, pointer1, pointer2); B(lt, &pointer1_below_pointer2); Cmp(pointer1, count); Check(ge, AbortReason::kOffsetOutOfRange); Bind(&pointer1_below_pointer2); Add(pointer1, pointer1, pointer2); } static_assert(kPointerSize == kDRegSize, "pointers must be the same size as doubles"); int direction = (mode == kDstLessThanSrc) ? 1 : -1; UseScratchRegisterScope scope(this); VRegister temp0 = scope.AcquireD(); VRegister temp1 = scope.AcquireD(); Label pairs, loop, done; Tbz(count, 0, &pairs); Ldr(temp0, MemOperand(src, direction * kPointerSize, PostIndex)); Sub(count, count, 1); Str(temp0, MemOperand(dst, direction * kPointerSize, PostIndex)); Bind(&pairs); if (mode == kSrcLessThanDst) { // Adjust pointers for post-index ldp/stp with negative offset: Sub(dst, dst, kPointerSize); Sub(src, src, kPointerSize); } Bind(&loop); Cbz(count, &done); Ldp(temp0, temp1, MemOperand(src, 2 * direction * kPointerSize, PostIndex)); Sub(count, count, 2); Stp(temp0, temp1, MemOperand(dst, 2 * direction * kPointerSize, PostIndex)); B(&loop); // TODO(all): large copies may benefit from using temporary Q registers // to copy four double words per iteration. Bind(&done); } void TurboAssembler::SlotAddress(Register dst, int slot_offset) { Add(dst, sp, slot_offset << kPointerSizeLog2); } void TurboAssembler::SlotAddress(Register dst, Register slot_offset) { Add(dst, sp, Operand(slot_offset, LSL, kPointerSizeLog2)); } void TurboAssembler::AssertFPCRState(Register fpcr) { if (emit_debug_code()) { Label unexpected_mode, done; UseScratchRegisterScope temps(this); if (fpcr.IsNone()) { fpcr = temps.AcquireX(); Mrs(fpcr, FPCR); } // Settings left to their default values: // - Assert that flush-to-zero is not set. Tbnz(fpcr, FZ_offset, &unexpected_mode); // - Assert that the rounding mode is nearest-with-ties-to-even. STATIC_ASSERT(FPTieEven == 0); Tst(fpcr, RMode_mask); B(eq, &done); Bind(&unexpected_mode); Abort(AbortReason::kUnexpectedFPCRMode); Bind(&done); } } void TurboAssembler::CanonicalizeNaN(const VRegister& dst, const VRegister& src) { AssertFPCRState(); // Subtracting 0.0 preserves all inputs except for signalling NaNs, which // become quiet NaNs. We use fsub rather than fadd because fsub preserves -0.0 // inputs: -0.0 + 0.0 = 0.0, but -0.0 - 0.0 = -0.0. Fsub(dst, src, fp_zero); } void TurboAssembler::LoadRoot(Register destination, RootIndex index) { // TODO(jbramley): Most root values are constants, and can be synthesized // without a load. Refer to the ARM back end for details. Ldr(destination, MemOperand(kRootRegister, RootRegisterOffset(index))); } void MacroAssembler::LoadObject(Register result, Handle