Blame - src/arm64/assembler-arm64.h - fp2-dev/platform/external/v8

blob: 53496f37ce23ee488dba879c14b350348a74dbd5 [file] [log] [blame]

Ben Murdoch	b8a8cc1	2014-11-26 15:28:44 +0000	[diff] [blame]	1	// Copyright 2013 the V8 project authors. All rights reserved.
				2	// Use of this source code is governed by a BSD-style license that can be
				3	// found in the LICENSE file.
				4
				5	#ifndef V8_ARM64_ASSEMBLER_ARM64_H_
				6	#define V8_ARM64_ASSEMBLER_ARM64_H_
				7
				8	#include <list>
				9	#include <map>
				10	#include <vector>
				11
				12	#include "src/arm64/instructions-arm64.h"
				13	#include "src/assembler.h"
				14	#include "src/globals.h"
				15	#include "src/serialize.h"
				16	#include "src/utils.h"
				17
				18
				19	namespace v8 {
				20	namespace internal {
				21
				22
				23	// -----------------------------------------------------------------------------
				24	// Registers.
				25	#define REGISTER_CODE_LIST(R) \
				26	R(0) R(1) R(2) R(3) R(4) R(5) R(6) R(7) \
				27	R(8) R(9) R(10) R(11) R(12) R(13) R(14) R(15) \
				28	R(16) R(17) R(18) R(19) R(20) R(21) R(22) R(23) \
				29	R(24) R(25) R(26) R(27) R(28) R(29) R(30) R(31)
				30
				31
				32	static const int kRegListSizeInBits = sizeof(RegList) * kBitsPerByte;
				33
				34
				35	// Some CPURegister methods can return Register and FPRegister types, so we
				36	// need to declare them in advance.
				37	struct Register;
				38	struct FPRegister;
				39
				40
				41	struct CPURegister {
				42	enum RegisterType {
				43	// The kInvalid value is used to detect uninitialized static instances,
				44	// which are always zero-initialized before any constructors are called.
				45	kInvalid = 0,
				46	kRegister,
				47	kFPRegister,
				48	kNoRegister
				49	};
				50
				51	static CPURegister Create(unsigned code, unsigned size, RegisterType type) {
				52	CPURegister r = {code, size, type};
				53	return r;
				54	}
				55
				56	unsigned code() const;
				57	RegisterType type() const;
				58	RegList Bit() const;
				59	unsigned SizeInBits() const;
				60	int SizeInBytes() const;
				61	bool Is32Bits() const;
				62	bool Is64Bits() const;
				63	bool IsValid() const;
				64	bool IsValidOrNone() const;
				65	bool IsValidRegister() const;
				66	bool IsValidFPRegister() const;
				67	bool IsNone() const;
				68	bool Is(const CPURegister& other) const;
				69	bool Aliases(const CPURegister& other) const;
				70
				71	bool IsZero() const;
				72	bool IsSP() const;
				73
				74	bool IsRegister() const;
				75	bool IsFPRegister() const;
				76
				77	Register X() const;
				78	Register W() const;
				79	FPRegister D() const;
				80	FPRegister S() const;
				81
				82	bool IsSameSizeAndType(const CPURegister& other) const;
				83
				84	// V8 compatibility.
				85	bool is(const CPURegister& other) const { return Is(other); }
				86	bool is_valid() const { return IsValid(); }
				87
				88	unsigned reg_code;
				89	unsigned reg_size;
				90	RegisterType reg_type;
				91	};
				92
				93
				94	struct Register : public CPURegister {
				95	static Register Create(unsigned code, unsigned size) {
				96	return Register(CPURegister::Create(code, size, CPURegister::kRegister));
				97	}
				98
				99	Register() {
				100	reg_code = 0;
				101	reg_size = 0;
				102	reg_type = CPURegister::kNoRegister;
				103	}
				104
				105	explicit Register(const CPURegister& r) {
				106	reg_code = r.reg_code;
				107	reg_size = r.reg_size;
				108	reg_type = r.reg_type;
				109	DCHECK(IsValidOrNone());
				110	}
				111
				112	Register(const Register& r) { // NOLINT(runtime/explicit)
				113	reg_code = r.reg_code;
				114	reg_size = r.reg_size;
				115	reg_type = r.reg_type;
				116	DCHECK(IsValidOrNone());
				117	}
				118
				119	bool IsValid() const {
				120	DCHECK(IsRegister() \|\| IsNone());
				121	return IsValidRegister();
				122	}
				123
				124	static Register XRegFromCode(unsigned code);
				125	static Register WRegFromCode(unsigned code);
				126
				127	// Start of V8 compatibility section ---------------------
				128	// These memebers are necessary for compilation.
				129	// A few of them may be unused for now.
				130
				131	static const int kNumRegisters = kNumberOfRegisters;
				132	static int NumRegisters() { return kNumRegisters; }
				133
				134	// We allow crankshaft to use the following registers:
				135	// - x0 to x15
				136	// - x18 to x24
				137	// - x27 (also context)
				138	//
				139	// TODO(all): Register x25 is currently free and could be available for
				140	// crankshaft, but we don't use it as we might use it as a per function
				141	// literal pool pointer in the future.
				142	//
				143	// TODO(all): Consider storing cp in x25 to have only two ranges.
				144	// We split allocatable registers in three ranges called
				145	// - "low range"
				146	// - "high range"
				147	// - "context"
				148	static const unsigned kAllocatableLowRangeBegin = 0;
				149	static const unsigned kAllocatableLowRangeEnd = 15;
				150	static const unsigned kAllocatableHighRangeBegin = 18;
				151	static const unsigned kAllocatableHighRangeEnd = 24;
				152	static const unsigned kAllocatableContext = 27;
				153
				154	// Gap between low and high ranges.
				155	static const int kAllocatableRangeGapSize =
				156	(kAllocatableHighRangeBegin - kAllocatableLowRangeEnd) - 1;
				157
				158	static const int kMaxNumAllocatableRegisters =
				159	(kAllocatableLowRangeEnd - kAllocatableLowRangeBegin + 1) +
				160	(kAllocatableHighRangeEnd - kAllocatableHighRangeBegin + 1) + 1; // cp
				161	static int NumAllocatableRegisters() { return kMaxNumAllocatableRegisters; }
				162
				163	// Return true if the register is one that crankshaft can allocate.
				164	bool IsAllocatable() const {
				165	return ((reg_code == kAllocatableContext) \|\|
				166	(reg_code <= kAllocatableLowRangeEnd) \|\|
				167	((reg_code >= kAllocatableHighRangeBegin) &&
				168	(reg_code <= kAllocatableHighRangeEnd)));
				169	}
				170
				171	static Register FromAllocationIndex(unsigned index) {
				172	DCHECK(index < static_cast<unsigned>(NumAllocatableRegisters()));
				173	// cp is the last allocatable register.
				174	if (index == (static_cast<unsigned>(NumAllocatableRegisters() - 1))) {
				175	return from_code(kAllocatableContext);
				176	}
				177
				178	// Handle low and high ranges.
				179	return (index <= kAllocatableLowRangeEnd)
				180	? from_code(index)
				181	: from_code(index + kAllocatableRangeGapSize);
				182	}
				183
				184	static const char* AllocationIndexToString(int index) {
				185	DCHECK((index >= 0) && (index < NumAllocatableRegisters()));
				186	DCHECK((kAllocatableLowRangeBegin == 0) &&
				187	(kAllocatableLowRangeEnd == 15) &&
				188	(kAllocatableHighRangeBegin == 18) &&
				189	(kAllocatableHighRangeEnd == 24) &&
				190	(kAllocatableContext == 27));
				191	const char* const names[] = {
				192	"x0", "x1", "x2", "x3", "x4",
				193	"x5", "x6", "x7", "x8", "x9",
				194	"x10", "x11", "x12", "x13", "x14",
				195	"x15", "x18", "x19", "x20", "x21",
				196	"x22", "x23", "x24", "x27",
				197	};
				198	return names[index];
				199	}
				200
				201	static int ToAllocationIndex(Register reg) {
				202	DCHECK(reg.IsAllocatable());
				203	unsigned code = reg.code();
				204	if (code == kAllocatableContext) {
				205	return NumAllocatableRegisters() - 1;
				206	}
				207
				208	return (code <= kAllocatableLowRangeEnd)
				209	? code
				210	: code - kAllocatableRangeGapSize;
				211	}
				212
				213	static Register from_code(int code) {
				214	// Always return an X register.
				215	return Register::Create(code, kXRegSizeInBits);
				216	}
				217
				218	// End of V8 compatibility section -----------------------
				219	};
				220
				221
				222	struct FPRegister : public CPURegister {
				223	static FPRegister Create(unsigned code, unsigned size) {
				224	return FPRegister(
				225	CPURegister::Create(code, size, CPURegister::kFPRegister));
				226	}
				227
				228	FPRegister() {
				229	reg_code = 0;
				230	reg_size = 0;
				231	reg_type = CPURegister::kNoRegister;
				232	}
				233
				234	explicit FPRegister(const CPURegister& r) {
				235	reg_code = r.reg_code;
				236	reg_size = r.reg_size;
				237	reg_type = r.reg_type;
				238	DCHECK(IsValidOrNone());
				239	}
				240
				241	FPRegister(const FPRegister& r) { // NOLINT(runtime/explicit)
				242	reg_code = r.reg_code;
				243	reg_size = r.reg_size;
				244	reg_type = r.reg_type;
				245	DCHECK(IsValidOrNone());
				246	}
				247
				248	bool IsValid() const {
				249	DCHECK(IsFPRegister() \|\| IsNone());
				250	return IsValidFPRegister();
				251	}
				252
				253	static FPRegister SRegFromCode(unsigned code);
				254	static FPRegister DRegFromCode(unsigned code);
				255
				256	// Start of V8 compatibility section ---------------------
				257	static const int kMaxNumRegisters = kNumberOfFPRegisters;
				258
				259	// Crankshaft can use all the FP registers except:
				260	// - d15 which is used to keep the 0 double value
				261	// - d30 which is used in crankshaft as a double scratch register
				262	// - d31 which is used in the MacroAssembler as a double scratch register
				263	static const unsigned kAllocatableLowRangeBegin = 0;
				264	static const unsigned kAllocatableLowRangeEnd = 14;
				265	static const unsigned kAllocatableHighRangeBegin = 16;
				266	static const unsigned kAllocatableHighRangeEnd = 28;
				267
				268	static const RegList kAllocatableFPRegisters = 0x1fff7fff;
				269
				270	// Gap between low and high ranges.
				271	static const int kAllocatableRangeGapSize =
				272	(kAllocatableHighRangeBegin - kAllocatableLowRangeEnd) - 1;
				273
				274	static const int kMaxNumAllocatableRegisters =
				275	(kAllocatableLowRangeEnd - kAllocatableLowRangeBegin + 1) +
				276	(kAllocatableHighRangeEnd - kAllocatableHighRangeBegin + 1);
				277	static int NumAllocatableRegisters() { return kMaxNumAllocatableRegisters; }
				278
Emily Bernier	d0a1eb7	2015-03-24 16:35:39 -0400	[diff] [blame^]	279	// TODO(turbofan): Proper float32 support.
				280	static int NumAllocatableAliasedRegisters() {
				281	return NumAllocatableRegisters();
				282	}
				283
Ben Murdoch	b8a8cc1	2014-11-26 15:28:44 +0000	[diff] [blame]	284	// Return true if the register is one that crankshaft can allocate.
				285	bool IsAllocatable() const {
				286	return (Bit() & kAllocatableFPRegisters) != 0;
				287	}
				288
				289	static FPRegister FromAllocationIndex(unsigned int index) {
				290	DCHECK(index < static_cast<unsigned>(NumAllocatableRegisters()));
				291
				292	return (index <= kAllocatableLowRangeEnd)
				293	? from_code(index)
				294	: from_code(index + kAllocatableRangeGapSize);
				295	}
				296
				297	static const char* AllocationIndexToString(int index) {
				298	DCHECK((index >= 0) && (index < NumAllocatableRegisters()));
				299	DCHECK((kAllocatableLowRangeBegin == 0) &&
				300	(kAllocatableLowRangeEnd == 14) &&
				301	(kAllocatableHighRangeBegin == 16) &&
				302	(kAllocatableHighRangeEnd == 28));
				303	const char* const names[] = {
				304	"d0", "d1", "d2", "d3", "d4", "d5", "d6", "d7",
				305	"d8", "d9", "d10", "d11", "d12", "d13", "d14",
				306	"d16", "d17", "d18", "d19", "d20", "d21", "d22", "d23",
				307	"d24", "d25", "d26", "d27", "d28"
				308	};
				309	return names[index];
				310	}
				311
				312	static int ToAllocationIndex(FPRegister reg) {
				313	DCHECK(reg.IsAllocatable());
				314	unsigned code = reg.code();
				315
				316	return (code <= kAllocatableLowRangeEnd)
				317	? code
				318	: code - kAllocatableRangeGapSize;
				319	}
				320
				321	static FPRegister from_code(int code) {
				322	// Always return a D register.
				323	return FPRegister::Create(code, kDRegSizeInBits);
				324	}
				325	// End of V8 compatibility section -----------------------
				326	};
				327
				328
				329	STATIC_ASSERT(sizeof(CPURegister) == sizeof(Register));
				330	STATIC_ASSERT(sizeof(CPURegister) == sizeof(FPRegister));
				331
				332
				333	#if defined(ARM64_DEFINE_REG_STATICS)
				334	#define INITIALIZE_REGISTER(register_class, name, code, size, type) \
				335	const CPURegister init_##register_class##_##name = {code, size, type}; \
				336	const register_class& name = reinterpret_cast<const register_class>( \
				337	&init_##register_class##_##name)
				338	#define ALIAS_REGISTER(register_class, alias, name) \
				339	const register_class& alias = reinterpret_cast<const register_class>( \
				340	&init_##register_class##_##name)
				341	#else
				342	#define INITIALIZE_REGISTER(register_class, name, code, size, type) \
				343	extern const register_class& name
				344	#define ALIAS_REGISTER(register_class, alias, name) \
				345	extern const register_class& alias
				346	#endif // defined(ARM64_DEFINE_REG_STATICS)
				347
				348	// No*Reg is used to indicate an unused argument, or an error case. Note that
				349	// these all compare equal (using the Is() method). The Register and FPRegister
				350	// variants are provided for convenience.
				351	INITIALIZE_REGISTER(Register, NoReg, 0, 0, CPURegister::kNoRegister);
				352	INITIALIZE_REGISTER(FPRegister, NoFPReg, 0, 0, CPURegister::kNoRegister);
				353	INITIALIZE_REGISTER(CPURegister, NoCPUReg, 0, 0, CPURegister::kNoRegister);
				354
				355	// v8 compatibility.
				356	INITIALIZE_REGISTER(Register, no_reg, 0, 0, CPURegister::kNoRegister);
				357
				358	#define DEFINE_REGISTERS(N) \
				359	INITIALIZE_REGISTER(Register, w##N, N, \
				360	kWRegSizeInBits, CPURegister::kRegister); \
				361	INITIALIZE_REGISTER(Register, x##N, N, \
				362	kXRegSizeInBits, CPURegister::kRegister);
				363	REGISTER_CODE_LIST(DEFINE_REGISTERS)
				364	#undef DEFINE_REGISTERS
				365
				366	INITIALIZE_REGISTER(Register, wcsp, kSPRegInternalCode, kWRegSizeInBits,
				367	CPURegister::kRegister);
				368	INITIALIZE_REGISTER(Register, csp, kSPRegInternalCode, kXRegSizeInBits,
				369	CPURegister::kRegister);
				370
				371	#define DEFINE_FPREGISTERS(N) \
				372	INITIALIZE_REGISTER(FPRegister, s##N, N, \
				373	kSRegSizeInBits, CPURegister::kFPRegister); \
				374	INITIALIZE_REGISTER(FPRegister, d##N, N, \
				375	kDRegSizeInBits, CPURegister::kFPRegister);
				376	REGISTER_CODE_LIST(DEFINE_FPREGISTERS)
				377	#undef DEFINE_FPREGISTERS
				378
				379	#undef INITIALIZE_REGISTER
				380
				381	// Registers aliases.
				382	ALIAS_REGISTER(Register, ip0, x16);
				383	ALIAS_REGISTER(Register, ip1, x17);
				384	ALIAS_REGISTER(Register, wip0, w16);
				385	ALIAS_REGISTER(Register, wip1, w17);
				386	// Root register.
				387	ALIAS_REGISTER(Register, root, x26);
				388	ALIAS_REGISTER(Register, rr, x26);
				389	// Context pointer register.
				390	ALIAS_REGISTER(Register, cp, x27);
				391	// We use a register as a JS stack pointer to overcome the restriction on the
				392	// architectural SP alignment.
				393	// We chose x28 because it is contiguous with the other specific purpose
				394	// registers.
				395	STATIC_ASSERT(kJSSPCode == 28);
				396	ALIAS_REGISTER(Register, jssp, x28);
				397	ALIAS_REGISTER(Register, wjssp, w28);
				398	ALIAS_REGISTER(Register, fp, x29);
				399	ALIAS_REGISTER(Register, lr, x30);
				400	ALIAS_REGISTER(Register, xzr, x31);
				401	ALIAS_REGISTER(Register, wzr, w31);
				402
				403	// Keeps the 0 double value.
				404	ALIAS_REGISTER(FPRegister, fp_zero, d15);
				405	// Crankshaft double scratch register.
				406	ALIAS_REGISTER(FPRegister, crankshaft_fp_scratch, d29);
				407	// MacroAssembler double scratch registers.
				408	ALIAS_REGISTER(FPRegister, fp_scratch, d30);
				409	ALIAS_REGISTER(FPRegister, fp_scratch1, d30);
				410	ALIAS_REGISTER(FPRegister, fp_scratch2, d31);
				411
				412	#undef ALIAS_REGISTER
				413
				414
				415	Register GetAllocatableRegisterThatIsNotOneOf(Register reg1,
				416	Register reg2 = NoReg,
				417	Register reg3 = NoReg,
				418	Register reg4 = NoReg);
				419
				420
				421	// AreAliased returns true if any of the named registers overlap. Arguments set
				422	// to NoReg are ignored. The system stack pointer may be specified.
				423	bool AreAliased(const CPURegister& reg1,
				424	const CPURegister& reg2,
				425	const CPURegister& reg3 = NoReg,
				426	const CPURegister& reg4 = NoReg,
				427	const CPURegister& reg5 = NoReg,
				428	const CPURegister& reg6 = NoReg,
				429	const CPURegister& reg7 = NoReg,
				430	const CPURegister& reg8 = NoReg);
				431
				432	// AreSameSizeAndType returns true if all of the specified registers have the
				433	// same size, and are of the same type. The system stack pointer may be
				434	// specified. Arguments set to NoReg are ignored, as are any subsequent
				435	// arguments. At least one argument (reg1) must be valid (not NoCPUReg).
				436	bool AreSameSizeAndType(const CPURegister& reg1,
				437	const CPURegister& reg2,
				438	const CPURegister& reg3 = NoCPUReg,
				439	const CPURegister& reg4 = NoCPUReg,
				440	const CPURegister& reg5 = NoCPUReg,
				441	const CPURegister& reg6 = NoCPUReg,
				442	const CPURegister& reg7 = NoCPUReg,
				443	const CPURegister& reg8 = NoCPUReg);
				444
				445
				446	typedef FPRegister DoubleRegister;
				447
				448
				449	// -----------------------------------------------------------------------------
				450	// Lists of registers.
				451	class CPURegList {
				452	public:
				453	explicit CPURegList(CPURegister reg1,
				454	CPURegister reg2 = NoCPUReg,
				455	CPURegister reg3 = NoCPUReg,
				456	CPURegister reg4 = NoCPUReg)
				457	: list_(reg1.Bit() \| reg2.Bit() \| reg3.Bit() \| reg4.Bit()),
				458	size_(reg1.SizeInBits()), type_(reg1.type()) {
				459	DCHECK(AreSameSizeAndType(reg1, reg2, reg3, reg4));
				460	DCHECK(IsValid());
				461	}
				462
				463	CPURegList(CPURegister::RegisterType type, unsigned size, RegList list)
				464	: list_(list), size_(size), type_(type) {
				465	DCHECK(IsValid());
				466	}
				467
				468	CPURegList(CPURegister::RegisterType type, unsigned size,
				469	unsigned first_reg, unsigned last_reg)
				470	: size_(size), type_(type) {
				471	DCHECK(((type == CPURegister::kRegister) &&
				472	(last_reg < kNumberOfRegisters)) \|\|
				473	((type == CPURegister::kFPRegister) &&
				474	(last_reg < kNumberOfFPRegisters)));
				475	DCHECK(last_reg >= first_reg);
				476	list_ = (1UL << (last_reg + 1)) - 1;
				477	list_ &= ~((1UL << first_reg) - 1);
				478	DCHECK(IsValid());
				479	}
				480
				481	CPURegister::RegisterType type() const {
				482	DCHECK(IsValid());
				483	return type_;
				484	}
				485
				486	RegList list() const {
				487	DCHECK(IsValid());
				488	return list_;
				489	}
				490
				491	inline void set_list(RegList new_list) {
				492	DCHECK(IsValid());
				493	list_ = new_list;
				494	}
				495
				496	// Combine another CPURegList into this one. Registers that already exist in
				497	// this list are left unchanged. The type and size of the registers in the
				498	// 'other' list must match those in this list.
				499	void Combine(const CPURegList& other);
				500
				501	// Remove every register in the other CPURegList from this one. Registers that
				502	// do not exist in this list are ignored. The type of the registers in the
				503	// 'other' list must match those in this list.
				504	void Remove(const CPURegList& other);
				505
				506	// Variants of Combine and Remove which take CPURegisters.
				507	void Combine(const CPURegister& other);
				508	void Remove(const CPURegister& other1,
				509	const CPURegister& other2 = NoCPUReg,
				510	const CPURegister& other3 = NoCPUReg,
				511	const CPURegister& other4 = NoCPUReg);
				512
				513	// Variants of Combine and Remove which take a single register by its code;
				514	// the type and size of the register is inferred from this list.
				515	void Combine(int code);
				516	void Remove(int code);
				517
				518	// Remove all callee-saved registers from the list. This can be useful when
				519	// preparing registers for an AAPCS64 function call, for example.
				520	void RemoveCalleeSaved();
				521
				522	CPURegister PopLowestIndex();
				523	CPURegister PopHighestIndex();
				524
				525	// AAPCS64 callee-saved registers.
				526	static CPURegList GetCalleeSaved(unsigned size = kXRegSizeInBits);
				527	static CPURegList GetCalleeSavedFP(unsigned size = kDRegSizeInBits);
				528
				529	// AAPCS64 caller-saved registers. Note that this includes lr.
				530	static CPURegList GetCallerSaved(unsigned size = kXRegSizeInBits);
				531	static CPURegList GetCallerSavedFP(unsigned size = kDRegSizeInBits);
				532
				533	// Registers saved as safepoints.
				534	static CPURegList GetSafepointSavedRegisters();
				535
				536	bool IsEmpty() const {
				537	DCHECK(IsValid());
				538	return list_ == 0;
				539	}
				540
				541	bool IncludesAliasOf(const CPURegister& other1,
				542	const CPURegister& other2 = NoCPUReg,
				543	const CPURegister& other3 = NoCPUReg,
				544	const CPURegister& other4 = NoCPUReg) const {
				545	DCHECK(IsValid());
				546	RegList list = 0;
				547	if (!other1.IsNone() && (other1.type() == type_)) list \|= other1.Bit();
				548	if (!other2.IsNone() && (other2.type() == type_)) list \|= other2.Bit();
				549	if (!other3.IsNone() && (other3.type() == type_)) list \|= other3.Bit();
				550	if (!other4.IsNone() && (other4.type() == type_)) list \|= other4.Bit();
				551	return (list_ & list) != 0;
				552	}
				553
				554	int Count() const {
				555	DCHECK(IsValid());
				556	return CountSetBits(list_, kRegListSizeInBits);
				557	}
				558
				559	unsigned RegisterSizeInBits() const {
				560	DCHECK(IsValid());
				561	return size_;
				562	}
				563
				564	unsigned RegisterSizeInBytes() const {
				565	int size_in_bits = RegisterSizeInBits();
				566	DCHECK((size_in_bits % kBitsPerByte) == 0);
				567	return size_in_bits / kBitsPerByte;
				568	}
				569
				570	unsigned TotalSizeInBytes() const {
				571	DCHECK(IsValid());
				572	return RegisterSizeInBytes() * Count();
				573	}
				574
				575	private:
				576	RegList list_;
				577	unsigned size_;
				578	CPURegister::RegisterType type_;
				579
				580	bool IsValid() const {
				581	const RegList kValidRegisters = 0x8000000ffffffff;
				582	const RegList kValidFPRegisters = 0x0000000ffffffff;
				583	switch (type_) {
				584	case CPURegister::kRegister:
				585	return (list_ & kValidRegisters) == list_;
				586	case CPURegister::kFPRegister:
				587	return (list_ & kValidFPRegisters) == list_;
				588	case CPURegister::kNoRegister:
				589	return list_ == 0;
				590	default:
				591	UNREACHABLE();
				592	return false;
				593	}
				594	}
				595	};
				596
				597
				598	// AAPCS64 callee-saved registers.
				599	#define kCalleeSaved CPURegList::GetCalleeSaved()
				600	#define kCalleeSavedFP CPURegList::GetCalleeSavedFP()
				601
				602
				603	// AAPCS64 caller-saved registers. Note that this includes lr.
				604	#define kCallerSaved CPURegList::GetCallerSaved()
				605	#define kCallerSavedFP CPURegList::GetCallerSavedFP()
				606
				607	// -----------------------------------------------------------------------------
				608	// Immediates.
				609	class Immediate {
				610	public:
				611	template<typename T>
				612	inline explicit Immediate(Handle<T> handle);
				613
				614	// This is allowed to be an implicit constructor because Immediate is
				615	// a wrapper class that doesn't normally perform any type conversion.
				616	template<typename T>
				617	inline Immediate(T value); // NOLINT(runtime/explicit)
				618
				619	template<typename T>
				620	inline Immediate(T value, RelocInfo::Mode rmode);
				621
				622	int64_t value() const { return value_; }
				623	RelocInfo::Mode rmode() const { return rmode_; }
				624
				625	private:
				626	void InitializeHandle(Handle<Object> value);
				627
				628	int64_t value_;
				629	RelocInfo::Mode rmode_;
				630	};
				631
				632
				633	// -----------------------------------------------------------------------------
				634	// Operands.
				635	const int kSmiShift = kSmiTagSize + kSmiShiftSize;
				636	const uint64_t kSmiShiftMask = (1UL << kSmiShift) - 1;
				637
				638	// Represents an operand in a machine instruction.
				639	class Operand {
				640	// TODO(all): If necessary, study more in details which methods
				641	// TODO(all): should be inlined or not.
				642	public:
				643	// rm, {<shift> {#<shift_amount>}}
				644	// where <shift> is one of {LSL, LSR, ASR, ROR}.
				645	// <shift_amount> is uint6_t.
				646	// This is allowed to be an implicit constructor because Operand is
				647	// a wrapper class that doesn't normally perform any type conversion.
				648	inline Operand(Register reg,
				649	Shift shift = LSL,
				650	unsigned shift_amount = 0); // NOLINT(runtime/explicit)
				651
				652	// rm, <extend> {#<shift_amount>}
				653	// where <extend> is one of {UXTB, UXTH, UXTW, UXTX, SXTB, SXTH, SXTW, SXTX}.
				654	// <shift_amount> is uint2_t.
				655	inline Operand(Register reg,
				656	Extend extend,
				657	unsigned shift_amount = 0);
				658
				659	template<typename T>
				660	inline explicit Operand(Handle<T> handle);
				661
				662	// Implicit constructor for all int types, ExternalReference, and Smi.
				663	template<typename T>
				664	inline Operand(T t); // NOLINT(runtime/explicit)
				665
				666	// Implicit constructor for int types.
				667	template<typename T>
				668	inline Operand(T t, RelocInfo::Mode rmode);
				669
				670	inline bool IsImmediate() const;
				671	inline bool IsShiftedRegister() const;
				672	inline bool IsExtendedRegister() const;
				673	inline bool IsZero() const;
				674
				675	// This returns an LSL shift (<= 4) operand as an equivalent extend operand,
				676	// which helps in the encoding of instructions that use the stack pointer.
				677	inline Operand ToExtendedRegister() const;
				678
				679	inline Immediate immediate() const;
				680	inline int64_t ImmediateValue() const;
				681	inline Register reg() const;
				682	inline Shift shift() const;
				683	inline Extend extend() const;
				684	inline unsigned shift_amount() const;
				685
				686	// Relocation information.
				687	bool NeedsRelocation(const Assembler* assembler) const;
				688
				689	// Helpers
				690	inline static Operand UntagSmi(Register smi);
				691	inline static Operand UntagSmiAndScale(Register smi, int scale);
				692
				693	private:
				694	Immediate immediate_;
				695	Register reg_;
				696	Shift shift_;
				697	Extend extend_;
				698	unsigned shift_amount_;
				699	};
				700
				701
				702	// MemOperand represents a memory operand in a load or store instruction.
				703	class MemOperand {
				704	public:
				705	inline MemOperand();
				706	inline explicit MemOperand(Register base,
				707	int64_t offset = 0,
				708	AddrMode addrmode = Offset);
				709	inline explicit MemOperand(Register base,
				710	Register regoffset,
				711	Shift shift = LSL,
				712	unsigned shift_amount = 0);
				713	inline explicit MemOperand(Register base,
				714	Register regoffset,
				715	Extend extend,
				716	unsigned shift_amount = 0);
				717	inline explicit MemOperand(Register base,
				718	const Operand& offset,
				719	AddrMode addrmode = Offset);
				720
				721	const Register& base() const { return base_; }
				722	const Register& regoffset() const { return regoffset_; }
				723	int64_t offset() const { return offset_; }
				724	AddrMode addrmode() const { return addrmode_; }
				725	Shift shift() const { return shift_; }
				726	Extend extend() const { return extend_; }
				727	unsigned shift_amount() const { return shift_amount_; }
				728	inline bool IsImmediateOffset() const;
				729	inline bool IsRegisterOffset() const;
				730	inline bool IsPreIndex() const;
				731	inline bool IsPostIndex() const;
				732
				733	// For offset modes, return the offset as an Operand. This helper cannot
				734	// handle indexed modes.
				735	inline Operand OffsetAsOperand() const;
				736
				737	enum PairResult {
				738	kNotPair, // Can't use a pair instruction.
				739	kPairAB, // Can use a pair instruction (operandA has lower address).
				740	kPairBA // Can use a pair instruction (operandB has lower address).
				741	};
				742	// Check if two MemOperand are consistent for stp/ldp use.
				743	static PairResult AreConsistentForPair(const MemOperand& operandA,
				744	const MemOperand& operandB,
				745	int access_size_log2 = kXRegSizeLog2);
				746
				747	private:
				748	Register base_;
				749	Register regoffset_;
				750	int64_t offset_;
				751	AddrMode addrmode_;
				752	Shift shift_;
				753	Extend extend_;
				754	unsigned shift_amount_;
				755	};
				756
				757
				758	class ConstPool {
				759	public:
				760	explicit ConstPool(Assembler* assm)
				761	: assm_(assm),
				762	first_use_(-1),
				763	shared_entries_count(0) {}
				764	void RecordEntry(intptr_t data, RelocInfo::Mode mode);
				765	int EntryCount() const {
				766	return shared_entries_count + unique_entries_.size();
				767	}
				768	bool IsEmpty() const {
				769	return shared_entries_.empty() && unique_entries_.empty();
				770	}
				771	// Distance in bytes between the current pc and the first instruction
				772	// using the pool. If there are no pending entries return kMaxInt.
				773	int DistanceToFirstUse();
				774	// Offset after which instructions using the pool will be out of range.
				775	int MaxPcOffset();
				776	// Maximum size the constant pool can be with current entries. It always
				777	// includes alignment padding and branch over.
				778	int WorstCaseSize();
				779	// Size in bytes of the literal pool if it is emitted at the current
				780	// pc. The size will include the branch over the pool if it was requested.
				781	int SizeIfEmittedAtCurrentPc(bool require_jump);
				782	// Emit the literal pool at the current pc with a branch over the pool if
				783	// requested.
				784	void Emit(bool require_jump);
				785	// Discard any pending pool entries.
				786	void Clear();
				787
				788	private:
				789	bool CanBeShared(RelocInfo::Mode mode);
				790	void EmitMarker();
				791	void EmitGuard();
				792	void EmitEntries();
				793
				794	Assembler* assm_;
				795	// Keep track of the first instruction requiring a constant pool entry
				796	// since the previous constant pool was emitted.
				797	int first_use_;
				798	// values, pc offset(s) of entries which can be shared.
				799	std::multimap<uint64_t, int> shared_entries_;
				800	// Number of distinct literal in shared entries.
				801	int shared_entries_count;
				802	// values, pc offset of entries which cannot be shared.
				803	std::vector<std::pair<uint64_t, int> > unique_entries_;
				804	};
				805
				806
				807	// -----------------------------------------------------------------------------
				808	// Assembler.
				809
				810	class Assembler : public AssemblerBase {
				811	public:
				812	// Create an assembler. Instructions and relocation information are emitted
				813	// into a buffer, with the instructions starting from the beginning and the
				814	// relocation information starting from the end of the buffer. See CodeDesc
				815	// for a detailed comment on the layout (globals.h).
				816	//
				817	// If the provided buffer is NULL, the assembler allocates and grows its own
				818	// buffer, and buffer_size determines the initial buffer size. The buffer is
				819	// owned by the assembler and deallocated upon destruction of the assembler.
				820	//
				821	// If the provided buffer is not NULL, the assembler uses the provided buffer
				822	// for code generation and assumes its size to be buffer_size. If the buffer
				823	// is too small, a fatal error occurs. No deallocation of the buffer is done
				824	// upon destruction of the assembler.
				825	Assembler(Isolate* arg_isolate, void* buffer, int buffer_size);
				826
				827	virtual ~Assembler();
				828
				829	virtual void AbortedCodeGeneration() {  // Virtual hook; this implementation only calls constpool_.Clear().
				830	constpool_.Clear();
				831	}
				832
				833	// System functions ---------------------------------------------------------
				834	// Start generating code from the beginning of the buffer, discarding any code
				835	// and data that has already been emitted into the buffer.
				836	//
				837	// In order to avoid any accidental transfer of state, Reset DCHECKs that the
				838	// constant pool is not blocked.
				839	void Reset();
				840
				841	// GetCode emits any pending (non-emitted) code and fills the descriptor
				842	// desc. GetCode() is idempotent; it returns the same result if no other
				843	// Assembler functions are invoked in between GetCode() calls.
				844	//
				845	// The descriptor (desc) can be NULL. In that case, the code is finalized as
				846	// usual, but the descriptor is not populated.
				847	void GetCode(CodeDesc* desc);
				848
				849	// Insert the smallest number of nop instructions
				850	// possible to align the pc offset to a multiple
				851	// of m. m must be a power of 2 (>= 4).
				852	void Align(int m);
				853
				854	inline void Unreachable();
				855
				856	// Label --------------------------------------------------------------------
				857	// Bind a label to the current pc. Note that labels can only be bound once,
				858	// and if labels are linked to other instructions, they _must_ be bound
				859	// before they go out of scope.
				860	void bind(Label* label);
				861
				862
				863	// RelocInfo and pools ------------------------------------------------------
				864
				865	// Record relocation information for current pc_.
				866	void RecordRelocInfo(RelocInfo::Mode rmode, intptr_t data = 0);
				867
				868	// Return the address in the constant pool of the code target address used by
				869	// the branch/call instruction at pc.
				870	inline static Address target_pointer_address_at(Address pc);
				871
				872	// Read/Modify the code target address in the branch/call instruction at pc.
				873	inline static Address target_address_at(Address pc,
				874	ConstantPoolArray* constant_pool);
				875	inline static void set_target_address_at(Address pc,
				876	ConstantPoolArray* constant_pool,
				877	Address target,
				878	ICacheFlushMode icache_flush_mode =
				879	FLUSH_ICACHE_IF_NEEDED);
				880	static inline Address target_address_at(Address pc, Code* code);
				881	static inline void set_target_address_at(Address pc,
				882	Code* code,
				883	Address target,
				884	ICacheFlushMode icache_flush_mode =
				885	FLUSH_ICACHE_IF_NEEDED);
				886
				887	// Return the code target address at a call site from the return address of
				888	// that call in the instruction stream.
				889	inline static Address target_address_from_return_address(Address pc);
				890
				891	// Given the address of the beginning of a call, return the address in the
				892	// instruction stream that call will return from.
				893	inline static Address return_address_from_call_start(Address pc);
				894
				895	// Return the code target address of the patch debug break slot
				896	inline static Address break_address_from_return_address(Address pc);
				897
				898	// This sets the branch destination (which is in the constant pool on ARM).
				899	// This is for calls and branches within generated code.
				900	inline static void deserialization_set_special_target_at(
				901	Address constant_pool_entry, Code* code, Address target);
				902
				903	// All addresses in the constant pool are the same size as pointers.
				904	static const int kSpecialTargetSize = kPointerSize;
				905
				906	// The sizes of the call sequences emitted by MacroAssembler::Call.
				907	// Wherever possible, use MacroAssembler::CallSize instead of these constants,
				908	// as it will choose the correct value for a given relocation mode.
				909	//
				910	// Without relocation:
				911	// movz temp, #(target & 0x000000000000ffff)
				912	// movk temp, #(target & 0x00000000ffff0000)
				913	// movk temp, #(target & 0x0000ffff00000000)
				914	// blr temp
				915	//
				916	// With relocation:
				917	// ldr temp, =target
				918	// blr temp
				919	static const int kCallSizeWithoutRelocation = 4 * kInstructionSize;
				920	static const int kCallSizeWithRelocation = 2 * kInstructionSize;
				921
				922	// Size of the generated code in bytes
				923	uint64_t SizeOfGeneratedCode() const {  // Distance from buffer_ to the current pc_.
				924	DCHECK((pc_ >= buffer_) && (pc_ < (buffer_ + buffer_size_)));  // pc_ must lie in [buffer_, buffer_ + buffer_size_).
				925	return pc_ - buffer_;
				926	}
				927
				928	// Return the code size generated from label to the current position.
				929	uint64_t SizeOfCodeGeneratedSince(const Label* label) {  // Returns pc_offset() minus the label's position.
				930	DCHECK(label->is_bound());  // Checked before label->pos() is read below.
				931	DCHECK(pc_offset() >= label->pos());  // Keeps the difference below non-negative.
				932	DCHECK(pc_offset() < buffer_size_);  // The current offset must be smaller than the buffer size.
				933	return pc_offset() - label->pos();
				934	}
				935
				936	// Check the size of the code generated since the given label. This function
				937	// is used primarily to work around comparisons between signed and unsigned
				938	// quantities, since V8 uses both.
				939	// TODO(jbramley): Work out what sign to use for these things and if possible,
				940	// change things to be consistent.
				941	void AssertSizeOfCodeGeneratedSince(const Label* label, ptrdiff_t size) {  // The body consists only of DCHECKs.
				942	DCHECK(size >= 0);  // A negative size must not reach the unsigned cast below.
				943	DCHECK(static_cast<uint64_t>(size) == SizeOfCodeGeneratedSince(label));  // Compared as uint64_t, the return type of SizeOfCodeGeneratedSince.
				944	}
				945
				946	// Return the number of instructions generated from label to the
				947	// current position.
				948	int InstructionsGeneratedSince(const Label* label) {  // Code size since label, in units of kInstructionSize.
				949	return SizeOfCodeGeneratedSince(label) / kInstructionSize;  // The quotient is converted to int by the return type.
				950	}
				951
				952	// Number of instructions generated for the return sequence in
				953	// FullCodeGenerator::EmitReturnSequence.
				954	static const int kJSRetSequenceInstructions = 7;
				955	// Distance between start of patched return sequence and the emitted address
				956	// to jump to.
				957	static const int kPatchReturnSequenceAddressOffset = 0;
				958	static const int kPatchDebugBreakSlotAddressOffset = 0;
				959
				960	// Number of instructions necessary to be able to later patch it to a call.
				961	// See DebugCodegen::GenerateSlot() and
				962	// BreakLocationIterator::SetDebugBreakAtSlot().
				963	static const int kDebugBreakSlotInstructions = 4;
				964	static const int kDebugBreakSlotLength =
				965	kDebugBreakSlotInstructions * kInstructionSize;
				966
				967	static const int kPatchDebugBreakSlotReturnOffset = 2 * kInstructionSize;
				968
				969	// Prevent constant pool emission until EndBlockConstPool is called.
				970	// Calls to this function can be nested but must be followed by an equal
				971	// number of calls to EndBlockConstPool.
				972	void StartBlockConstPool();
				973
				974	// Resume constant pool emission. Needs to be called as many times as
				975	// StartBlockConstPool to have an effect.
				976	void EndBlockConstPool();
				977
				978	bool is_const_pool_blocked() const;
				979	static bool IsConstantPoolAt(Instruction* instr);
				980	static int ConstantPoolSizeAt(Instruction* instr);
				981	// See Assembler::CheckConstPool for more info.
				982	void EmitPoolGuard();
				983
				984	// Prevent veneer pool emission until EndBlockVeneerPool is called.
				985	// Calls to this function can be nested but must be followed by an equal
				986	// number of calls to EndBlockVeneerPool.
				987	void StartBlockVeneerPool();
				988
				989	// Resume veneer pool emission. Needs to be called as many times as
				990	// StartBlockVeneerPool to have an effect.
				991	void EndBlockVeneerPool();
				992
				993	bool is_veneer_pool_blocked() const {  // True while the nesting counter is positive.
				994	return veneer_pool_blocked_nesting_ > 0;
				995	}
				996
				997	// Block/resume emission of constant pools and veneer pools.
				998	void StartBlockPools() {  // Blocks both pool kinds with a single call.
				999	StartBlockConstPool();  // Constant pool first, then veneer pool.
				1000	StartBlockVeneerPool();
				1001	}
				1002	void EndBlockPools() {  // Ends blocking of both pool kinds with a single call.
				1003	EndBlockConstPool();  // Constant pool first, then veneer pool.
				1004	EndBlockVeneerPool();
				1005	}
				1006
				1007	// Debugging ----------------------------------------------------------------
				1008	PositionsRecorder* positions_recorder() { return &positions_recorder_; }  // Returns the address of the positions_recorder_ member.
				1009	void RecordComment(const char* msg);
				1010	int buffer_space() const;
				1011
				1012	// Mark address of the ExitJSFrame code.
				1013	void RecordJSReturn();
				1014
				1015	// Mark address of a debug break slot.
				1016	void RecordDebugBreakSlot();
				1017
				1018	// Record the emission of a constant pool.
				1019	//
				1020	// The emission of constant and veneer pools depends on the size of the code
				1021	// generated and the number of RelocInfo recorded.
				1022	// The Debug mechanism needs to map code offsets between two versions of a
				1023	// function, compiled with and without debugger support (see for example
				1024	// Debug::PrepareForBreakPoints()).
				1025	// Compiling functions with debugger support generates additional code
				1026	// (DebugCodegen::GenerateSlot()). This may affect the emission of the pools
				1027	// and cause the version of the code with debugger support to have pools
				1028	// generated in different places.
				1029	// Recording the position and size of emitted pools makes it possible to
				1030	// correctly compute the offset mappings between the different versions of a
				1031	// function in all situations.
				1032	//
				1033	// The parameter indicates the size of the pool (in bytes), including
				1034	// the marker and branch over the data.
				1035	void RecordConstPool(int size);
				1036
				1037
				1038	// Instruction set functions ------------------------------------------------
				1039
				1040	// Branch / Jump instructions.
				1041	// For branches, offsets are scaled, i.e. they are in instructions, not in bytes.
				1042	// Branch to register.
				1043	void br(const Register& xn);
				1044
				1045	// Branch-link to register.
				1046	void blr(const Register& xn);
				1047
				1048	// Branch to register with return hint.
				1049	void ret(const Register& xn = lr);
				1050
				1051	// Unconditional branch to label.
				1052	void b(Label* label);
				1053
				1054	// Conditional branch to label.
				1055	void b(Label* label, Condition cond);
				1056
				1057	// Unconditional branch to PC offset.
				1058	void b(int imm26);
				1059
				1060	// Conditional branch to PC offset.
				1061	void b(int imm19, Condition cond);
				1062
				1063	// Branch-link to label / pc offset.
				1064	void bl(Label* label);
				1065	void bl(int imm26);
				1066
				1067	// Compare and branch to label / pc offset if zero.
				1068	void cbz(const Register& rt, Label* label);
				1069	void cbz(const Register& rt, int imm19);
				1070
				1071	// Compare and branch to label / pc offset if not zero.
				1072	void cbnz(const Register& rt, Label* label);
				1073	void cbnz(const Register& rt, int imm19);
				1074
				1075	// Test bit and branch to label / pc offset if zero.
				1076	void tbz(const Register& rt, unsigned bit_pos, Label* label);
				1077	void tbz(const Register& rt, unsigned bit_pos, int imm14);
				1078
				1079	// Test bit and branch to label / pc offset if not zero.
				1080	void tbnz(const Register& rt, unsigned bit_pos, Label* label);
				1081	void tbnz(const Register& rt, unsigned bit_pos, int imm14);
				1082
				1083	// Address calculation instructions.
				1084	// Calculate a PC-relative address. Unlike for branches the offset in adr is
				1085	// unscaled (i.e. the result can be unaligned).
				1086	void adr(const Register& rd, Label* label);
				1087	void adr(const Register& rd, int imm21);
				1088
				1089	// Data Processing instructions.
				1090	// Add.
				1091	void add(const Register& rd,
				1092	const Register& rn,
				1093	const Operand& operand);
				1094
				1095	// Add and update status flags.
				1096	void adds(const Register& rd,
				1097	const Register& rn,
				1098	const Operand& operand);
				1099
				1100	// Compare negative.
				1101	void cmn(const Register& rn, const Operand& operand);
				1102
				1103	// Subtract.
				1104	void sub(const Register& rd,
				1105	const Register& rn,
				1106	const Operand& operand);
				1107
				1108	// Subtract and update status flags.
				1109	void subs(const Register& rd,
				1110	const Register& rn,
				1111	const Operand& operand);
				1112
				1113	// Compare.
				1114	void cmp(const Register& rn, const Operand& operand);
				1115
				1116	// Negate.
				1117	void neg(const Register& rd,
				1118	const Operand& operand);
				1119
				1120	// Negate and update status flags.
				1121	void negs(const Register& rd,
				1122	const Operand& operand);
				1123
				1124	// Add with carry bit.
				1125	void adc(const Register& rd,
				1126	const Register& rn,
				1127	const Operand& operand);
				1128
				1129	// Add with carry bit and update status flags.
				1130	void adcs(const Register& rd,
				1131	const Register& rn,
				1132	const Operand& operand);
				1133
				1134	// Subtract with carry bit.
				1135	void sbc(const Register& rd,
				1136	const Register& rn,
				1137	const Operand& operand);
				1138
				1139	// Subtract with carry bit and update status flags.
				1140	void sbcs(const Register& rd,
				1141	const Register& rn,
				1142	const Operand& operand);
				1143
				1144	// Negate with carry bit.
				1145	void ngc(const Register& rd,
				1146	const Operand& operand);
				1147
				1148	// Negate with carry bit and update status flags.
				1149	void ngcs(const Register& rd,
				1150	const Operand& operand);
				1151
				1152	// Logical instructions.
				1153	// Bitwise and (A & B).
				1154	void and_(const Register& rd,
				1155	const Register& rn,
				1156	const Operand& operand);
				1157
				1158	// Bitwise and (A & B) and update status flags.
				1159	void ands(const Register& rd,
				1160	const Register& rn,
				1161	const Operand& operand);
				1162
				1163	// Bit test, and set flags.
				1164	void tst(const Register& rn, const Operand& operand);
				1165
				1166	// Bit clear (A & ~B).
				1167	void bic(const Register& rd,
				1168	const Register& rn,
				1169	const Operand& operand);
				1170
				1171	// Bit clear (A & ~B) and update status flags.
				1172	void bics(const Register& rd,
				1173	const Register& rn,
				1174	const Operand& operand);
				1175
				1176	// Bitwise or (A | B).
				1177	void orr(const Register& rd, const Register& rn, const Operand& operand);
				1178
				1179	// Bitwise or-not (A | ~B).
				1180	void orn(const Register& rd, const Register& rn, const Operand& operand);
				1181
				1182	// Bitwise eor/xor (A ^ B).
				1183	void eor(const Register& rd, const Register& rn, const Operand& operand);
				1184
				1185	// Bitwise enor/xnor (A ^ ~B).
				1186	void eon(const Register& rd, const Register& rn, const Operand& operand);
				1187
				1188	// Logical shift left variable.
				1189	void lslv(const Register& rd, const Register& rn, const Register& rm);
				1190
				1191	// Logical shift right variable.
				1192	void lsrv(const Register& rd, const Register& rn, const Register& rm);
				1193
				1194	// Arithmetic shift right variable.
				1195	void asrv(const Register& rd, const Register& rn, const Register& rm);
				1196
				1197	// Rotate right variable.
				1198	void rorv(const Register& rd, const Register& rn, const Register& rm);
				1199
				1200	// Bitfield instructions.
				1201	// Bitfield move.
				1202	void bfm(const Register& rd,
				1203	const Register& rn,
				1204	unsigned immr,
				1205	unsigned imms);
				1206
				1207	// Signed bitfield move.
				1208	void sbfm(const Register& rd,
				1209	const Register& rn,
				1210	unsigned immr,
				1211	unsigned imms);
				1212
				1213	// Unsigned bitfield move.
				1214	void ubfm(const Register& rd,
				1215	const Register& rn,
				1216	unsigned immr,
				1217	unsigned imms);
				1218
				1219	// Bfm aliases.
				1220	// Bitfield insert.
				1221	void bfi(const Register& rd,  // Emits bfm with immr/imms derived from lsb and width.
				1222	const Register& rn,
				1223	unsigned lsb,
				1224	unsigned width) {
				1225	DCHECK(width >= 1);  // width is unsigned, so width - 1 below would wrap for 0.
				1226	DCHECK(lsb + width <= rn.SizeInBits());  // The field must fit inside the register.
				1227	bfm(rd, rn, (rd.SizeInBits() - lsb) & (rd.SizeInBits() - 1), width - 1);  // immr = (size - lsb) masked with (size - 1); for a power-of-two size, lsb == 0 gives 0. imms = width - 1.
				1228	}
				1229
				1230	// Bitfield extract and insert low.
				1231	void bfxil(const Register& rd,  // Emits bfm with immr/imms derived from lsb and width.
				1232	const Register& rn,
				1233	unsigned lsb,
				1234	unsigned width) {
				1235	DCHECK(width >= 1);  // width is unsigned, so lsb + width - 1 below would be wrong for 0.
				1236	DCHECK(lsb + width <= rn.SizeInBits());  // The field must fit inside the register.
				1237	bfm(rd, rn, lsb, lsb + width - 1);  // immr = lsb; imms = bit index of the top of the field.
				1238	}
				1239
				1240	// Sbfm aliases.
				1241	// Arithmetic shift right.
				1242	void asr(const Register& rd, const Register& rn, unsigned shift) {  // Immediate shift, emitted through sbfm.
				1243	DCHECK(shift < rd.SizeInBits());  // The shift amount must be smaller than the register size.
				1244	sbfm(rd, rn, shift, rd.SizeInBits() - 1);  // immr = shift; imms = index of the top bit of rd.
				1245	}
				1246
				1247	// Signed bitfield insert in zero.
				1248	void sbfiz(const Register& rd,  // Emits sbfm with immr/imms derived from lsb and width.
				1249	const Register& rn,
				1250	unsigned lsb,
				1251	unsigned width) {
				1252	DCHECK(width >= 1);  // width is unsigned, so width - 1 below would wrap for 0.
				1253	DCHECK(lsb + width <= rn.SizeInBits());  // The field must fit inside the register.
				1254	sbfm(rd, rn, (rd.SizeInBits() - lsb) & (rd.SizeInBits() - 1), width - 1);  // immr = (size - lsb) masked with (size - 1); for a power-of-two size, lsb == 0 gives 0. imms = width - 1.
				1255	}
				1256
				1257	// Signed bitfield extract.
				1258	void sbfx(const Register& rd,  // Emits sbfm with immr/imms derived from lsb and width.
				1259	const Register& rn,
				1260	unsigned lsb,
				1261	unsigned width) {
				1262	DCHECK(width >= 1);  // width is unsigned, so lsb + width - 1 below would be wrong for 0.
				1263	DCHECK(lsb + width <= rn.SizeInBits());  // The field must fit inside the register.
				1264	sbfm(rd, rn, lsb, lsb + width - 1);  // immr = lsb; imms = bit index of the top of the field.
				1265	}
				1266
				1267	// Signed extend byte.
				1268	void sxtb(const Register& rd, const Register& rn) {  // sbfm with fixed immediates.
				1269	sbfm(rd, rn, 0, 7);  // immr = 0; imms = 7, the top bit index of the low byte.
				1270	}
				1271
				1272	// Signed extend halfword.
				1273	void sxth(const Register& rd, const Register& rn) {  // sbfm with fixed immediates.
				1274	sbfm(rd, rn, 0, 15);  // immr = 0; imms = 15, the top bit index of the low half-word.
				1275	}
				1276
				1277	// Signed extend word.
				1278	void sxtw(const Register& rd, const Register& rn) {  // sbfm with fixed immediates.
				1279	sbfm(rd, rn, 0, 31);  // immr = 0; imms = 31, the top bit index of the low word.
				1280	}
				1281
				1282	// Ubfm aliases.
				1283	// Logical shift left.
				1284	void lsl(const Register& rd, const Register& rn, unsigned shift) {  // Immediate shift, emitted through ubfm.
				1285	unsigned reg_size = rd.SizeInBits();  // Register size in bits, taken from the destination.
				1286	DCHECK(shift < reg_size);  // Also keeps reg_size - shift - 1 below from wrapping.
				1287	ubfm(rd, rn, (reg_size - shift) % reg_size, reg_size - shift - 1);  // The modulo maps shift == 0 to immr == 0.
				1288	}
				1289
				1290	// Logical shift right.
				1291	void lsr(const Register& rd, const Register& rn, unsigned shift) {  // Immediate shift, emitted through ubfm.
				1292	DCHECK(shift < rd.SizeInBits());  // The shift amount must be smaller than the register size.
				1293	ubfm(rd, rn, shift, rd.SizeInBits() - 1);  // immr = shift; imms = index of the top bit of rd.
				1294	}
				1295
				1296	// Unsigned bitfield insert in zero.
				1297	void ubfiz(const Register& rd,  // Emits ubfm with immr/imms derived from lsb and width.
				1298	const Register& rn,
				1299	unsigned lsb,
				1300	unsigned width) {
				1301	DCHECK(width >= 1);  // width is unsigned, so width - 1 below would wrap for 0.
				1302	DCHECK(lsb + width <= rn.SizeInBits());  // The field must fit inside the register.
				1303	ubfm(rd, rn, (rd.SizeInBits() - lsb) & (rd.SizeInBits() - 1), width - 1);  // immr = (size - lsb) masked with (size - 1); for a power-of-two size, lsb == 0 gives 0. imms = width - 1.
				1304	}
				1305
				1306	// Unsigned bitfield extract.
				1307	void ubfx(const Register& rd,  // Emits ubfm with immr/imms derived from lsb and width.
				1308	const Register& rn,
				1309	unsigned lsb,
				1310	unsigned width) {
				1311	DCHECK(width >= 1);  // width is unsigned, so lsb + width - 1 below would be wrong for 0.
				1312	DCHECK(lsb + width <= rn.SizeInBits());  // The field must fit inside the register.
				1313	ubfm(rd, rn, lsb, lsb + width - 1);  // immr = lsb; imms = bit index of the top of the field.
				1314	}
				1315
				1316	// Unsigned extend byte.
				1317	void uxtb(const Register& rd, const Register& rn) {  // ubfm with fixed immediates.
				1318	ubfm(rd, rn, 0, 7);  // immr = 0; imms = 7, the top bit index of the low byte.
				1319	}
				1320
				1321	// Unsigned extend halfword.
				1322	void uxth(const Register& rd, const Register& rn) {  // ubfm with fixed immediates.
				1323	ubfm(rd, rn, 0, 15);  // immr = 0; imms = 15, the top bit index of the low half-word.
				1324	}
				1325
				1326	// Unsigned extend word.
				1327	void uxtw(const Register& rd, const Register& rn) {  // ubfm with fixed immediates.
				1328	ubfm(rd, rn, 0, 31);  // immr = 0; imms = 31, the top bit index of the low word.
				1329	}
				1330
				1331	// Extract.
				1332	void extr(const Register& rd,
				1333	const Register& rn,
				1334	const Register& rm,
				1335	unsigned lsb);
				1336
				1337	// Conditional select: rd = cond ? rn : rm.
				1338	void csel(const Register& rd,
				1339	const Register& rn,
				1340	const Register& rm,
				1341	Condition cond);
				1342
				1343	// Conditional select increment: rd = cond ? rn : rm + 1.
				1344	void csinc(const Register& rd,
				1345	const Register& rn,
				1346	const Register& rm,
				1347	Condition cond);
				1348
				1349	// Conditional select inversion: rd = cond ? rn : ~rm.
				1350	void csinv(const Register& rd,
				1351	const Register& rn,
				1352	const Register& rm,
				1353	Condition cond);
				1354
				1355	// Conditional select negation: rd = cond ? rn : -rm.
				1356	void csneg(const Register& rd,
				1357	const Register& rn,
				1358	const Register& rm,
				1359	Condition cond);
				1360
				1361	// Conditional set: rd = cond ? 1 : 0.
				1362	void cset(const Register& rd, Condition cond);
				1363
				1364	// Conditional set minus: rd = cond ? -1 : 0.
				1365	void csetm(const Register& rd, Condition cond);
				1366
				1367	// Conditional increment: rd = cond ? rn + 1 : rn.
				1368	void cinc(const Register& rd, const Register& rn, Condition cond);
				1369
				1370	// Conditional invert: rd = cond ? ~rn : rn.
				1371	void cinv(const Register& rd, const Register& rn, Condition cond);
				1372
				1373	// Conditional negate: rd = cond ? -rn : rn.
				1374	void cneg(const Register& rd, const Register& rn, Condition cond);
				1375
				1376	// Extr aliases.
				1377	void ror(const Register& rd, const Register& rs, unsigned shift) {  // Immediate rotate, emitted through extr.
				1378	extr(rd, rs, rs, shift);  // rs is passed as both rn and rm of extr; shift is passed as lsb.
				1379	}
				1380
				1381	// Conditional comparison.
				1382	// Conditional compare negative.
				1383	void ccmn(const Register& rn,
				1384	const Operand& operand,
				1385	StatusFlags nzcv,
				1386	Condition cond);
				1387
				1388	// Conditional compare.
				1389	void ccmp(const Register& rn,
				1390	const Operand& operand,
				1391	StatusFlags nzcv,
				1392	Condition cond);
				1393
				1394	// Multiplication.
				1395	// 32 x 32 -> 32-bit and 64 x 64 -> 64-bit multiply.
				1396	void mul(const Register& rd, const Register& rn, const Register& rm);
				1397
				1398	// 32 + 32 x 32 -> 32-bit and 64 + 64 x 64 -> 64-bit multiply accumulate.
				1399	void madd(const Register& rd,
				1400	const Register& rn,
				1401	const Register& rm,
				1402	const Register& ra);
				1403
				1404	// -(32 x 32) -> 32-bit and -(64 x 64) -> 64-bit multiply.
				1405	void mneg(const Register& rd, const Register& rn, const Register& rm);
				1406
				1407	// 32 - 32 x 32 -> 32-bit and 64 - 64 x 64 -> 64-bit multiply subtract.
				1408	void msub(const Register& rd,
				1409	const Register& rn,
				1410	const Register& rm,
				1411	const Register& ra);
				1412
				1413	// 32 x 32 -> 64-bit multiply.
				1414	void smull(const Register& rd, const Register& rn, const Register& rm);
				1415
				1416	// Xd = bits<127:64> of Xn * Xm.
				1417	void smulh(const Register& rd, const Register& rn, const Register& rm);
				1418
				1419	// Signed 32 x 32 -> 64-bit multiply and accumulate.
				1420	void smaddl(const Register& rd,
				1421	const Register& rn,
				1422	const Register& rm,
				1423	const Register& ra);
				1424
				1425	// Unsigned 32 x 32 -> 64-bit multiply and accumulate.
				1426	void umaddl(const Register& rd,
				1427	const Register& rn,
				1428	const Register& rm,
				1429	const Register& ra);
				1430
				1431	// Signed 32 x 32 -> 64-bit multiply and subtract.
				1432	void smsubl(const Register& rd,
				1433	const Register& rn,
				1434	const Register& rm,
				1435	const Register& ra);
				1436
				1437	// Unsigned 32 x 32 -> 64-bit multiply and subtract.
				1438	void umsubl(const Register& rd,
				1439	const Register& rn,
				1440	const Register& rm,
				1441	const Register& ra);
				1442
				1443	// Signed integer divide.
				1444	void sdiv(const Register& rd, const Register& rn, const Register& rm);
				1445
				1446	// Unsigned integer divide.
				1447	void udiv(const Register& rd, const Register& rn, const Register& rm);
				1448
				1449	// Bit count, bit reverse and endian reverse.
				1450	void rbit(const Register& rd, const Register& rn);
				1451	void rev16(const Register& rd, const Register& rn);
				1452	void rev32(const Register& rd, const Register& rn);
				1453	void rev(const Register& rd, const Register& rn);
				1454	void clz(const Register& rd, const Register& rn);
				1455	void cls(const Register& rd, const Register& rn);
				1456
				1457	// Memory instructions.
				1458
				1459	// Load integer or FP register.
				1460	void ldr(const CPURegister& rt, const MemOperand& src);
				1461
				1462	// Store integer or FP register.
				1463	void str(const CPURegister& rt, const MemOperand& dst);
				1464
				1465	// Load word with sign extension.
				1466	void ldrsw(const Register& rt, const MemOperand& src);
				1467
				1468	// Load byte.
				1469	void ldrb(const Register& rt, const MemOperand& src);
				1470
				1471	// Store byte.
				1472	void strb(const Register& rt, const MemOperand& dst);
				1473
				1474	// Load byte with sign extension.
				1475	void ldrsb(const Register& rt, const MemOperand& src);
				1476
				1477	// Load half-word.
				1478	void ldrh(const Register& rt, const MemOperand& src);
				1479
				1480	// Store half-word.
				1481	void strh(const Register& rt, const MemOperand& dst);
				1482
				1483	// Load half-word with sign extension.
				1484	void ldrsh(const Register& rt, const MemOperand& src);
				1485
				1486	// Load integer or FP register pair.
				1487	void ldp(const CPURegister& rt, const CPURegister& rt2,
				1488	const MemOperand& src);
				1489
				1490	// Store integer or FP register pair.
				1491	void stp(const CPURegister& rt, const CPURegister& rt2,
				1492	const MemOperand& dst);
				1493
				1494	// Load word pair with sign extension.
				1495	void ldpsw(const Register& rt, const Register& rt2, const MemOperand& src);
				1496
				1497	// Load integer or FP register pair, non-temporal.
				1498	void ldnp(const CPURegister& rt, const CPURegister& rt2,
				1499	const MemOperand& src);
				1500
				1501	// Store integer or FP register pair, non-temporal.
				1502	void stnp(const CPURegister& rt, const CPURegister& rt2,
				1503	const MemOperand& dst);
				1504
				1505	// Load literal to register from a pc relative address.
				1506	void ldr_pcrel(const CPURegister& rt, int imm19);
				1507
				1508	// Load literal to register.
				1509	void ldr(const CPURegister& rt, const Immediate& imm);
				1510
				1511	// Move instructions. The default shift of -1 indicates that the move
				1512	// instruction will calculate an appropriate 16-bit immediate and left shift
				1513	// that is equal to the 64-bit immediate argument. If an explicit left shift
				1514	// is specified (0, 16, 32 or 48), the immediate must be a 16-bit value.
				1515	//
				1516	// For movk, an explicit shift can be used to indicate which half word should
				1517	// be overwritten, eg. movk(x0, 0, 0) will overwrite the least-significant
				1518	// half word with zero, whereas movk(x0, 0, 48) will overwrite the
				1519	// most-significant.
				1520
				1521	// Move and keep.
				1522	void movk(const Register& rd, uint64_t imm, int shift = -1) {  // shift defaults to -1 when the caller gives none.
				1523	MoveWide(rd, imm, shift, MOVK);  // Forwards all arguments to MoveWide, with MOVK as the last argument.
				1524	}
				1525
				1526	// Move with NOT (inverted immediate).
				1527	void movn(const Register& rd, uint64_t imm, int shift = -1) {  // shift defaults to -1 when the caller gives none.
				1528	MoveWide(rd, imm, shift, MOVN);  // Forwards all arguments to MoveWide, with MOVN as the last argument.
				1529	}
				1530
				1531	// Move with zero.
				1532	void movz(const Register& rd, uint64_t imm, int shift = -1) {  // shift defaults to -1 when the caller gives none.
				1533	MoveWide(rd, imm, shift, MOVZ);  // Forwards all arguments to MoveWide, with MOVZ as the last argument.
				1534	}
				1535
				1536	// Misc instructions.
				1537	// Monitor debug-mode breakpoint.
				1538	void brk(int code);
				1539
				1540	// Halting debug-mode breakpoint.
				1541	void hlt(int code);
				1542
				1543	// Move register to register.
				1544	void mov(const Register& rd, const Register& rn);
				1545
				1546	// Move NOT(operand) to register.
				1547	void mvn(const Register& rd, const Operand& operand);
				1548
				1549	// System instructions.
				1550	// Move to register from system register.
				1551	void mrs(const Register& rt, SystemRegister sysreg);
				1552
				1553	// Move from register to system register.
				1554	void msr(SystemRegister sysreg, const Register& rt);
				1555
				1556	// System hint.
				1557	void hint(SystemHint code);
				1558
				1559	// Data memory barrier
				1560	void dmb(BarrierDomain domain, BarrierType type);
				1561
				1562	// Data synchronization barrier
				1563	void dsb(BarrierDomain domain, BarrierType type);
				1564
				1565	// Instruction synchronization barrier
				1566	void isb();
				1567
				1568	// Alias for system instructions.
				1569	void nop() { hint(NOP); }  // Forwards to hint() with the NOP hint code.
				1570
				1571	// Different nop operations are used by the code generator to detect certain
				1572	// states of the generated code.
				1573	enum NopMarkerTypes {  // Values are passed to nop(NopMarkerTypes), which hands them to Register::XRegFromCode.
				1574	DEBUG_BREAK_NOP,  // First enumerator, so its value is 0.
				1575	INTERRUPT_CODE_NOP,  // Value 1.
				1576	ADR_FAR_NOP,  // Value 2.
				1577	FIRST_NOP_MARKER = DEBUG_BREAK_NOP,  // Lower bound of the marker range.
				1578	LAST_NOP_MARKER = ADR_FAR_NOP  // Upper bound of the marker range.
				1579	};
				1580
				1581	void nop(NopMarkerTypes n) {  // Marker nop: a mov of a register onto itself, with the register chosen by n.
				1582	DCHECK((FIRST_NOP_MARKER <= n) && (n <= LAST_NOP_MARKER));  // n must lie within the declared marker range.
				1583	mov(Register::XRegFromCode(n), Register::XRegFromCode(n));  // Same register as destination and source.
				1584	}
				1585
				1586	// FP instructions.
				1587	// Move immediate to FP register.
				1588	void fmov(FPRegister fd, double imm);
				1589	void fmov(FPRegister fd, float imm);
				1590
				1591	// Move FP register to register.
				1592	void fmov(Register rd, FPRegister fn);
				1593
				1594	// Move register to FP register.
				1595	void fmov(FPRegister fd, Register rn);
				1596
				1597	// Move FP register to FP register.
				1598	void fmov(FPRegister fd, FPRegister fn);
				1599
				1600	// FP add.
				1601	void fadd(const FPRegister& fd, const FPRegister& fn, const FPRegister& fm);
				1602
				1603	// FP subtract.
				1604	void fsub(const FPRegister& fd, const FPRegister& fn, const FPRegister& fm);
				1605
				1606	// FP multiply.
				1607	void fmul(const FPRegister& fd, const FPRegister& fn, const FPRegister& fm);
				1608
				1609	// FP fused multiply and add.
				1610	void fmadd(const FPRegister& fd,
				1611	const FPRegister& fn,
				1612	const FPRegister& fm,
				1613	const FPRegister& fa);
				1614
				1615	// FP fused multiply and subtract.
				1616	void fmsub(const FPRegister& fd,
				1617	const FPRegister& fn,
				1618	const FPRegister& fm,
				1619	const FPRegister& fa);
				1620
				1621	// FP fused multiply, add and negate.
				1622	void fnmadd(const FPRegister& fd,
				1623	const FPRegister& fn,
				1624	const FPRegister& fm,
				1625	const FPRegister& fa);
				1626
				1627	// FP fused multiply, subtract and negate.
				1628	void fnmsub(const FPRegister& fd,
				1629	const FPRegister& fn,
				1630	const FPRegister& fm,
				1631	const FPRegister& fa);
				1632
				1633	// FP divide.
				1634	void fdiv(const FPRegister& fd, const FPRegister& fn, const FPRegister& fm);
				1635
				1636	// FP maximum.
				1637	void fmax(const FPRegister& fd, const FPRegister& fn, const FPRegister& fm);
				1638
				1639	// FP minimum.
				1640	void fmin(const FPRegister& fd, const FPRegister& fn, const FPRegister& fm);
				1641
				1642	// FP maximum number.
				1643	void fmaxnm(const FPRegister& fd, const FPRegister& fn, const FPRegister& fm);
				1644
				1645	// FP minimum number.
				1646	void fminnm(const FPRegister& fd, const FPRegister& fn, const FPRegister& fm);
				1647
				1648	// FP absolute.
				1649	void fabs(const FPRegister& fd, const FPRegister& fn);
				1650
				1651	// FP negate.
				1652	void fneg(const FPRegister& fd, const FPRegister& fn);
				1653
				1654	// FP square root.
				1655	void fsqrt(const FPRegister& fd, const FPRegister& fn);
				1656
				1657	// FP round to integer (nearest with ties to away).
				1658	void frinta(const FPRegister& fd, const FPRegister& fn);
				1659
				1660	// FP round to integer (toward minus infinity).
				1661	void frintm(const FPRegister& fd, const FPRegister& fn);
				1662
				1663	// FP round to integer (nearest with ties to even).
				1664	void frintn(const FPRegister& fd, const FPRegister& fn);
				1665
Emily Bernier	d0a1eb7	2015-03-24 16:35:39 -0400	[diff] [blame^]	1666	// FP round to integer (towards plus infinity).
				1667	void frintp(const FPRegister& fd, const FPRegister& fn);
				1668
Ben Murdoch	b8a8cc1	2014-11-26 15:28:44 +0000	[diff] [blame]	1669	// FP round to integer (towards zero.)
				1670	void frintz(const FPRegister& fd, const FPRegister& fn);
				1671
				1672	// FP compare registers.
				1673	void fcmp(const FPRegister& fn, const FPRegister& fm);
				1674
				1675	// FP compare immediate.
				1676	void fcmp(const FPRegister& fn, double value);
				1677
				1678	// FP conditional compare.
				1679	void fccmp(const FPRegister& fn,
				1680	const FPRegister& fm,
				1681	StatusFlags nzcv,
				1682	Condition cond);
				1683
				1684	// FP conditional select.
				1685	void fcsel(const FPRegister& fd,
				1686	const FPRegister& fn,
				1687	const FPRegister& fm,
				1688	Condition cond);
				1689
				1690	// Common FP Convert function
				1691	void FPConvertToInt(const Register& rd,
				1692	const FPRegister& fn,
				1693	FPIntegerConvertOp op);
				1694
				1695	// FP convert between single and double precision.
				1696	void fcvt(const FPRegister& fd, const FPRegister& fn);
				1697
				1698	// Convert FP to unsigned integer (nearest with ties to away).
				1699	void fcvtau(const Register& rd, const FPRegister& fn);
				1700
				1701	// Convert FP to signed integer (nearest with ties to away).
				1702	void fcvtas(const Register& rd, const FPRegister& fn);
				1703
				1704	// Convert FP to unsigned integer (round towards -infinity).
				1705	void fcvtmu(const Register& rd, const FPRegister& fn);
				1706
				1707	// Convert FP to signed integer (round towards -infinity).
				1708	void fcvtms(const Register& rd, const FPRegister& fn);
				1709
				1710	// Convert FP to unsigned integer (nearest with ties to even).
				1711	void fcvtnu(const Register& rd, const FPRegister& fn);
				1712
				1713	// Convert FP to signed integer (nearest with ties to even).
				1714	void fcvtns(const Register& rd, const FPRegister& fn);
				1715
				1716	// Convert FP to unsigned integer (round towards zero).
				1717	void fcvtzu(const Register& rd, const FPRegister& fn);
				1718
				1719	// Convert FP to signed integer (round towards zero).
				1720	void fcvtzs(const Register& rd, const FPRegister& fn);
				1721
				1722	// Convert signed integer or fixed point to FP.
				1723	void scvtf(const FPRegister& fd, const Register& rn, unsigned fbits = 0);
				1724
				1725	// Convert unsigned integer or fixed point to FP.
				1726	void ucvtf(const FPRegister& fd, const Register& rn, unsigned fbits = 0);
				1727
				1728	// Instruction functions used only for test, debug, and patching.
				1729	// Emit raw instructions in the instruction stream.
				1730	void dci(Instr raw_inst) { Emit(raw_inst); }
				1731
				1732	// Emit 8 bits of data in the instruction stream.
				1733	void dc8(uint8_t data) { EmitData(&data, sizeof(data)); }
				1734
				1735	// Emit 32 bits of data in the instruction stream.
				1736	void dc32(uint32_t data) { EmitData(&data, sizeof(data)); }
				1737
				1738	// Emit 64 bits of data in the instruction stream.
				1739	void dc64(uint64_t data) { EmitData(&data, sizeof(data)); }
				1740
				1741	// Copy a string into the instruction stream, including the terminating NULL
				1742	// character. The instruction pointer (pc_) is then aligned correctly for
				1743	// subsequent instructions.
				1744	void EmitStringData(const char* string);
				1745
				1746	// Pseudo-instructions ------------------------------------------------------
				1747
				1748	// Parameters are described in arm64/instructions-arm64.h.
				1749	void debug(const char* message, uint32_t code, Instr params = BREAK);
				1750
				1751	// Required by V8: dd() and db() forward to dc32() and dc8() respectively.
				1752	void dd(uint32_t data) { dc32(data); }
				1753	void db(uint8_t data) { dc8(data); }
				1754
				1755	// Code generation helpers --------------------------------------------------
				1756
				1757	bool IsConstPoolEmpty() const { return constpool_.IsEmpty(); }  // Reports whether constpool_ is empty.
				1758
				1759	Instruction* pc() const { return Instruction::Cast(pc_); }  // pc_ viewed as an Instruction*.
				1760
				1761	Instruction* InstructionAt(int offset) const {  // offset is in bytes from buffer_.
				1762	return reinterpret_cast<Instruction*>(buffer_ + offset);
				1763	}
				1764
				1765	ptrdiff_t InstructionOffset(Instruction* instr) const {  // Byte distance of instr from buffer_.
				1766	return reinterpret_cast<byte*>(instr) - buffer_;
				1767	}
				1768
				1769	// Register encoding: shift the register code into the named field; kSPRegInternalCode is DCHECKed out.
				1770	static Instr Rd(CPURegister rd) {
				1771	DCHECK(rd.code() != kSPRegInternalCode);
				1772	return rd.code() << Rd_offset;
				1773	}
				1774
				1775	static Instr Rn(CPURegister rn) {
				1776	DCHECK(rn.code() != kSPRegInternalCode);
				1777	return rn.code() << Rn_offset;
				1778	}
				1779
				1780	static Instr Rm(CPURegister rm) {
				1781	DCHECK(rm.code() != kSPRegInternalCode);
				1782	return rm.code() << Rm_offset;
				1783	}
				1784
				1785	static Instr Ra(CPURegister ra) {
				1786	DCHECK(ra.code() != kSPRegInternalCode);
				1787	return ra.code() << Ra_offset;
				1788	}
				1789
				1790	static Instr Rt(CPURegister rt) {
				1791	DCHECK(rt.code() != kSPRegInternalCode);
				1792	return rt.code() << Rt_offset;
				1793	}
				1794
				1795	static Instr Rt2(CPURegister rt2) {
				1796	DCHECK(rt2.code() != kSPRegInternalCode);
				1797	return rt2.code() << Rt2_offset;
				1798	}
				1799
				1800	// These encoding functions allow the stack pointer to be encoded, and
				1801	// disallow the zero register. The code is masked with kRegCodeMask before shifting.
				1802	static Instr RdSP(Register rd) {
				1803	DCHECK(!rd.IsZero());
				1804	return (rd.code() & kRegCodeMask) << Rd_offset;
				1805	}
				1806
				1807	static Instr RnSP(Register rn) {
				1808	DCHECK(!rn.IsZero());
				1809	return (rn.code() & kRegCodeMask) << Rn_offset;
				1810	}
				1811
				1812	// Flags encoding.
				1813	inline static Instr Flags(FlagsUpdate S);
				1814	inline static Instr Cond(Condition cond);
				1815
				1816	// PC-relative address encoding.
				1817	inline static Instr ImmPCRelAddress(int imm21);
				1818
				1819	// Branch encoding.
				1820	inline static Instr ImmUncondBranch(int imm26);
				1821	inline static Instr ImmCondBranch(int imm19);
				1822	inline static Instr ImmCmpBranch(int imm19);
				1823	inline static Instr ImmTestBranch(int imm14);
				1824	inline static Instr ImmTestBranchBit(unsigned bit_pos);
				1825
				1826	// Data Processing encoding.
				1827	inline static Instr SF(Register rd);
				1828	inline static Instr ImmAddSub(int64_t imm);
				1829	inline static Instr ImmS(unsigned imms, unsigned reg_size);
				1830	inline static Instr ImmR(unsigned immr, unsigned reg_size);
				1831	inline static Instr ImmSetBits(unsigned imms, unsigned reg_size);
				1832	inline static Instr ImmRotate(unsigned immr, unsigned reg_size);
				1833	inline static Instr ImmLLiteral(int imm19);
				1834	inline static Instr BitN(unsigned bitn, unsigned reg_size);
				1835	inline static Instr ShiftDP(Shift shift);
				1836	inline static Instr ImmDPShift(unsigned amount);
				1837	inline static Instr ExtendMode(Extend extend);
				1838	inline static Instr ImmExtendShift(unsigned left_shift);
				1839	inline static Instr ImmCondCmp(unsigned imm);
				1840	inline static Instr Nzcv(StatusFlags nzcv);
				1841
				1842	static bool IsImmAddSub(int64_t immediate);
				1843	static bool IsImmLogical(uint64_t value,
				1844	unsigned width,
				1845	unsigned* n,
				1846	unsigned* imm_s,
				1847	unsigned* imm_r);
				1848
				1849	// MemOperand offset encoding.
				1850	inline static Instr ImmLSUnsigned(int imm12);
				1851	inline static Instr ImmLS(int imm9);
				1852	inline static Instr ImmLSPair(int imm7, LSDataSize size);
				1853	inline static Instr ImmShiftLS(unsigned shift_amount);
				1854	inline static Instr ImmException(int imm16);
				1855	inline static Instr ImmSystemRegister(int imm15);
				1856	inline static Instr ImmHint(int imm7);
				1857	inline static Instr ImmBarrierDomain(int imm2);
				1858	inline static Instr ImmBarrierType(int imm2);
				1859	inline static LSDataSize CalcLSDataSize(LoadStoreOp op);
				1860
				1861	static bool IsImmLSUnscaled(int64_t offset);
				1862	static bool IsImmLSScaled(int64_t offset, LSDataSize size);
				1863
				1864	// Move immediates encoding.
				1865	inline static Instr ImmMoveWide(uint64_t imm);
				1866	inline static Instr ShiftMoveWide(int64_t shift);
				1867
				1868	// FP Immediates.
				1869	static Instr ImmFP32(float imm);
				1870	static Instr ImmFP64(double imm);
				1871	inline static Instr FPScale(unsigned scale);
				1872
				1873	// FP register type.
				1874	inline static Instr FPType(FPRegister fd);
				1875
				1876	// Scope object: calls StartBlockConstPool() on entry and EndBlockConstPool() on exit.
				1877	class BlockConstPoolScope {
				1878	public:
				1879	explicit BlockConstPoolScope(Assembler* assem) : assem_(assem) {
				1880	assem_->StartBlockConstPool();
				1881	}
				1882	~BlockConstPoolScope() {
				1883	assem_->EndBlockConstPool();
				1884	}
				1885
				1886	private:
				1887	Assembler* assem_;
				1888
				1889	DISALLOW_IMPLICIT_CONSTRUCTORS(BlockConstPoolScope);
				1890	};
				1891
				1892	// Check if it is time to emit a constant pool.
				1893	void CheckConstPool(bool force_emit, bool require_jump);
				1894
				1895	// Allocate a constant pool of the correct size for the generated code.
				1896	Handle<ConstantPoolArray> NewConstantPool(Isolate* isolate);
				1897
				1898	// Generate the constant pool for the generated code.
				1899	void PopulateConstantPool(ConstantPoolArray* constant_pool);
				1900
				1901	// Returns true if we should emit a veneer as soon as possible for a branch
				1902	// which can reach at most the specified pc.
				1903	bool ShouldEmitVeneer(int max_reachable_pc,
				1904	int margin = kVeneerDistanceMargin);
				1905	bool ShouldEmitVeneers(int margin = kVeneerDistanceMargin) {
				1906	return ShouldEmitVeneer(unresolved_branches_first_limit(), margin);
				1907	}
				1908
				1909	// The maximum code size generated for a veneer. Currently one branch
				1910	// instruction. This is for code size checking purposes, and can be extended
				1911	// in the future for example if we decide to add nops between the veneers.
				1912	static const int kMaxVeneerCodeSize = 1 * kInstructionSize;
				1913
				1914	void RecordVeneerPool(int location_offset, int size);
				1915	// Emits veneers for branches that are approaching their maximum range.
				1916	// If need_protection is true, the veneers are protected by a branch jumping
				1917	// over the code.
				1918	void EmitVeneers(bool force_emit, bool need_protection,
				1919	int margin = kVeneerDistanceMargin);
				1920	void EmitVeneersGuard() { EmitPoolGuard(); }
				1921	// Checks whether veneers need to be emitted at this point.
				1922	// If force_emit is set, a veneer is generated for all unresolved branches.
				1923	void CheckVeneerPool(bool force_emit, bool require_jump,
				1924	int margin = kVeneerDistanceMargin);
				1925
				1926	class BlockPoolsScope {  // Scope object: StartBlockPools() on entry, EndBlockPools() on exit.
				1927	public:
				1928	explicit BlockPoolsScope(Assembler* assem) : assem_(assem) {
				1929	assem_->StartBlockPools();
				1930	}
				1931	~BlockPoolsScope() {
				1932	assem_->EndBlockPools();
				1933	}
				1934
				1935	private:
				1936	Assembler* assem_;
				1937
				1938	DISALLOW_IMPLICIT_CONSTRUCTORS(BlockPoolsScope);
				1939	};
				1940
				1941	protected:
				1942	inline const Register& AppropriateZeroRegFor(const CPURegister& reg) const;
				1943
				1944	void LoadStore(const CPURegister& rt,
				1945	const MemOperand& addr,
				1946	LoadStoreOp op);
				1947
				1948	void LoadStorePair(const CPURegister& rt, const CPURegister& rt2,
				1949	const MemOperand& addr, LoadStorePairOp op);
				1950	static bool IsImmLSPair(int64_t offset, LSDataSize size);
				1951
				1952	void Logical(const Register& rd,
				1953	const Register& rn,
				1954	const Operand& operand,
				1955	LogicalOp op);
				1956	void LogicalImmediate(const Register& rd,
				1957	const Register& rn,
				1958	unsigned n,
				1959	unsigned imm_s,
				1960	unsigned imm_r,
				1961	LogicalOp op);
				1962
				1963	void ConditionalCompare(const Register& rn,
				1964	const Operand& operand,
				1965	StatusFlags nzcv,
				1966	Condition cond,
				1967	ConditionalCompareOp op);
				1968	static bool IsImmConditionalCompare(int64_t immediate);
				1969
				1970	void AddSubWithCarry(const Register& rd,
				1971	const Register& rn,
				1972	const Operand& operand,
				1973	FlagsUpdate S,
				1974	AddSubWithCarryOp op);
				1975
				1976	// Functions for emulating operands not directly supported by the instruction
				1977	// set.
				1978	void EmitShift(const Register& rd,
				1979	const Register& rn,
				1980	Shift shift,
				1981	unsigned amount);
				1982	void EmitExtendShift(const Register& rd,
				1983	const Register& rn,
				1984	Extend extend,
				1985	unsigned left_shift);
				1986
				1987	void AddSub(const Register& rd,
				1988	const Register& rn,
				1989	const Operand& operand,
				1990	FlagsUpdate S,
				1991	AddSubOp op);
				1992
				1993	static bool IsImmFP32(float imm);
				1994	static bool IsImmFP64(double imm);
				1995
				1996	// Find an appropriate LoadStoreOp or LoadStorePairOp for the specified
				1997	// registers. Only simple loads are supported; sign- and zero-extension (such
				1998	// as in LDPSW_x or LDRB_w) are not supported.
				1999	static inline LoadStoreOp LoadOpFor(const CPURegister& rt);
				2000	static inline LoadStorePairOp LoadPairOpFor(const CPURegister& rt,
				2001	const CPURegister& rt2);
				2002	static inline LoadStoreOp StoreOpFor(const CPURegister& rt);
				2003	static inline LoadStorePairOp StorePairOpFor(const CPURegister& rt,
				2004	const CPURegister& rt2);
				2005	static inline LoadStorePairNonTemporalOp LoadPairNonTemporalOpFor(
				2006	const CPURegister& rt, const CPURegister& rt2);
				2007	static inline LoadStorePairNonTemporalOp StorePairNonTemporalOpFor(
				2008	const CPURegister& rt, const CPURegister& rt2);
				2009	static inline LoadLiteralOp LoadLiteralOpFor(const CPURegister& rt);
				2010
				2011	// Remove the specified branch from the unbound label link chain.
				2012	// If available, a veneer for this label can be used for other branches in the
				2013	// chain if the link chain cannot be fixed up without this branch.
				2014	void RemoveBranchFromLabelLinkChain(Instruction* branch,
				2015	Label* label,
				2016	Instruction* label_veneer = NULL);
				2017
				2018	private:
				2019	// Instruction helpers.
				2020	void MoveWide(const Register& rd,
				2021	uint64_t imm,
				2022	int shift,
				2023	MoveWideImmediateOp mov_op);
				2024	void DataProcShiftedRegister(const Register& rd,
				2025	const Register& rn,
				2026	const Operand& operand,
				2027	FlagsUpdate S,
				2028	Instr op);
				2029	void DataProcExtendedRegister(const Register& rd,
				2030	const Register& rn,
				2031	const Operand& operand,
				2032	FlagsUpdate S,
				2033	Instr op);
				2034	void LoadStorePairNonTemporal(const CPURegister& rt,
				2035	const CPURegister& rt2,
				2036	const MemOperand& addr,
				2037	LoadStorePairNonTemporalOp op);
				2038	void ConditionalSelect(const Register& rd,
				2039	const Register& rn,
				2040	const Register& rm,
				2041	Condition cond,
				2042	ConditionalSelectOp op);
				2043	void DataProcessing1Source(const Register& rd,
				2044	const Register& rn,
				2045	DataProcessing1SourceOp op);
				2046	void DataProcessing3Source(const Register& rd,
				2047	const Register& rn,
				2048	const Register& rm,
				2049	const Register& ra,
				2050	DataProcessing3SourceOp op);
				2051	void FPDataProcessing1Source(const FPRegister& fd,
				2052	const FPRegister& fn,
				2053	FPDataProcessing1SourceOp op);
				2054	void FPDataProcessing2Source(const FPRegister& fd,
				2055	const FPRegister& fn,
				2056	const FPRegister& fm,
				2057	FPDataProcessing2SourceOp op);
				2058	void FPDataProcessing3Source(const FPRegister& fd,
				2059	const FPRegister& fn,
				2060	const FPRegister& fm,
				2061	const FPRegister& fa,
				2062	FPDataProcessing3SourceOp op);
				2063
				2064	// Label helpers.
				2065
				2066	// Return an offset for a label-referencing instruction, typically a branch.
				2067	int LinkAndGetByteOffsetTo(Label* label);
				2068
				2069	// This is the same as LinkAndGetByteOffsetTo, but return an offset
				2070	// suitable for fields that take instruction offsets.
				2071	inline int LinkAndGetInstructionOffsetTo(Label* label);
				2072
				2073	static const int kStartOfLabelLinkChain = 0;
				2074
				2075	// Verify that a label's link chain is intact.
				2076	void CheckLabelLinkChain(Label const * label);
				2077
				2078	void RecordLiteral(int64_t imm, unsigned size);
				2079
				2080	// Postpone the generation of the constant pool for the specified number of
				2081	// instructions.
				2082	void BlockConstPoolFor(int instructions);
				2083
				2084	// Set how far from the current pc, counted in instructions, the next constant pool check will be.
				2085	void SetNextConstPoolCheckIn(int instructions) {
				2086	next_constant_pool_check_ = pc_offset() + instructions * kInstructionSize;
				2087	}
				2088
				2089	// Emit the instruction at pc_, advance pc_ past it, then call CheckBuffer().
				2090	void Emit(Instr instruction) {
				2091	STATIC_ASSERT(sizeof(*pc_) == 1);
				2092	STATIC_ASSERT(sizeof(instruction) == kInstructionSize);
				2093	DCHECK((pc_ + sizeof(instruction)) <= (buffer_ + buffer_size_));
				2094
				2095	memcpy(pc_, &instruction, sizeof(instruction));
				2096	pc_ += sizeof(instruction);
				2097	CheckBuffer();
				2098	}
				2099
				2100	// Emit `size` bytes of data inline in the instruction stream at pc_, then advance pc_.
				2101	void EmitData(void const * data, unsigned size) {
				2102	STATIC_ASSERT(sizeof(*pc_) == 1);  // Compile-time fact; checked the same way in Emit().
				2103	DCHECK((pc_ + size) <= (buffer_ + buffer_size_));
				2104
				2105	// TODO(all): Somehow register we have some data here. Then we can
				2106	// disassemble it correctly.
				2107	memcpy(pc_, data, size);
				2108	pc_ += size;
				2109	CheckBuffer();
				2110	}
				2111
				2112	void GrowBuffer();
				2113	void CheckBufferSpace();
				2114	void CheckBuffer();
				2115
				2116	// Pc offset of the next constant pool check.
				2117	int next_constant_pool_check_;
				2118
				2119	// Constant pool generation
				2120	// Pools are emitted in the instruction stream. They are emitted when:
				2121	// * the distance to the first use is above a pre-defined distance or
				2122	// * the numbers of entries in the pool is above a pre-defined size or
				2123	// * code generation is finished
				2124	// If a pool needs to be emitted before code generation is finished a branch
				2125	// over the emitted pool will be inserted.
				2126
				2127	// Constants in the pool may be addresses of functions that get relocated;
				2128	// if so, a relocation info entry is associated to the constant pool entry.
				2129
				2130	// Repeated checking whether the constant pool should be emitted is rather
				2131	// expensive. By default we only check again once a number of instructions
				2132	// has been generated. That also means that the sizing of the buffers is not
				2133	// an exact science, and that we rely on some slop to not overrun buffers.
				2134	static const int kCheckConstPoolInterval = 128;
				2135
				2136	// Distance to first use after which a pool will be emitted. Pool entries
				2137	// are accessed with pc relative load therefore this cannot be more than
				2138	// 1 * MB. Since constant pool emission checks are interval based this value
				2139	// is an approximation.
				2140	static const int kApproxMaxDistToConstPool = 64 * KB;
				2141
				2142	// Number of pool entries after which a pool will be emitted. Since constant
				2143	// pool emission checks are interval based this value is an approximation.
				2144	static const int kApproxMaxPoolEntryCount = 512;
				2145
				2146	// Emission of the constant pool may be blocked in some code sequences.
				2147	int const_pool_blocked_nesting_; // Block emission if this is not zero.
				2148	int no_const_pool_before_; // Block emission before this pc offset.
				2149
				2150	// Emission of the veneer pools may be blocked in some code sequences.
				2151	int veneer_pool_blocked_nesting_; // Block emission if this is not zero.
				2152
				2153	// Relocation info generation
				2154	// Each relocation is encoded as a variable size value
				2155	static const int kMaxRelocSize = RelocInfoWriter::kMaxSize;
				2156	RelocInfoWriter reloc_info_writer;
				2157
				2158	// Relocation info records are also used during code generation as temporary
				2159	// containers for constants and code target addresses until they are emitted
				2160	// to the constant pool. These pending relocation info records are temporarily
				2161	// stored in a separate buffer until a constant pool is emitted.
				2162	// If every instruction in a long sequence is accessing the pool, we need one
				2163	// pending relocation entry per instruction.
				2164
				2165	// The pending constant pool.
				2166	ConstPool constpool_;
				2167
				2168	// Relocation for a type-recording IC has the AST id added to it. This
				2169	// member variable is a way to pass the information from the call site to
				2170	// the relocation info.
				2171	TypeFeedbackId recorded_ast_id_;
				2172
				2173	inline TypeFeedbackId RecordedAstId();
				2174	inline void ClearRecordedAstId();
				2175
				2176	protected:
				2177	// Record the AST id of the CallIC being compiled, so that it can be placed
				2178	// in the relocation information.
				2179	void SetRecordedAstId(TypeFeedbackId ast_id) {
				2180	DCHECK(recorded_ast_id_.IsNone());  // No other AST id may already be recorded.
				2181	recorded_ast_id_ = ast_id;
				2182	}
				2183
				2184	// Code generation
				2185	// The relocation writer's position is at least kGap bytes below the end of
				2186	// the generated instructions. This is so that multi-instruction sequences do
				2187	// not have to check for overflow. The same is true for writes of large
				2188	// relocation info entries, and debug strings encoded in the instruction
				2189	// stream.
				2190	static const int kGap = 128;
				2191
				2192	public:
				2193	class FarBranchInfo {  // A branch's offset in the buffer paired with the label it targets.
				2194	public:
				2195	FarBranchInfo(int offset, Label* label)
				2196	: pc_offset_(offset), label_(label) {}
				2197	// Offset of the branch in the code generation buffer.
				2198	int pc_offset_;
				2199	// The label branched to.
				2200	Label* label_;
				2201	};
				2202
				2203	protected:
				2204	// Information about unresolved (forward) branches.
				2205	// The Assembler is only allowed to delete out-of-date information from here
				2206	// after a label is bound. The MacroAssembler uses this information to
				2207	// generate veneers.
				2208	//
				2209	// The second member gives information about the unresolved branch. The first
				2210	// member of the pair is the maximum offset that the branch can reach in the
				2211	// buffer. The map is sorted according to this reachable offset, allowing to
				2212	// easily check when veneers need to be emitted.
				2213	// Note that the maximum reachable offset (first member of the pairs) should
				2214	// always be positive but has the same type as the return value for
				2215	// pc_offset() for convenience.
				2216	std::multimap<int, FarBranchInfo> unresolved_branches_;
				2217
				2218	// We generate a veneer for a branch if we reach within this distance of the
				2219	// limit of the range.
				2220	static const int kVeneerDistanceMargin = 1 * KB;
				2221	// The factor of 2 is a finger in the air guess. With a default margin of
				2222	// 1KB, that leaves us an additional 256 instructions to avoid generating a
				2223	// protective branch.
				2224	static const int kVeneerNoProtectionFactor = 2;
				2225	static const int kVeneerDistanceCheckMargin =
				2226	kVeneerNoProtectionFactor * kVeneerDistanceMargin;
				2227	int unresolved_branches_first_limit() const {  // Smallest key in unresolved_branches_; must be non-empty.
				2228	DCHECK(!unresolved_branches_.empty());
				2229	return unresolved_branches_.begin()->first;
				2230	}
				2231	// This is similar to next_constant_pool_check_ and helps reduce the overhead
				2232	// of checking for veneer pools.
				2233	// It is maintained to the closest unresolved branch limit minus the maximum
				2234	// veneer margin (or kMaxInt if there are no unresolved branches).
				2235	int next_veneer_pool_check_;
				2236
				2237	private:
				2238	// If a veneer is emitted for a branch instruction, that instruction must be
				2239	// removed from the associated label's link chain so that the assembler does
				2240	// not later attempt (likely unsuccessfully) to patch it to branch directly to
				2241	// the label.
				2242	void DeleteUnresolvedBranchInfoForLabel(Label* label);
				2243	// This function deletes the information related to the label by traversing
				2244	// the label chain, and for each PC-relative instruction in the chain checking
				2245	// if pending unresolved information exists. Its complexity is proportional to
				2246	// the length of the label chain.
				2247	void DeleteUnresolvedBranchInfoForLabelTraverse(Label* label);
				2248
				2249	private:
				2250	PositionsRecorder positions_recorder_;
				2251	friend class PositionsRecorder;
				2252	friend class EnsureSpace;
				2253	friend class ConstPool;
				2254	};
				2255
				2256	class PatchingAssembler : public Assembler {
				2257	public:
				2258	// Create an Assembler with a buffer starting at 'start'.
				2259	// The buffer size is
				2260	// size of instructions to patch + kGap
				2261	// Where kGap is the distance from which the Assembler tries to grow the
				2262	// buffer.
				2263	// If more or fewer instructions than expected are generated or if some
				2264	// relocation information takes space in the buffer, the PatchingAssembler
				2265	// will crash trying to grow the buffer.
				2266	PatchingAssembler(Instruction* start, unsigned count)
				2267	: Assembler(NULL,
				2268	reinterpret_cast<byte*>(start),
				2269	count * kInstructionSize + kGap) {
				2270	StartBlockPools();  // Undone by EndBlockPools() in the destructor.
				2271	}
				2272
				2273	PatchingAssembler(byte* start, unsigned count)
				2274	: Assembler(NULL, start, count * kInstructionSize + kGap) {
				2275	// Block constant pool emission (undone by EndBlockPools() in the destructor).
				2276	StartBlockPools();
				2277	}
				2278
				2279	~PatchingAssembler() {
				2280	// Const pool should still be blocked.
				2281	DCHECK(is_const_pool_blocked());
				2282	EndBlockPools();
				2283	// Verify we have generated the number of instructions we expected.
				2284	DCHECK((pc_offset() + kGap) == buffer_size_);
				2285	// Verify no relocation information has been emitted.
				2286	DCHECK(IsConstPoolEmpty());
				2287	// Flush the instruction cache over the buffer, excluding the trailing kGap bytes.
				2288	size_t length = buffer_size_ - kGap;
				2289	CpuFeatures::FlushICache(buffer_, length);
				2290	}
				2291
				2292	// See definition of PatchAdrFar() for details.
				2293	static const int kAdrFarPatchableNNops = 2;
				2294	static const int kAdrFarPatchableNInstrs = kAdrFarPatchableNNops + 2;
				2295	void PatchAdrFar(int64_t target_offset);
				2296	};
				2297
				2298
				2299	class EnsureSpace BASE_EMBEDDED {  // Calls Assembler::CheckBufferSpace() on construction.
				2300	public:
				2301	explicit EnsureSpace(Assembler* assembler) {
				2302	assembler->CheckBufferSpace();
				2303	}
				2304	};
				2305
				2306	} } // namespace v8::internal
				2307
				2308	#endif // V8_ARM64_ASSEMBLER_ARM64_H_