// Copyright 2012 the V8 project authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "src/v8.h"

#if V8_TARGET_ARCH_MIPS64

#include "src/codegen.h"
#include "src/macro-assembler.h"
#include "src/mips64/simulator-mips64.h"

namespace v8 {
namespace internal {

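// Convention used throughout this file: with "__" defined as "masm."
// (and as ACCESS_MASM(masm) for the code generators further down),
// assembler calls read as "__ instr(...)".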
#define __ masm.


#if defined(USE_SIMULATOR)
byte* fast_exp_mips_machine_code = NULL;
double fast_exp_simulator(double x) {
  return Simulator::current(Isolate::Current())->CallFP(
      fast_exp_mips_machine_code, x, 0);
}
#endif

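// Generates a native stub for exp() when --fast_math is enabled. Falls back
// to std::exp if the flag is off or the code buffer cannot be allocated.
// Under the simulator the generated buffer is invoked via Simulator::CallFP.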
UnaryMathFunction CreateExpFunction() {
  if (!FLAG_fast_math) return &std::exp;
  size_t actual_size;
  byte* buffer =
      static_cast<byte*>(base::OS::Allocate(1 * KB, &actual_size, true));
  if (buffer == NULL) return &std::exp;
  ExternalReference::InitializeMathExpData();

  MacroAssembler masm(NULL, buffer, static_cast<int>(actual_size));

  {
    DoubleRegister input = f12;
    DoubleRegister result = f0;
    DoubleRegister double_scratch1 = f4;
    DoubleRegister double_scratch2 = f6;
    Register temp1 = a4;
    Register temp2 = a5;
    Register temp3 = a6;

    if (!IsMipsSoftFloatABI) {
      // Input value is in f12 anyway, nothing to do.
    } else {
      __ Move(input, a0, a1);
    }
    __ Push(temp3, temp2, temp1);
    MathExpGenerator::EmitMathExp(
        &masm, input, result, double_scratch1, double_scratch2,
        temp1, temp2, temp3);
    __ Pop(temp3, temp2, temp1);
    if (!IsMipsSoftFloatABI) {
      // Result is already in f0, nothing to do.
    } else {
      __ Move(v0, v1, result);
    }
    __ Ret();
  }

  CodeDesc desc;
  masm.GetCode(&desc);
  DCHECK(!RelocInfo::RequiresRelocation(desc));

  CpuFeatures::FlushICache(buffer, actual_size);
  base::OS::ProtectCode(buffer, actual_size);

#if !defined(USE_SIMULATOR)
  return FUNCTION_CAST<UnaryMathFunction>(buffer);
#else
  fast_exp_mips_machine_code = buffer;
  return &fast_exp_simulator;
#endif
}

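// Generates an optimized uint8 memcpy stub with separate paths for aligned
// and unaligned src/dst, using prefetch hints. The C++ fallback |stub| is
// returned when running on the simulator or if allocation fails.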
#if defined(V8_HOST_ARCH_MIPS)
MemCopyUint8Function CreateMemCopyUint8Function(MemCopyUint8Function stub) {
#if defined(USE_SIMULATOR)
  return stub;
#else

  size_t actual_size;
  byte* buffer =
      static_cast<byte*>(base::OS::Allocate(3 * KB, &actual_size, true));
  if (buffer == NULL) return stub;

  // This code assumes that cache lines are 32 bytes; it will not work
  // correctly if the cache line is larger.
  MacroAssembler masm(NULL, buffer, static_cast<int>(actual_size));

  {
    Label lastb, unaligned, aligned, chkw,
          loop16w, chk1w, wordCopy_loop, skip_pref, lastbloop,
          leave, ua_chk16w, ua_loop16w, ua_skip_pref, ua_chkw,
          ua_chk1w, ua_wordCopy_loop, ua_smallCopy, ua_smallCopy_loop;

    // The size of each prefetch.
    uint32_t pref_chunk = 32;
    // The maximum size of a prefetch; it must not be less than pref_chunk.
    // If the real size of a prefetch is greater than max_pref_size and
    // the kPrefHintPrepareForStore hint is used, the code will not work
    // correctly.
    uint32_t max_pref_size = 128;
    DCHECK(pref_chunk < max_pref_size);

    // pref_limit is set based on the fact that we never use an offset
    // greater than 5 on a store pref and that a single pref can
    // never be larger than max_pref_size.
    uint32_t pref_limit = (5 * pref_chunk) + max_pref_size;
    int32_t pref_hint_load = kPrefHintLoadStreamed;
    int32_t pref_hint_store = kPrefHintPrepareForStore;
    uint32_t loadstore_chunk = 4;
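    // With the values above, the main loops below move 16 words (64 bytes)
    // per iteration, and pref_limit works out to 5 * 32 + 128 = 288 bytes
    // before the end of the destination buffer.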

    // The initial prefetches may fetch bytes that are before the buffer being
    // copied. Start copies with an offset of 4 to avoid this situation when
    // using kPrefHintPrepareForStore.
    DCHECK(pref_hint_store != kPrefHintPrepareForStore ||
           pref_chunk * 4 >= max_pref_size);
    // If the size is less than 8, go to lastb. Regardless of size,
    // copy dst pointer to v0 for the return value.
    __ slti(a6, a2, 2 * loadstore_chunk);
    __ bne(a6, zero_reg, &lastb);
    __ mov(v0, a0);  // In delay slot.

    // If src and dst have different alignments, go to unaligned; if they
    // have the same alignment (but are not actually aligned) do a partial
    // load/store to make them aligned. If they are both already aligned
    // we can start copying at aligned.
    __ xor_(t8, a1, a0);
    __ andi(t8, t8, loadstore_chunk - 1);  // t8 is a0/a1 word-displacement.
    __ bne(t8, zero_reg, &unaligned);
    __ subu(a3, zero_reg, a0);  // In delay slot.

    __ andi(a3, a3, loadstore_chunk - 1);  // Copy a3 bytes to align a0/a1.
    __ beq(a3, zero_reg, &aligned);  // Already aligned.
    __ subu(a2, a2, a3);  // In delay slot. a2 is the remaining bytes count.

    __ lwr(t8, MemOperand(a1));
    __ addu(a1, a1, a3);
    __ swr(t8, MemOperand(a0));
    __ addu(a0, a0, a3);

    // Now dst/src are both aligned to (word) aligned addresses. Set a2 to
    // count how many bytes we have to copy after all the 64 byte chunks are
    // copied and a3 to the dst pointer after all the 64 byte chunks have been
    // copied. We will loop, incrementing a0 and a1 until a0 equals a3.
    __ bind(&aligned);
    __ andi(t8, a2, 0x3f);
    __ beq(a2, t8, &chkw);  // Less than 64?
    __ subu(a3, a2, t8);  // In delay slot.
    __ addu(a3, a0, a3);  // Now a3 is the final dst after loop.

    // When in the loop we prefetch with the kPrefHintPrepareForStore hint;
    // in this case a0+x should be past the "a4-32" address. This means:
    // for x=128 the last "safe" a0 address is "a4-160". Alternatively, for
    // x=64 the last "safe" a0 address is "a4-96". In the current version we
    // will use "pref hint, 128(a0)", so "a4-160" is the limit.
    if (pref_hint_store == kPrefHintPrepareForStore) {
      __ addu(a4, a0, a2);  // a4 is the "past the end" address.
      __ Subu(t9, a4, pref_limit);  // t9 is the "last safe pref" address.
    }

    __ Pref(pref_hint_load, MemOperand(a1, 0 * pref_chunk));
    __ Pref(pref_hint_load, MemOperand(a1, 1 * pref_chunk));
    __ Pref(pref_hint_load, MemOperand(a1, 2 * pref_chunk));
    __ Pref(pref_hint_load, MemOperand(a1, 3 * pref_chunk));

    if (pref_hint_store != kPrefHintPrepareForStore) {
      __ Pref(pref_hint_store, MemOperand(a0, 1 * pref_chunk));
      __ Pref(pref_hint_store, MemOperand(a0, 2 * pref_chunk));
      __ Pref(pref_hint_store, MemOperand(a0, 3 * pref_chunk));
    }
    __ bind(&loop16w);
    __ lw(a4, MemOperand(a1));

    if (pref_hint_store == kPrefHintPrepareForStore) {
      __ sltu(v1, t9, a0);  // If a0 > t9, don't use next prefetch.
      __ Branch(USE_DELAY_SLOT, &skip_pref, gt, v1, Operand(zero_reg));
    }
    __ lw(a5, MemOperand(a1, 1, loadstore_chunk));  // Maybe in delay slot.

    __ Pref(pref_hint_store, MemOperand(a0, 4 * pref_chunk));
    __ Pref(pref_hint_store, MemOperand(a0, 5 * pref_chunk));

    __ bind(&skip_pref);
    __ lw(a6, MemOperand(a1, 2, loadstore_chunk));
    __ lw(a7, MemOperand(a1, 3, loadstore_chunk));
    __ lw(t0, MemOperand(a1, 4, loadstore_chunk));
    __ lw(t1, MemOperand(a1, 5, loadstore_chunk));
    __ lw(t2, MemOperand(a1, 6, loadstore_chunk));
    __ lw(t3, MemOperand(a1, 7, loadstore_chunk));
    __ Pref(pref_hint_load, MemOperand(a1, 4 * pref_chunk));

    __ sw(a4, MemOperand(a0));
    __ sw(a5, MemOperand(a0, 1, loadstore_chunk));
    __ sw(a6, MemOperand(a0, 2, loadstore_chunk));
    __ sw(a7, MemOperand(a0, 3, loadstore_chunk));
    __ sw(t0, MemOperand(a0, 4, loadstore_chunk));
    __ sw(t1, MemOperand(a0, 5, loadstore_chunk));
    __ sw(t2, MemOperand(a0, 6, loadstore_chunk));
    __ sw(t3, MemOperand(a0, 7, loadstore_chunk));

    __ lw(a4, MemOperand(a1, 8, loadstore_chunk));
    __ lw(a5, MemOperand(a1, 9, loadstore_chunk));
    __ lw(a6, MemOperand(a1, 10, loadstore_chunk));
    __ lw(a7, MemOperand(a1, 11, loadstore_chunk));
    __ lw(t0, MemOperand(a1, 12, loadstore_chunk));
    __ lw(t1, MemOperand(a1, 13, loadstore_chunk));
    __ lw(t2, MemOperand(a1, 14, loadstore_chunk));
    __ lw(t3, MemOperand(a1, 15, loadstore_chunk));
    __ Pref(pref_hint_load, MemOperand(a1, 5 * pref_chunk));

    __ sw(a4, MemOperand(a0, 8, loadstore_chunk));
    __ sw(a5, MemOperand(a0, 9, loadstore_chunk));
    __ sw(a6, MemOperand(a0, 10, loadstore_chunk));
    __ sw(a7, MemOperand(a0, 11, loadstore_chunk));
    __ sw(t0, MemOperand(a0, 12, loadstore_chunk));
    __ sw(t1, MemOperand(a0, 13, loadstore_chunk));
    __ sw(t2, MemOperand(a0, 14, loadstore_chunk));
    __ sw(t3, MemOperand(a0, 15, loadstore_chunk));
    __ addiu(a0, a0, 16 * loadstore_chunk);
    __ bne(a0, a3, &loop16w);
    __ addiu(a1, a1, 16 * loadstore_chunk);  // In delay slot.
    __ mov(a2, t8);

    // Here we have src and dest word-aligned but fewer than 64 bytes to go.
    // Check for a 32-byte chunk and copy it if there is one. Otherwise jump
    // down to chk1w to handle the tail end of the copy.
    __ bind(&chkw);
    __ Pref(pref_hint_load, MemOperand(a1, 0 * pref_chunk));
    __ andi(t8, a2, 0x1f);
    __ beq(a2, t8, &chk1w);  // Less than 32?
    __ nop();  // In delay slot.
    __ lw(a4, MemOperand(a1));
    __ lw(a5, MemOperand(a1, 1, loadstore_chunk));
    __ lw(a6, MemOperand(a1, 2, loadstore_chunk));
    __ lw(a7, MemOperand(a1, 3, loadstore_chunk));
    __ lw(t0, MemOperand(a1, 4, loadstore_chunk));
    __ lw(t1, MemOperand(a1, 5, loadstore_chunk));
    __ lw(t2, MemOperand(a1, 6, loadstore_chunk));
    __ lw(t3, MemOperand(a1, 7, loadstore_chunk));
    __ addiu(a1, a1, 8 * loadstore_chunk);
    __ sw(a4, MemOperand(a0));
    __ sw(a5, MemOperand(a0, 1, loadstore_chunk));
    __ sw(a6, MemOperand(a0, 2, loadstore_chunk));
    __ sw(a7, MemOperand(a0, 3, loadstore_chunk));
    __ sw(t0, MemOperand(a0, 4, loadstore_chunk));
    __ sw(t1, MemOperand(a0, 5, loadstore_chunk));
    __ sw(t2, MemOperand(a0, 6, loadstore_chunk));
    __ sw(t3, MemOperand(a0, 7, loadstore_chunk));
    __ addiu(a0, a0, 8 * loadstore_chunk);

    // Here we have less than 32 bytes to copy. Set up for a loop to copy
    // one word at a time. Set a2 to count how many bytes we have to copy
    // after all the word chunks are copied and a3 to the dst pointer after
    // all the word chunks have been copied. We will loop, incrementing a0
    // and a1 until a0 equals a3.
    __ bind(&chk1w);
    __ andi(a2, t8, loadstore_chunk - 1);
    __ beq(a2, t8, &lastb);
    __ subu(a3, t8, a2);  // In delay slot.
    __ addu(a3, a0, a3);

    __ bind(&wordCopy_loop);
    __ lw(a7, MemOperand(a1));
    __ addiu(a0, a0, loadstore_chunk);
    __ addiu(a1, a1, loadstore_chunk);
    __ bne(a0, a3, &wordCopy_loop);
    __ sw(a7, MemOperand(a0, -1, loadstore_chunk));  // In delay slot.

    __ bind(&lastb);
    __ Branch(&leave, le, a2, Operand(zero_reg));
    __ addu(a3, a0, a2);

    __ bind(&lastbloop);
    __ lb(v1, MemOperand(a1));
    __ addiu(a0, a0, 1);
    __ addiu(a1, a1, 1);
    __ bne(a0, a3, &lastbloop);
    __ sb(v1, MemOperand(a0, -1));  // In delay slot.

    __ bind(&leave);
    __ jr(ra);
    __ nop();

    // Unaligned case. Only the dst gets aligned so we need to do partial
    // loads of the source followed by normal stores to the dst (once we
    // have aligned the destination).
    __ bind(&unaligned);
    __ andi(a3, a3, loadstore_chunk - 1);  // Copy a3 bytes to align a0/a1.
    __ beq(a3, zero_reg, &ua_chk16w);
    __ subu(a2, a2, a3);  // In delay slot.

    __ lwr(v1, MemOperand(a1));
    __ lwl(v1,
           MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
    __ addu(a1, a1, a3);
    __ swr(v1, MemOperand(a0));
    __ addu(a0, a0, a3);

    // Now the dst (but not the source) is aligned. Set a2 to count how many
    // bytes we have to copy after all the 64 byte chunks are copied and a3 to
    // the dst pointer after all the 64 byte chunks have been copied. We will
    // loop, incrementing a0 and a1 until a0 equals a3.
    __ bind(&ua_chk16w);
    __ andi(t8, a2, 0x3f);
    __ beq(a2, t8, &ua_chkw);
    __ subu(a3, a2, t8);  // In delay slot.
    __ addu(a3, a0, a3);

    if (pref_hint_store == kPrefHintPrepareForStore) {
      __ addu(a4, a0, a2);
      __ Subu(t9, a4, pref_limit);
    }

    __ Pref(pref_hint_load, MemOperand(a1, 0 * pref_chunk));
    __ Pref(pref_hint_load, MemOperand(a1, 1 * pref_chunk));
    __ Pref(pref_hint_load, MemOperand(a1, 2 * pref_chunk));

    if (pref_hint_store != kPrefHintPrepareForStore) {
      __ Pref(pref_hint_store, MemOperand(a0, 1 * pref_chunk));
      __ Pref(pref_hint_store, MemOperand(a0, 2 * pref_chunk));
      __ Pref(pref_hint_store, MemOperand(a0, 3 * pref_chunk));
    }

    __ bind(&ua_loop16w);
    __ Pref(pref_hint_load, MemOperand(a1, 3 * pref_chunk));
    __ lwr(a4, MemOperand(a1));
    __ lwr(a5, MemOperand(a1, 1, loadstore_chunk));
    __ lwr(a6, MemOperand(a1, 2, loadstore_chunk));

    if (pref_hint_store == kPrefHintPrepareForStore) {
      __ sltu(v1, t9, a0);
      __ Branch(USE_DELAY_SLOT, &ua_skip_pref, gt, v1, Operand(zero_reg));
    }
    __ lwr(a7, MemOperand(a1, 3, loadstore_chunk));  // Maybe in delay slot.

    __ Pref(pref_hint_store, MemOperand(a0, 4 * pref_chunk));
    __ Pref(pref_hint_store, MemOperand(a0, 5 * pref_chunk));

    __ bind(&ua_skip_pref);
    __ lwr(t0, MemOperand(a1, 4, loadstore_chunk));
    __ lwr(t1, MemOperand(a1, 5, loadstore_chunk));
    __ lwr(t2, MemOperand(a1, 6, loadstore_chunk));
    __ lwr(t3, MemOperand(a1, 7, loadstore_chunk));
    __ lwl(a4,
           MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(a5,
           MemOperand(a1, 2, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(a6,
           MemOperand(a1, 3, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(a7,
           MemOperand(a1, 4, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t0,
           MemOperand(a1, 5, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t1,
           MemOperand(a1, 6, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t2,
           MemOperand(a1, 7, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t3,
           MemOperand(a1, 8, loadstore_chunk, MemOperand::offset_minus_one));
    __ Pref(pref_hint_load, MemOperand(a1, 4 * pref_chunk));
    __ sw(a4, MemOperand(a0));
    __ sw(a5, MemOperand(a0, 1, loadstore_chunk));
    __ sw(a6, MemOperand(a0, 2, loadstore_chunk));
    __ sw(a7, MemOperand(a0, 3, loadstore_chunk));
    __ sw(t0, MemOperand(a0, 4, loadstore_chunk));
    __ sw(t1, MemOperand(a0, 5, loadstore_chunk));
    __ sw(t2, MemOperand(a0, 6, loadstore_chunk));
    __ sw(t3, MemOperand(a0, 7, loadstore_chunk));
    __ lwr(a4, MemOperand(a1, 8, loadstore_chunk));
    __ lwr(a5, MemOperand(a1, 9, loadstore_chunk));
    __ lwr(a6, MemOperand(a1, 10, loadstore_chunk));
    __ lwr(a7, MemOperand(a1, 11, loadstore_chunk));
    __ lwr(t0, MemOperand(a1, 12, loadstore_chunk));
    __ lwr(t1, MemOperand(a1, 13, loadstore_chunk));
    __ lwr(t2, MemOperand(a1, 14, loadstore_chunk));
    __ lwr(t3, MemOperand(a1, 15, loadstore_chunk));
    __ lwl(a4,
           MemOperand(a1, 9, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(a5,
           MemOperand(a1, 10, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(a6,
           MemOperand(a1, 11, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(a7,
           MemOperand(a1, 12, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t0,
           MemOperand(a1, 13, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t1,
           MemOperand(a1, 14, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t2,
           MemOperand(a1, 15, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t3,
           MemOperand(a1, 16, loadstore_chunk, MemOperand::offset_minus_one));
    __ Pref(pref_hint_load, MemOperand(a1, 5 * pref_chunk));
    __ sw(a4, MemOperand(a0, 8, loadstore_chunk));
    __ sw(a5, MemOperand(a0, 9, loadstore_chunk));
    __ sw(a6, MemOperand(a0, 10, loadstore_chunk));
    __ sw(a7, MemOperand(a0, 11, loadstore_chunk));
    __ sw(t0, MemOperand(a0, 12, loadstore_chunk));
    __ sw(t1, MemOperand(a0, 13, loadstore_chunk));
    __ sw(t2, MemOperand(a0, 14, loadstore_chunk));
    __ sw(t3, MemOperand(a0, 15, loadstore_chunk));
    __ addiu(a0, a0, 16 * loadstore_chunk);
    __ bne(a0, a3, &ua_loop16w);
    __ addiu(a1, a1, 16 * loadstore_chunk);  // In delay slot.
    __ mov(a2, t8);

    // Here we have less than 64 bytes left to copy. Check for
    // a 32-byte chunk and copy it if there is one. Otherwise jump down to
    // ua_chk1w to handle the tail end of the copy.
    __ bind(&ua_chkw);
    __ Pref(pref_hint_load, MemOperand(a1));
    __ andi(t8, a2, 0x1f);

    __ beq(a2, t8, &ua_chk1w);
    __ nop();  // In delay slot.
    __ lwr(a4, MemOperand(a1));
    __ lwr(a5, MemOperand(a1, 1, loadstore_chunk));
    __ lwr(a6, MemOperand(a1, 2, loadstore_chunk));
    __ lwr(a7, MemOperand(a1, 3, loadstore_chunk));
    __ lwr(t0, MemOperand(a1, 4, loadstore_chunk));
    __ lwr(t1, MemOperand(a1, 5, loadstore_chunk));
    __ lwr(t2, MemOperand(a1, 6, loadstore_chunk));
    __ lwr(t3, MemOperand(a1, 7, loadstore_chunk));
    __ lwl(a4,
           MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(a5,
           MemOperand(a1, 2, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(a6,
           MemOperand(a1, 3, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(a7,
           MemOperand(a1, 4, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t0,
           MemOperand(a1, 5, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t1,
           MemOperand(a1, 6, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t2,
           MemOperand(a1, 7, loadstore_chunk, MemOperand::offset_minus_one));
    __ lwl(t3,
           MemOperand(a1, 8, loadstore_chunk, MemOperand::offset_minus_one));
    __ addiu(a1, a1, 8 * loadstore_chunk);
    __ sw(a4, MemOperand(a0));
    __ sw(a5, MemOperand(a0, 1, loadstore_chunk));
    __ sw(a6, MemOperand(a0, 2, loadstore_chunk));
    __ sw(a7, MemOperand(a0, 3, loadstore_chunk));
    __ sw(t0, MemOperand(a0, 4, loadstore_chunk));
    __ sw(t1, MemOperand(a0, 5, loadstore_chunk));
    __ sw(t2, MemOperand(a0, 6, loadstore_chunk));
    __ sw(t3, MemOperand(a0, 7, loadstore_chunk));
    __ addiu(a0, a0, 8 * loadstore_chunk);

    // Less than 32 bytes to copy. Set up for a loop to
    // copy one word at a time.
    __ bind(&ua_chk1w);
    __ andi(a2, t8, loadstore_chunk - 1);
    __ beq(a2, t8, &ua_smallCopy);
    __ subu(a3, t8, a2);  // In delay slot.
    __ addu(a3, a0, a3);

    __ bind(&ua_wordCopy_loop);
    __ lwr(v1, MemOperand(a1));
    __ lwl(v1,
           MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
    __ addiu(a0, a0, loadstore_chunk);
    __ addiu(a1, a1, loadstore_chunk);
    __ bne(a0, a3, &ua_wordCopy_loop);
    __ sw(v1, MemOperand(a0, -1, loadstore_chunk));  // In delay slot.

    // Copy the remaining bytes.
    __ bind(&ua_smallCopy);
    __ beq(a2, zero_reg, &leave);
    __ addu(a3, a0, a2);  // In delay slot.

    __ bind(&ua_smallCopy_loop);
    __ lb(v1, MemOperand(a1));
    __ addiu(a0, a0, 1);
    __ addiu(a1, a1, 1);
    __ bne(a0, a3, &ua_smallCopy_loop);
    __ sb(v1, MemOperand(a0, -1));  // In delay slot.

    __ jr(ra);
    __ nop();
  }
  CodeDesc desc;
  masm.GetCode(&desc);
  DCHECK(!RelocInfo::RequiresRelocation(desc));

  CpuFeatures::FlushICache(buffer, actual_size);
  base::OS::ProtectCode(buffer, actual_size);
  return FUNCTION_CAST<MemCopyUint8Function>(buffer);
#endif
}
#endif

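// Generates a minimal sqrt stub (a single sqrt.d); std::sqrt is used under
// the simulator or if the code buffer cannot be allocated.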
UnaryMathFunction CreateSqrtFunction() {
#if defined(USE_SIMULATOR)
  return &std::sqrt;
#else
  size_t actual_size;
  byte* buffer =
      static_cast<byte*>(base::OS::Allocate(1 * KB, &actual_size, true));
  if (buffer == NULL) return &std::sqrt;

  MacroAssembler masm(NULL, buffer, static_cast<int>(actual_size));

  __ MovFromFloatParameter(f12);
  __ sqrt_d(f0, f12);
  __ MovToFloatResult(f0);
  __ Ret();

  CodeDesc desc;
  masm.GetCode(&desc);
  DCHECK(!RelocInfo::RequiresRelocation(desc));

  CpuFeatures::FlushICache(buffer, actual_size);
  base::OS::ProtectCode(buffer, actual_size);
  return FUNCTION_CAST<UnaryMathFunction>(buffer);
#endif
}

#undef __


// -------------------------------------------------------------------------
// Platform-specific RuntimeCallHelper functions.

void StubRuntimeCallHelper::BeforeCall(MacroAssembler* masm) const {
  masm->EnterFrame(StackFrame::INTERNAL);
  DCHECK(!masm->has_frame());
  masm->set_has_frame(true);
}


void StubRuntimeCallHelper::AfterCall(MacroAssembler* masm) const {
  masm->LeaveFrame(StackFrame::INTERNAL);
  DCHECK(masm->has_frame());
  masm->set_has_frame(false);
}


// -------------------------------------------------------------------------
// Code generators

#define __ ACCESS_MASM(masm)

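// Elements transition that only requires a map change: store the new map
// into the receiver and record the write; the backing store is untouched.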
void ElementsTransitionGenerator::GenerateMapChangeElementsTransition(
    MacroAssembler* masm,
    Register receiver,
    Register key,
    Register value,
    Register target_map,
    AllocationSiteMode mode,
    Label* allocation_memento_found) {
  Register scratch_elements = a4;
  DCHECK(!AreAliased(receiver, key, value, target_map,
                     scratch_elements));

  if (mode == TRACK_ALLOCATION_SITE) {
    __ JumpIfJSArrayHasAllocationMemento(
        receiver, scratch_elements, allocation_memento_found);
  }

  // Set transitioned map.
  __ sd(target_map, FieldMemOperand(receiver, HeapObject::kMapOffset));
  __ RecordWriteField(receiver,
                      HeapObject::kMapOffset,
                      target_map,
                      t1,
                      kRAHasNotBeenSaved,
                      kDontSaveFPRegs,
                      EMIT_REMEMBERED_SET,
                      OMIT_SMI_CHECK);
}

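// Transitions a smi-only FixedArray backing store into a freshly allocated
// FixedDoubleArray, converting each smi to a double and each hole to the
// hole NaN. Jumps to |fail| if allocation would require a GC.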
void ElementsTransitionGenerator::GenerateSmiToDouble(
    MacroAssembler* masm,
    Register receiver,
    Register key,
    Register value,
    Register target_map,
    AllocationSiteMode mode,
    Label* fail) {
  // Register ra contains the return address.
  Label loop, entry, convert_hole, gc_required, only_change_map, done;
  Register elements = a4;
  Register length = a5;
  Register array = a6;
  Register array_end = array;

  // target_map parameter can be clobbered.
  Register scratch1 = target_map;
  Register scratch2 = t1;
  Register scratch3 = a7;

  // Verify input registers don't conflict with locals.
  DCHECK(!AreAliased(receiver, key, value, target_map,
                     elements, length, array, scratch2));

  Register scratch = t2;
  if (mode == TRACK_ALLOCATION_SITE) {
    __ JumpIfJSArrayHasAllocationMemento(receiver, elements, fail);
  }

  // Check for empty arrays, which only require a map transition and no changes
  // to the backing store.
  __ ld(elements, FieldMemOperand(receiver, JSObject::kElementsOffset));
  __ LoadRoot(at, Heap::kEmptyFixedArrayRootIndex);
  __ Branch(&only_change_map, eq, at, Operand(elements));

  __ push(ra);
  __ ld(length, FieldMemOperand(elements, FixedArray::kLengthOffset));
  // elements: source FixedArray
  // length: number of elements (smi-tagged)

  // Allocate new FixedDoubleArray.
  __ SmiScale(scratch, length, kDoubleSizeLog2);
  __ Daddu(scratch, scratch, FixedDoubleArray::kHeaderSize);
  __ Allocate(scratch, array, t3, scratch2, &gc_required, DOUBLE_ALIGNMENT);
  // array: destination FixedDoubleArray, not tagged as heap object

  // Set destination FixedDoubleArray's length and map.
  __ LoadRoot(scratch2, Heap::kFixedDoubleArrayMapRootIndex);
  __ sd(length, MemOperand(array, FixedDoubleArray::kLengthOffset));
  // Update receiver's map.
  __ sd(scratch2, MemOperand(array, HeapObject::kMapOffset));

  __ sd(target_map, FieldMemOperand(receiver, HeapObject::kMapOffset));
  __ RecordWriteField(receiver,
                      HeapObject::kMapOffset,
                      target_map,
                      scratch2,
                      kRAHasBeenSaved,
                      kDontSaveFPRegs,
                      OMIT_REMEMBERED_SET,
                      OMIT_SMI_CHECK);
  // Replace receiver's backing store with newly created FixedDoubleArray.
  __ Daddu(scratch1, array, Operand(kHeapObjectTag));
  __ sd(scratch1, FieldMemOperand(a2, JSObject::kElementsOffset));
  __ RecordWriteField(receiver,
                      JSObject::kElementsOffset,
                      scratch1,
                      scratch2,
                      kRAHasBeenSaved,
                      kDontSaveFPRegs,
                      EMIT_REMEMBERED_SET,
                      OMIT_SMI_CHECK);


  // Prepare for conversion loop.
  __ Daddu(scratch1, elements,
      Operand(FixedArray::kHeaderSize - kHeapObjectTag));
  __ Daddu(scratch3, array, Operand(FixedDoubleArray::kHeaderSize));
  __ SmiScale(array_end, length, kDoubleSizeLog2);
  __ Daddu(array_end, array_end, scratch3);

  // Repurpose registers no longer in use.
  Register hole_lower = elements;
  Register hole_upper = length;
  __ li(hole_lower, Operand(kHoleNanLower32));
  // scratch1: begin of source FixedArray element fields, not tagged
  // hole_lower: kHoleNanLower32
  // hole_upper: kHoleNanUpper32
  // array_end: end of destination FixedDoubleArray, not tagged
  // scratch3: begin of FixedDoubleArray element fields, not tagged
  __ Branch(USE_DELAY_SLOT, &entry);
  __ li(hole_upper, Operand(kHoleNanUpper32));  // In delay slot.

  __ bind(&only_change_map);
  __ sd(target_map, FieldMemOperand(receiver, HeapObject::kMapOffset));
  __ RecordWriteField(receiver,
                      HeapObject::kMapOffset,
                      target_map,
                      scratch2,
                      kRAHasBeenSaved,
                      kDontSaveFPRegs,
                      OMIT_REMEMBERED_SET,
                      OMIT_SMI_CHECK);
  __ Branch(&done);

  // Call into runtime if GC is required.
  __ bind(&gc_required);
  __ ld(ra, MemOperand(sp, 0));
  __ Branch(USE_DELAY_SLOT, fail);
  __ daddiu(sp, sp, kPointerSize);  // In delay slot.

  // Convert and copy elements.
  __ bind(&loop);
  __ ld(scratch2, MemOperand(scratch1));
  __ Daddu(scratch1, scratch1, kIntSize);
  // scratch2: current element
  __ JumpIfNotSmi(scratch2, &convert_hole);
  __ SmiUntag(scratch2);

  // Normal smi, convert to double and store.
  __ mtc1(scratch2, f0);
  __ cvt_d_w(f0, f0);
  __ sdc1(f0, MemOperand(scratch3));
  __ Branch(USE_DELAY_SLOT, &entry);
  __ daddiu(scratch3, scratch3, kDoubleSize);  // In delay slot.

  // Hole found, store the-hole NaN.
  __ bind(&convert_hole);
  if (FLAG_debug_code) {
    // Restore a "smi-untagged" heap object.
    __ Or(scratch2, scratch2, Operand(1));
    __ LoadRoot(at, Heap::kTheHoleValueRootIndex);
    __ Assert(eq, kObjectFoundInSmiOnlyArray, at, Operand(scratch2));
  }
  // mantissa
  __ sw(hole_lower, MemOperand(scratch3));
  // exponent
  __ sw(hole_upper, MemOperand(scratch3, kIntSize));
  __ Daddu(scratch3, scratch3, kDoubleSize);

  __ bind(&entry);
  __ Branch(&loop, lt, scratch3, Operand(array_end));

  __ bind(&done);
  __ pop(ra);
}

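// Transitions a FixedDoubleArray backing store into a freshly allocated
// FixedArray, boxing each double in a new HeapNumber and turning each hole
// NaN back into the hole value. Jumps to |fail| if a GC would be required.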
void ElementsTransitionGenerator::GenerateDoubleToObject(
    MacroAssembler* masm,
    Register receiver,
    Register key,
    Register value,
    Register target_map,
    AllocationSiteMode mode,
    Label* fail) {
  // Register ra contains the return address.
  Label entry, loop, convert_hole, gc_required, only_change_map;
  Register elements = a4;
  Register array = a6;
  Register length = a5;
  Register scratch = t1;

  // Verify input registers don't conflict with locals.
  DCHECK(!AreAliased(receiver, key, value, target_map,
                     elements, array, length, scratch));
  if (mode == TRACK_ALLOCATION_SITE) {
    __ JumpIfJSArrayHasAllocationMemento(receiver, elements, fail);
  }

  // Check for empty arrays, which only require a map transition and no changes
  // to the backing store.
  __ ld(elements, FieldMemOperand(receiver, JSObject::kElementsOffset));
  __ LoadRoot(at, Heap::kEmptyFixedArrayRootIndex);
  __ Branch(&only_change_map, eq, at, Operand(elements));

  __ MultiPush(
      value.bit() | key.bit() | receiver.bit() | target_map.bit() | ra.bit());

  __ ld(length, FieldMemOperand(elements, FixedArray::kLengthOffset));
  // elements: source FixedArray
  // length: number of elements (smi-tagged)

  // Allocate new FixedArray.
  // Re-use value and target_map registers, as they have been saved on the
  // stack.
  Register array_size = value;
  Register allocate_scratch = target_map;
  __ SmiScale(array_size, length, kPointerSizeLog2);
  __ Daddu(array_size, array_size, FixedDoubleArray::kHeaderSize);
  __ Allocate(array_size, array, allocate_scratch, scratch, &gc_required,
              NO_ALLOCATION_FLAGS);
  // array: destination FixedArray, not tagged as heap object
  // Set destination FixedDoubleArray's length and map.
  __ LoadRoot(scratch, Heap::kFixedArrayMapRootIndex);
  __ sd(length, MemOperand(array, FixedDoubleArray::kLengthOffset));
  __ sd(scratch, MemOperand(array, HeapObject::kMapOffset));

  // Prepare for conversion loop.
  Register src_elements = elements;
  Register dst_elements = target_map;
  Register dst_end = length;
  Register heap_number_map = scratch;
  __ Daddu(src_elements, src_elements,
      Operand(FixedDoubleArray::kHeaderSize - kHeapObjectTag + 4));
  __ Daddu(dst_elements, array, Operand(FixedArray::kHeaderSize));
  __ Daddu(array, array, Operand(kHeapObjectTag));
  __ SmiScale(dst_end, dst_end, kPointerSizeLog2);
  __ Daddu(dst_end, dst_elements, dst_end);
  __ LoadRoot(heap_number_map, Heap::kHeapNumberMapRootIndex);
  // Using offset addresses.
  // dst_elements: begin of destination FixedArray element fields, not tagged
  // src_elements: begin of source FixedDoubleArray element fields, not tagged,
  //               points to the exponent
  // dst_end: end of destination FixedArray, not tagged
  // array: destination FixedArray
  // heap_number_map: heap number map
  __ Branch(&entry);

  // Call into runtime if GC is required.
  __ bind(&gc_required);
  __ MultiPop(
      value.bit() | key.bit() | receiver.bit() | target_map.bit() | ra.bit());

  __ Branch(fail);

  __ bind(&loop);
  Register upper_bits = key;
  __ lw(upper_bits, MemOperand(src_elements));
  __ Daddu(src_elements, src_elements, kDoubleSize);
  // upper_bits: current element's upper 32 bits
  // src_elements: address of next element's upper 32 bits
  __ Branch(&convert_hole, eq, a1, Operand(kHoleNanUpper32));

  // Non-hole double, copy value into a heap number.
  Register heap_number = receiver;
  Register scratch2 = value;
  Register scratch3 = t2;
  __ AllocateHeapNumber(heap_number, scratch2, scratch3, heap_number_map,
                        &gc_required);
  // heap_number: new heap number
  // Load mantissa of current element; src_elements
  // points to the exponent of the next element.
  __ lw(scratch2, MemOperand(heap_number, -12));
  __ sw(scratch2, FieldMemOperand(heap_number, HeapNumber::kMantissaOffset));
  __ sw(upper_bits, FieldMemOperand(heap_number, HeapNumber::kExponentOffset));
  __ mov(scratch2, dst_elements);
  __ sd(heap_number, MemOperand(dst_elements));
  __ Daddu(dst_elements, dst_elements, kPointerSize);
  __ RecordWrite(array,
                 scratch2,
                 heap_number,
                 kRAHasBeenSaved,
                 kDontSaveFPRegs,
                 EMIT_REMEMBERED_SET,
                 OMIT_SMI_CHECK);
  __ Branch(&entry);

  // Replace the-hole NaN with the-hole pointer.
  __ bind(&convert_hole);
  __ LoadRoot(scratch2, Heap::kTheHoleValueRootIndex);
  __ sd(scratch2, MemOperand(dst_elements));
  __ Daddu(dst_elements, dst_elements, kPointerSize);

  __ bind(&entry);
  __ Branch(&loop, lt, dst_elements, Operand(dst_end));

  __ MultiPop(receiver.bit() | target_map.bit() | value.bit() | key.bit());
  // Replace receiver's backing store with newly created and filled FixedArray.
  __ sd(array, FieldMemOperand(receiver, JSObject::kElementsOffset));
  __ RecordWriteField(receiver,
                      JSObject::kElementsOffset,
                      array,
                      scratch,
                      kRAHasBeenSaved,
                      kDontSaveFPRegs,
                      EMIT_REMEMBERED_SET,
                      OMIT_SMI_CHECK);
  __ pop(ra);

  __ bind(&only_change_map);
  // Update receiver's map.
  __ sd(target_map, FieldMemOperand(receiver, HeapObject::kMapOffset));
  __ RecordWriteField(receiver,
                      HeapObject::kMapOffset,
                      target_map,
                      scratch,
                      kRAHasNotBeenSaved,
                      kDontSaveFPRegs,
                      OMIT_REMEMBERED_SET,
                      OMIT_SMI_CHECK);
}

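// Loads the character at |index| of |string| into |result|, unwrapping
// sliced and flat cons strings and handling both sequential and external
// representations. Bails out to |call_runtime| when the string needs
// flattening or is a short external string.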
void StringCharLoadGenerator::Generate(MacroAssembler* masm,
                                       Register string,
                                       Register index,
                                       Register result,
                                       Label* call_runtime) {
  // Fetch the instance type of the receiver into result register.
  __ ld(result, FieldMemOperand(string, HeapObject::kMapOffset));
  __ lbu(result, FieldMemOperand(result, Map::kInstanceTypeOffset));

  // We need special handling for indirect strings.
  Label check_sequential;
  __ And(at, result, Operand(kIsIndirectStringMask));
  __ Branch(&check_sequential, eq, at, Operand(zero_reg));

  // Dispatch on the indirect string shape: slice or cons.
  Label cons_string;
  __ And(at, result, Operand(kSlicedNotConsMask));
  __ Branch(&cons_string, eq, at, Operand(zero_reg));

  // Handle slices.
  Label indirect_string_loaded;
  __ ld(result, FieldMemOperand(string, SlicedString::kOffsetOffset));
  __ ld(string, FieldMemOperand(string, SlicedString::kParentOffset));
  __ dsra32(at, result, 0);
  __ Daddu(index, index, at);
  __ jmp(&indirect_string_loaded);

  // Handle cons strings.
  // Check whether the right hand side is the empty string (i.e. if
  // this is really a flat string in a cons string). If that is not
  // the case we would rather go to the runtime system now to flatten
  // the string.
  __ bind(&cons_string);
  __ ld(result, FieldMemOperand(string, ConsString::kSecondOffset));
  __ LoadRoot(at, Heap::kempty_stringRootIndex);
  __ Branch(call_runtime, ne, result, Operand(at));
  // Get the first of the two strings and load its instance type.
  __ ld(string, FieldMemOperand(string, ConsString::kFirstOffset));

  __ bind(&indirect_string_loaded);
  __ ld(result, FieldMemOperand(string, HeapObject::kMapOffset));
  __ lbu(result, FieldMemOperand(result, Map::kInstanceTypeOffset));

  // Distinguish sequential and external strings. Only these two string
  // representations can reach here (slices and flat cons strings have been
  // reduced to the underlying sequential or external string).
  Label external_string, check_encoding;
  __ bind(&check_sequential);
  STATIC_ASSERT(kSeqStringTag == 0);
  __ And(at, result, Operand(kStringRepresentationMask));
  __ Branch(&external_string, ne, at, Operand(zero_reg));

  // Prepare sequential strings.
  STATIC_ASSERT(SeqTwoByteString::kHeaderSize == SeqOneByteString::kHeaderSize);
  __ Daddu(string,
           string,
           SeqTwoByteString::kHeaderSize - kHeapObjectTag);
  __ jmp(&check_encoding);

  // Handle external strings.
  __ bind(&external_string);
  if (FLAG_debug_code) {
    // Assert that we do not have a cons or slice (indirect strings) here.
    // Sequential strings have already been ruled out.
    __ And(at, result, Operand(kIsIndirectStringMask));
    __ Assert(eq, kExternalStringExpectedButNotFound,
              at, Operand(zero_reg));
  }
  // Rule out short external strings.
  STATIC_ASSERT(kShortExternalStringTag != 0);
  __ And(at, result, Operand(kShortExternalStringMask));
  __ Branch(call_runtime, ne, at, Operand(zero_reg));
  __ ld(string, FieldMemOperand(string, ExternalString::kResourceDataOffset));

  Label one_byte, done;
  __ bind(&check_encoding);
  STATIC_ASSERT(kTwoByteStringTag == 0);
  __ And(at, result, Operand(kStringEncodingMask));
  __ Branch(&one_byte, ne, at, Operand(zero_reg));
  // Two-byte string.
  __ dsll(at, index, 1);
  __ Daddu(at, string, at);
  __ lhu(result, MemOperand(at));
  __ jmp(&done);
  __ bind(&one_byte);
  // One-byte string.
  __ Daddu(at, string, index);
  __ lbu(result, MemOperand(at));
  __ bind(&done);
}


static MemOperand ExpConstant(int index, Register base) {
  return MemOperand(base, index * kDoubleSize);
}

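// Computes exp(input) into |result| using the constants set up by
// ExternalReference::InitializeMathExpData(): inputs at or below the first
// constant produce 0, inputs at or above the second produce infinity, and
// the general case combines a polynomial approximation with an entry of
// math_exp_log_table selected by the low 11 bits of the scaled argument.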
void MathExpGenerator::EmitMathExp(MacroAssembler* masm,
                                   DoubleRegister input,
                                   DoubleRegister result,
                                   DoubleRegister double_scratch1,
                                   DoubleRegister double_scratch2,
                                   Register temp1,
                                   Register temp2,
                                   Register temp3) {
  DCHECK(!input.is(result));
  DCHECK(!input.is(double_scratch1));
  DCHECK(!input.is(double_scratch2));
  DCHECK(!result.is(double_scratch1));
  DCHECK(!result.is(double_scratch2));
  DCHECK(!double_scratch1.is(double_scratch2));
  DCHECK(!temp1.is(temp2));
  DCHECK(!temp1.is(temp3));
  DCHECK(!temp2.is(temp3));
  DCHECK(ExternalReference::math_exp_constants(0).address() != NULL);
  DCHECK(!masm->serializer_enabled());  // External references not serializable.

  Label zero, infinity, done;
  __ li(temp3, Operand(ExternalReference::math_exp_constants(0)));

  __ ldc1(double_scratch1, ExpConstant(0, temp3));
  __ BranchF(&zero, NULL, ge, double_scratch1, input);

  __ ldc1(double_scratch2, ExpConstant(1, temp3));
  __ BranchF(&infinity, NULL, ge, input, double_scratch2);

  __ ldc1(double_scratch1, ExpConstant(3, temp3));
  __ ldc1(result, ExpConstant(4, temp3));
  __ mul_d(double_scratch1, double_scratch1, input);
  __ add_d(double_scratch1, double_scratch1, result);
  __ FmoveLow(temp2, double_scratch1);
  __ sub_d(double_scratch1, double_scratch1, result);
  __ ldc1(result, ExpConstant(6, temp3));
  __ ldc1(double_scratch2, ExpConstant(5, temp3));
  __ mul_d(double_scratch1, double_scratch1, double_scratch2);
  __ sub_d(double_scratch1, double_scratch1, input);
  __ sub_d(result, result, double_scratch1);
  __ mul_d(double_scratch2, double_scratch1, double_scratch1);
  __ mul_d(result, result, double_scratch2);
  __ ldc1(double_scratch2, ExpConstant(7, temp3));
  __ mul_d(result, result, double_scratch2);
  __ sub_d(result, result, double_scratch1);
  // Move 1 into double_scratch2 as math_exp_constants_array[8] == 1.
  DCHECK(*reinterpret_cast<double*>
         (ExternalReference::math_exp_constants(8).address()) == 1);
  __ Move(double_scratch2, 1);
  __ add_d(result, result, double_scratch2);
  __ dsrl(temp1, temp2, 11);
  __ Ext(temp2, temp2, 0, 11);
  __ Daddu(temp1, temp1, Operand(0x3ff));
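  // At this point temp2 holds the 11-bit table index and temp1 the remaining
  // high bits plus 0x3ff, the IEEE-754 double exponent bias; temp1 is shifted
  // into the exponent field below when double_scratch1 is assembled.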

  // Must not call ExpConstant() after overwriting temp3!
  __ li(temp3, Operand(ExternalReference::math_exp_log_table()));
  __ dsll(at, temp2, 3);
  __ Daddu(temp3, temp3, Operand(at));
  __ lwu(temp2, MemOperand(temp3, 0));
  __ lwu(temp3, MemOperand(temp3, kIntSize));
  // The first word is loaded into the lower-numbered register.
  if (temp2.code() < temp3.code()) {
    __ dsll(at, temp1, 20);
    __ Or(temp1, temp3, at);
    __ Move(double_scratch1, temp2, temp1);
  } else {
    __ dsll(at, temp1, 20);
    __ Or(temp1, temp2, at);
    __ Move(double_scratch1, temp3, temp1);
  }
  __ mul_d(result, result, double_scratch1);
  __ BranchShort(&done);

  __ bind(&zero);
  __ Move(result, kDoubleRegZero);
  __ BranchShort(&done);

  __ bind(&infinity);
  __ ldc1(result, ExpConstant(2, temp3));

  __ bind(&done);
}

#ifdef DEBUG
// nop(CODE_AGE_MARKER_NOP)
static const uint32_t kCodeAgePatchFirstInstruction = 0x00010180;
#endif

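// The "young" code age sequence is the standard frame prologue emitted below
// (Push(ra, fp, cp, a1), padding nops and the fp adjustment). Aged code has
// this sequence replaced by PatchPlatformCodeAge() with a marker nop and a
// call to the code age stub, which GetCodeAgeAndParity() recognizes.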
CodeAgingHelper::CodeAgingHelper() {
  DCHECK(young_sequence_.length() == kNoCodeAgeSequenceLength);
  // Since patcher is a large object, allocate it dynamically when needed,
  // to avoid overloading the stack in stress conditions.
  // DONT_FLUSH is used because the CodeAgingHelper is initialized early in
  // the process, before the MIPS simulator ICache is set up.
  SmartPointer<CodePatcher> patcher(
      new CodePatcher(young_sequence_.start(),
                      young_sequence_.length() / Assembler::kInstrSize,
                      CodePatcher::DONT_FLUSH));
  PredictableCodeSizeScope scope(patcher->masm(), young_sequence_.length());
  patcher->masm()->Push(ra, fp, cp, a1);
  patcher->masm()->nop(Assembler::CODE_AGE_SEQUENCE_NOP);
  patcher->masm()->nop(Assembler::CODE_AGE_SEQUENCE_NOP);
  patcher->masm()->nop(Assembler::CODE_AGE_SEQUENCE_NOP);
  patcher->masm()->Daddu(
      fp, sp, Operand(StandardFrameConstants::kFixedFrameSizeFromFp));
}


#ifdef DEBUG
bool CodeAgingHelper::IsOld(byte* candidate) const {
  return Memory::uint32_at(candidate) == kCodeAgePatchFirstInstruction;
}
#endif


bool Code::IsYoungSequence(Isolate* isolate, byte* sequence) {
  bool result = isolate->code_aging_helper()->IsYoung(sequence);
  DCHECK(result || isolate->code_aging_helper()->IsOld(sequence));
  return result;
}


void Code::GetCodeAgeAndParity(Isolate* isolate, byte* sequence, Age* age,
                               MarkingParity* parity) {
  if (IsYoungSequence(isolate, sequence)) {
    *age = kNoAgeCodeAge;
    *parity = NO_MARKING_PARITY;
  } else {
    Address target_address = Assembler::target_address_at(
        sequence + Assembler::kInstrSize);
    Code* stub = GetCodeFromTargetAddress(target_address);
    GetCodeAgeAndParity(stub, age, parity);
  }
}


void Code::PatchPlatformCodeAge(Isolate* isolate,
                                byte* sequence,
                                Code::Age age,
                                MarkingParity parity) {
  uint32_t young_length = isolate->code_aging_helper()->young_sequence_length();
  if (age == kNoAgeCodeAge) {
    isolate->code_aging_helper()->CopyYoungSequenceTo(sequence);
    CpuFeatures::FlushICache(sequence, young_length);
  } else {
    Code* stub = GetCodeAgeStub(isolate, age, parity);
    CodePatcher patcher(sequence, young_length / Assembler::kInstrSize);
    // Mark this code sequence for FindPlatformCodeAgeSequence().
    patcher.masm()->nop(Assembler::CODE_AGE_MARKER_NOP);
    // Load the stub address to t9 and call it;
    // GetCodeAgeAndParity() extracts the stub address from this instruction.
    patcher.masm()->li(
        t9,
        Operand(reinterpret_cast<uint64_t>(stub->instruction_start())),
        ADDRESS_LOAD);
    patcher.masm()->nop();  // Prevent jalr to jal optimization.
    patcher.masm()->jalr(t9, a0);
    patcher.masm()->nop();  // Branch delay slot nop.
    patcher.masm()->nop();  // Pad the empty space.
  }
}


#undef __

} }  // namespace v8::internal

#endif  // V8_TARGET_ARCH_MIPS64