// CreateMemCopyUint8Function: allocates a page, assembles a MIPS copy routine
// into it with MacroAssembler, switches the page to read+execute and returns
// it cast to MemCopyUint8Function. Returns nullptr if the page allocation
// fails.
// In the emitted code every load reads through a1 and every store writes
// through a0; a2 is tested against size thresholds, so it presumably carries
// the byte count (confirm against the MemCopyUint8Function signature).
// NOTE(review): the embedded line numbers skip, so statements are missing
// from this listing (the body of the USE_SIMULATOR/R6 #if, most label binds,
// else-lines, closing braces). Comments below describe only what is visible.
5 #if V8_TARGET_ARCH_MIPS 9 #include "src/codegen.h" 10 #include "src/macro-assembler.h" 11 #include "src/mips/simulator-mips.h" 18 #if defined(V8_HOST_ARCH_MIPS) 20 MemCopyUint8Function CreateMemCopyUint8Function(MemCopyUint8Function stub) {
21 #if defined(USE_SIMULATOR) || defined(_MIPS_ARCH_MIPS32R6) || \ 22 defined(_MIPS_ARCH_MIPS32RX) 27 byte* buffer = AllocatePage(page_allocator,
// Allocation failure: there is no page to assemble into.
29 if (buffer ==
nullptr)
return nullptr;
// The assembler writes directly into the allocated page.
31 MacroAssembler masm(AssemblerOptions{}, buffer,
static_cast<int>(allocated));
// Branch targets. The ua_-prefixed labels are used by the lwr/lwl based code
// further down (reached via the `unaligned` branch).
36 Label lastb, unaligned, aligned, chkw,
37 loop16w, chk1w, wordCopy_loop, skip_pref, lastbloop,
38 leave, ua_chk16w, ua_loop16w, ua_skip_pref, ua_chkw,
39 ua_chk1w, ua_wordCopy_loop, ua_smallCopy, ua_smallCopy_loop;
// Prefetch geometry checks; pref_chunk, max_pref_size and loadstore_chunk are
// declared in lines not shown here.
48 DCHECK(pref_chunk < max_pref_size);
// pref_limit is subtracted from t0 below (Subu) to form t9.
53 uint32_t pref_limit = (5 * pref_chunk) + max_pref_size;
54 int32_t pref_hint_load = kPrefHintLoadStreamed;
55 int32_t pref_hint_store = kPrefHintPrepareForStore;
// With the PrepareForStore hint, pref_chunk * 4 must be at least
// max_pref_size.
61 DCHECK(pref_hint_store != kPrefHintPrepareForStore ||
62 pref_chunk * 4 >= max_pref_size);
// t2 = (a2 < 2 * loadstore_chunk); if set, go straight to lastb.
66 __ slti(t2, a2, 2 * loadstore_chunk);
67 __ bne(t2, zero_reg, &lastb);
// Low bits of t8 (computed in lines not shown) non-zero -> unaligned path.
75 __ andi(t8, t8, loadstore_chunk - 1);
76 __ bne(t8, zero_reg, &unaligned);
// a3 = (0 - a0) & (loadstore_chunk - 1); zero means a0 already sits on a
// loadstore_chunk boundary, so branch to aligned.
77 __ subu(a3, zero_reg, a0);
79 __ andi(a3, a3, loadstore_chunk - 1);
80 __ beq(a3, zero_reg, &aligned);
// Partial-word copy from a1 to a0: lwr/swr when kArchEndian == kLittle; the
// lwl/swl pair presumably belongs to the else-branch (its line is not shown).
83 if (kArchEndian == kLittle) {
84 __ lwr(t8, MemOperand(a1));
86 __ swr(t8, MemOperand(a0));
89 __ lwl(t8, MemOperand(a1));
91 __ swl(t8, MemOperand(a0));
// t8 = a2 & 0x3F; a2 == t8 means a2 has no bits above the low six, so the
// 16-word loop is skipped in favour of chkw.
99 __ andi(t8, a2, 0x3F);
100 __ beq(a2, t8, &chkw);
109 if (pref_hint_store == kPrefHintPrepareForStore) {
111 __ Subu(t9, t0, pref_limit);
// Prefetch the first four pref_chunk-sized pieces of the source.
114 __ Pref(pref_hint_load, MemOperand(a1, 0 * pref_chunk));
115 __ Pref(pref_hint_load, MemOperand(a1, 1 * pref_chunk));
116 __ Pref(pref_hint_load, MemOperand(a1, 2 * pref_chunk));
117 __ Pref(pref_hint_load, MemOperand(a1, 3 * pref_chunk));
// Destination prefetches are issued up front only for store hints other than
// PrepareForStore.
119 if (pref_hint_store != kPrefHintPrepareForStore) {
120 __ Pref(pref_hint_store, MemOperand(a0, 1 * pref_chunk));
121 __ Pref(pref_hint_store, MemOperand(a0, 2 * pref_chunk));
122 __ Pref(pref_hint_store, MemOperand(a0, 3 * pref_chunk));
125 __ lw(t0, MemOperand(a1));
// With PrepareForStore, the destination prefetches are skipped when v1 > 0
// (v1 is computed in a line not shown). The branch is emitted with
// USE_DELAY_SLOT, so the lw of t1 below presumably fills the delay slot.
127 if (pref_hint_store == kPrefHintPrepareForStore) {
129 __ Branch(USE_DELAY_SLOT, &skip_pref, gt, v1, Operand(zero_reg));
131 __ lw(t1, MemOperand(a1, 1, loadstore_chunk));
133 __ Pref(pref_hint_store, MemOperand(a0, 4 * pref_chunk));
134 __ Pref(pref_hint_store, MemOperand(a0, 5 * pref_chunk));
// Remaining loads of the first eight-word group, then the matching stores.
137 __ lw(t2, MemOperand(a1, 2, loadstore_chunk));
138 __ lw(t3, MemOperand(a1, 3, loadstore_chunk));
139 __ lw(t4, MemOperand(a1, 4, loadstore_chunk));
140 __ lw(t5, MemOperand(a1, 5, loadstore_chunk));
141 __ lw(t6, MemOperand(a1, 6, loadstore_chunk));
142 __ lw(t7, MemOperand(a1, 7, loadstore_chunk));
143 __ Pref(pref_hint_load, MemOperand(a1, 4 * pref_chunk));
145 __ sw(t0, MemOperand(a0));
146 __ sw(t1, MemOperand(a0, 1, loadstore_chunk));
147 __ sw(t2, MemOperand(a0, 2, loadstore_chunk));
148 __ sw(t3, MemOperand(a0, 3, loadstore_chunk));
149 __ sw(t4, MemOperand(a0, 4, loadstore_chunk));
150 __ sw(t5, MemOperand(a0, 5, loadstore_chunk));
151 __ sw(t6, MemOperand(a0, 6, loadstore_chunk));
152 __ sw(t7, MemOperand(a0, 7, loadstore_chunk));
// Second eight-word group (word offsets 8..15), reusing t0-t7.
154 __ lw(t0, MemOperand(a1, 8, loadstore_chunk));
155 __ lw(t1, MemOperand(a1, 9, loadstore_chunk));
156 __ lw(t2, MemOperand(a1, 10, loadstore_chunk));
157 __ lw(t3, MemOperand(a1, 11, loadstore_chunk));
158 __ lw(t4, MemOperand(a1, 12, loadstore_chunk));
159 __ lw(t5, MemOperand(a1, 13, loadstore_chunk));
160 __ lw(t6, MemOperand(a1, 14, loadstore_chunk));
161 __ lw(t7, MemOperand(a1, 15, loadstore_chunk));
162 __ Pref(pref_hint_load, MemOperand(a1, 5 * pref_chunk));
164 __ sw(t0, MemOperand(a0, 8, loadstore_chunk));
165 __ sw(t1, MemOperand(a0, 9, loadstore_chunk));
166 __ sw(t2, MemOperand(a0, 10, loadstore_chunk));
167 __ sw(t3, MemOperand(a0, 11, loadstore_chunk));
168 __ sw(t4, MemOperand(a0, 12, loadstore_chunk));
169 __ sw(t5, MemOperand(a0, 13, loadstore_chunk));
170 __ sw(t6, MemOperand(a0, 14, loadstore_chunk));
171 __ sw(t7, MemOperand(a0, 15, loadstore_chunk));
// Advance a0 by 16 words and loop while a0 != a3. The a1 advance is emitted
// right after the bne, i.e. in its delay slot on MIPS.
172 __ addiu(a0, a0, 16 * loadstore_chunk);
173 __ bne(a0, a3, &loop16w);
174 __ addiu(a1, a1, 16 * loadstore_chunk);
// t8 = a2 & 0x1F; a2 == t8 means no bits above the low five, so the single
// eight-word copy below is skipped in favour of chk1w.
181 __ Pref(pref_hint_load, MemOperand(a1, 0 * pref_chunk));
182 __ andi(t8, a2, 0x1F);
183 __ beq(a2, t8, &chk1w);
// One eight-word group: load all, bump a1, store all, bump a0.
185 __ lw(t0, MemOperand(a1));
186 __ lw(t1, MemOperand(a1, 1, loadstore_chunk));
187 __ lw(t2, MemOperand(a1, 2, loadstore_chunk));
188 __ lw(t3, MemOperand(a1, 3, loadstore_chunk));
189 __ lw(t4, MemOperand(a1, 4, loadstore_chunk));
190 __ lw(t5, MemOperand(a1, 5, loadstore_chunk));
191 __ lw(t6, MemOperand(a1, 6, loadstore_chunk));
192 __ lw(t7, MemOperand(a1, 7, loadstore_chunk));
193 __ addiu(a1, a1, 8 * loadstore_chunk);
194 __ sw(t0, MemOperand(a0));
195 __ sw(t1, MemOperand(a0, 1, loadstore_chunk));
196 __ sw(t2, MemOperand(a0, 2, loadstore_chunk));
197 __ sw(t3, MemOperand(a0, 3, loadstore_chunk));
198 __ sw(t4, MemOperand(a0, 4, loadstore_chunk));
199 __ sw(t5, MemOperand(a0, 5, loadstore_chunk));
200 __ sw(t6, MemOperand(a0, 6, loadstore_chunk));
201 __ sw(t7, MemOperand(a0, 7, loadstore_chunk));
202 __ addiu(a0, a0, 8 * loadstore_chunk);
// a2 = t8 & (loadstore_chunk - 1); if that equals t8 there are no bits at or
// above loadstore_chunk left, so go to lastb.
210 __ andi(a2, t8, loadstore_chunk - 1);
211 __ beq(a2, t8, &lastb);
// Word-at-a-time loop until a0 reaches a3. The store sits after the bne
// (delay slot) and uses word offset -1 because a0 was already advanced.
215 __ bind(&wordCopy_loop);
216 __ lw(t3, MemOperand(a1));
217 __ addiu(a0, a0, loadstore_chunk);
218 __ addiu(a1, a1, loadstore_chunk);
219 __ bne(a0, a3, &wordCopy_loop);
220 __ sw(t3, MemOperand(a0, -1, loadstore_chunk));
// Nothing left to copy when a2 <= 0.
223 __ Branch(&leave, le, a2, Operand(zero_reg));
// Byte loop; the pointer increments are in lines not shown. The sb follows
// the bne and stores at offset -1.
227 __ lb(v1, MemOperand(a1));
230 __ bne(a0, a3, &lastbloop);
231 __ sb(v1, MemOperand(a0, -1));
// a3 masked to the sub-word bits; zero -> ua_chk16w.
241 __ andi(a3, a3, loadstore_chunk - 1);
242 __ beq(a3, zero_reg, &ua_chk16w);
// NOTE(review): the lines holding only a MemOperand(..., offset_minus_one)
// operand here and below are the tail of statements whose opening half is
// missing from this listing.
245 if (kArchEndian == kLittle) {
246 __ lwr(v1, MemOperand(a1));
248 MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
250 __ swr(v1, MemOperand(a0));
253 __ lwl(v1, MemOperand(a1));
255 MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
257 __ swl(v1, MemOperand(a0));
// Same 0x3F test as on the aligned side, branching to ua_chkw.
266 __ andi(t8, a2, 0x3F);
267 __ beq(a2, t8, &ua_chkw);
271 if (pref_hint_store == kPrefHintPrepareForStore) {
273 __ Subu(t9, t0, pref_limit);
276 __ Pref(pref_hint_load, MemOperand(a1, 0 * pref_chunk));
277 __ Pref(pref_hint_load, MemOperand(a1, 1 * pref_chunk));
278 __ Pref(pref_hint_load, MemOperand(a1, 2 * pref_chunk));
280 if (pref_hint_store != kPrefHintPrepareForStore) {
281 __ Pref(pref_hint_store, MemOperand(a0, 1 * pref_chunk));
282 __ Pref(pref_hint_store, MemOperand(a0, 2 * pref_chunk));
283 __ Pref(pref_hint_store, MemOperand(a0, 3 * pref_chunk));
// 16-word loop of the unaligned path: source words are read with lwr (plus
// the truncated offset_minus_one statements), stores are plain sw to a0.
286 __ bind(&ua_loop16w);
287 __ Pref(pref_hint_load, MemOperand(a1, 3 * pref_chunk));
288 if (kArchEndian == kLittle) {
289 __ lwr(t0, MemOperand(a1));
290 __ lwr(t1, MemOperand(a1, 1, loadstore_chunk));
291 __ lwr(t2, MemOperand(a1, 2, loadstore_chunk));
293 if (pref_hint_store == kPrefHintPrepareForStore) {
295 __ Branch(USE_DELAY_SLOT, &ua_skip_pref, gt, v1, Operand(zero_reg));
297 __ lwr(t3, MemOperand(a1, 3, loadstore_chunk));
299 __ Pref(pref_hint_store, MemOperand(a0, 4 * pref_chunk));
300 __ Pref(pref_hint_store, MemOperand(a0, 5 * pref_chunk));
302 __ bind(&ua_skip_pref);
303 __ lwr(t4, MemOperand(a1, 4, loadstore_chunk));
304 __ lwr(t5, MemOperand(a1, 5, loadstore_chunk));
305 __ lwr(t6, MemOperand(a1, 6, loadstore_chunk));
306 __ lwr(t7, MemOperand(a1, 7, loadstore_chunk));
308 MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
310 MemOperand(a1, 2, loadstore_chunk, MemOperand::offset_minus_one));
312 MemOperand(a1, 3, loadstore_chunk, MemOperand::offset_minus_one));
314 MemOperand(a1, 4, loadstore_chunk, MemOperand::offset_minus_one));
316 MemOperand(a1, 5, loadstore_chunk, MemOperand::offset_minus_one));
318 MemOperand(a1, 6, loadstore_chunk, MemOperand::offset_minus_one));
320 MemOperand(a1, 7, loadstore_chunk, MemOperand::offset_minus_one));
322 MemOperand(a1, 8, loadstore_chunk, MemOperand::offset_minus_one));
// Same sequence starting with lwl instead of lwr; presumably the else-branch
// of the kArchEndian test above (the else line is not shown). Both variants
// bind ua_skip_pref, so only one of them can be emitted.
324 __ lwl(t0, MemOperand(a1));
325 __ lwl(t1, MemOperand(a1, 1, loadstore_chunk));
326 __ lwl(t2, MemOperand(a1, 2, loadstore_chunk));
328 if (pref_hint_store == kPrefHintPrepareForStore) {
330 __ Branch(USE_DELAY_SLOT, &ua_skip_pref, gt, v1, Operand(zero_reg));
332 __ lwl(t3, MemOperand(a1, 3, loadstore_chunk));
334 __ Pref(pref_hint_store, MemOperand(a0, 4 * pref_chunk));
335 __ Pref(pref_hint_store, MemOperand(a0, 5 * pref_chunk));
337 __ bind(&ua_skip_pref);
338 __ lwl(t4, MemOperand(a1, 4, loadstore_chunk));
339 __ lwl(t5, MemOperand(a1, 5, loadstore_chunk));
340 __ lwl(t6, MemOperand(a1, 6, loadstore_chunk));
341 __ lwl(t7, MemOperand(a1, 7, loadstore_chunk));
343 MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
345 MemOperand(a1, 2, loadstore_chunk, MemOperand::offset_minus_one));
347 MemOperand(a1, 3, loadstore_chunk, MemOperand::offset_minus_one));
349 MemOperand(a1, 4, loadstore_chunk, MemOperand::offset_minus_one));
351 MemOperand(a1, 5, loadstore_chunk, MemOperand::offset_minus_one));
353 MemOperand(a1, 6, loadstore_chunk, MemOperand::offset_minus_one));
355 MemOperand(a1, 7, loadstore_chunk, MemOperand::offset_minus_one));
357 MemOperand(a1, 8, loadstore_chunk, MemOperand::offset_minus_one));
// Store the first eight assembled words.
359 __ Pref(pref_hint_load, MemOperand(a1, 4 * pref_chunk));
360 __ sw(t0, MemOperand(a0));
361 __ sw(t1, MemOperand(a0, 1, loadstore_chunk));
362 __ sw(t2, MemOperand(a0, 2, loadstore_chunk));
363 __ sw(t3, MemOperand(a0, 3, loadstore_chunk));
364 __ sw(t4, MemOperand(a0, 4, loadstore_chunk));
365 __ sw(t5, MemOperand(a0, 5, loadstore_chunk));
366 __ sw(t6, MemOperand(a0, 6, loadstore_chunk));
367 __ sw(t7, MemOperand(a0, 7, loadstore_chunk));
// Second eight-word group (word offsets 8..15) of the unaligned loop.
368 if (kArchEndian == kLittle) {
369 __ lwr(t0, MemOperand(a1, 8, loadstore_chunk));
370 __ lwr(t1, MemOperand(a1, 9, loadstore_chunk));
371 __ lwr(t2, MemOperand(a1, 10, loadstore_chunk));
372 __ lwr(t3, MemOperand(a1, 11, loadstore_chunk));
373 __ lwr(t4, MemOperand(a1, 12, loadstore_chunk));
374 __ lwr(t5, MemOperand(a1, 13, loadstore_chunk));
375 __ lwr(t6, MemOperand(a1, 14, loadstore_chunk));
376 __ lwr(t7, MemOperand(a1, 15, loadstore_chunk));
378 MemOperand(a1, 9, loadstore_chunk, MemOperand::offset_minus_one));
380 MemOperand(a1, 10, loadstore_chunk, MemOperand::offset_minus_one));
382 MemOperand(a1, 11, loadstore_chunk, MemOperand::offset_minus_one));
384 MemOperand(a1, 12, loadstore_chunk, MemOperand::offset_minus_one));
386 MemOperand(a1, 13, loadstore_chunk, MemOperand::offset_minus_one));
388 MemOperand(a1, 14, loadstore_chunk, MemOperand::offset_minus_one));
390 MemOperand(a1, 15, loadstore_chunk, MemOperand::offset_minus_one));
392 MemOperand(a1, 16, loadstore_chunk, MemOperand::offset_minus_one));
394 __ lwl(t0, MemOperand(a1, 8, loadstore_chunk));
395 __ lwl(t1, MemOperand(a1, 9, loadstore_chunk));
396 __ lwl(t2, MemOperand(a1, 10, loadstore_chunk));
397 __ lwl(t3, MemOperand(a1, 11, loadstore_chunk));
398 __ lwl(t4, MemOperand(a1, 12, loadstore_chunk));
399 __ lwl(t5, MemOperand(a1, 13, loadstore_chunk));
400 __ lwl(t6, MemOperand(a1, 14, loadstore_chunk));
401 __ lwl(t7, MemOperand(a1, 15, loadstore_chunk));
403 MemOperand(a1, 9, loadstore_chunk, MemOperand::offset_minus_one));
405 MemOperand(a1, 10, loadstore_chunk, MemOperand::offset_minus_one));
407 MemOperand(a1, 11, loadstore_chunk, MemOperand::offset_minus_one));
409 MemOperand(a1, 12, loadstore_chunk, MemOperand::offset_minus_one));
411 MemOperand(a1, 13, loadstore_chunk, MemOperand::offset_minus_one));
413 MemOperand(a1, 14, loadstore_chunk, MemOperand::offset_minus_one));
415 MemOperand(a1, 15, loadstore_chunk, MemOperand::offset_minus_one));
417 MemOperand(a1, 16, loadstore_chunk, MemOperand::offset_minus_one));
419 __ Pref(pref_hint_load, MemOperand(a1, 5 * pref_chunk));
420 __ sw(t0, MemOperand(a0, 8, loadstore_chunk));
421 __ sw(t1, MemOperand(a0, 9, loadstore_chunk));
422 __ sw(t2, MemOperand(a0, 10, loadstore_chunk));
423 __ sw(t3, MemOperand(a0, 11, loadstore_chunk));
424 __ sw(t4, MemOperand(a0, 12, loadstore_chunk));
425 __ sw(t5, MemOperand(a0, 13, loadstore_chunk));
426 __ sw(t6, MemOperand(a0, 14, loadstore_chunk));
427 __ sw(t7, MemOperand(a0, 15, loadstore_chunk));
// Loop while a0 != a3; the a1 advance follows the bne (delay slot).
428 __ addiu(a0, a0, 16 * loadstore_chunk);
429 __ bne(a0, a3, &ua_loop16w);
430 __ addiu(a1, a1, 16 * loadstore_chunk);
// Same 0x1F test as on the aligned side, branching to ua_chk1w.
437 __ Pref(pref_hint_load, MemOperand(a1));
438 __ andi(t8, a2, 0x1F);
440 __ beq(a2, t8, &ua_chk1w);
// Single eight-word group of the unaligned path.
442 if (kArchEndian == kLittle) {
443 __ lwr(t0, MemOperand(a1));
444 __ lwr(t1, MemOperand(a1, 1, loadstore_chunk));
445 __ lwr(t2, MemOperand(a1, 2, loadstore_chunk));
446 __ lwr(t3, MemOperand(a1, 3, loadstore_chunk));
447 __ lwr(t4, MemOperand(a1, 4, loadstore_chunk));
448 __ lwr(t5, MemOperand(a1, 5, loadstore_chunk));
449 __ lwr(t6, MemOperand(a1, 6, loadstore_chunk));
450 __ lwr(t7, MemOperand(a1, 7, loadstore_chunk));
452 MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
454 MemOperand(a1, 2, loadstore_chunk, MemOperand::offset_minus_one));
456 MemOperand(a1, 3, loadstore_chunk, MemOperand::offset_minus_one));
458 MemOperand(a1, 4, loadstore_chunk, MemOperand::offset_minus_one));
460 MemOperand(a1, 5, loadstore_chunk, MemOperand::offset_minus_one));
462 MemOperand(a1, 6, loadstore_chunk, MemOperand::offset_minus_one));
464 MemOperand(a1, 7, loadstore_chunk, MemOperand::offset_minus_one));
466 MemOperand(a1, 8, loadstore_chunk, MemOperand::offset_minus_one));
468 __ lwl(t0, MemOperand(a1));
469 __ lwl(t1, MemOperand(a1, 1, loadstore_chunk));
470 __ lwl(t2, MemOperand(a1, 2, loadstore_chunk));
471 __ lwl(t3, MemOperand(a1, 3, loadstore_chunk));
472 __ lwl(t4, MemOperand(a1, 4, loadstore_chunk));
473 __ lwl(t5, MemOperand(a1, 5, loadstore_chunk));
474 __ lwl(t6, MemOperand(a1, 6, loadstore_chunk));
475 __ lwl(t7, MemOperand(a1, 7, loadstore_chunk));
477 MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
479 MemOperand(a1, 2, loadstore_chunk, MemOperand::offset_minus_one));
481 MemOperand(a1, 3, loadstore_chunk, MemOperand::offset_minus_one));
483 MemOperand(a1, 4, loadstore_chunk, MemOperand::offset_minus_one));
485 MemOperand(a1, 5, loadstore_chunk, MemOperand::offset_minus_one));
487 MemOperand(a1, 6, loadstore_chunk, MemOperand::offset_minus_one));
489 MemOperand(a1, 7, loadstore_chunk, MemOperand::offset_minus_one));
491 MemOperand(a1, 8, loadstore_chunk, MemOperand::offset_minus_one));
493 __ addiu(a1, a1, 8 * loadstore_chunk);
494 __ sw(t0, MemOperand(a0));
495 __ sw(t1, MemOperand(a0, 1, loadstore_chunk));
496 __ sw(t2, MemOperand(a0, 2, loadstore_chunk));
497 __ sw(t3, MemOperand(a0, 3, loadstore_chunk));
498 __ sw(t4, MemOperand(a0, 4, loadstore_chunk));
499 __ sw(t5, MemOperand(a0, 5, loadstore_chunk));
500 __ sw(t6, MemOperand(a0, 6, loadstore_chunk));
501 __ sw(t7, MemOperand(a0, 7, loadstore_chunk));
502 __ addiu(a0, a0, 8 * loadstore_chunk);
// a2 = t8 & (loadstore_chunk - 1); equal to t8 means no whole word remains,
// so go to ua_smallCopy.
507 __ andi(a2, t8, loadstore_chunk - 1);
508 __ beq(a2, t8, &ua_smallCopy);
// Word loop of the unaligned path; the sw after the bne (delay slot) uses
// word offset -1 because a0 was already advanced.
512 __ bind(&ua_wordCopy_loop);
513 if (kArchEndian == kLittle) {
514 __ lwr(v1, MemOperand(a1));
516 MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
518 __ lwl(v1, MemOperand(a1));
520 MemOperand(a1, 1, loadstore_chunk, MemOperand::offset_minus_one));
522 __ addiu(a0, a0, loadstore_chunk);
523 __ addiu(a1, a1, loadstore_chunk);
524 __ bne(a0, a3, &ua_wordCopy_loop);
525 __ sw(v1, MemOperand(a0, -1, loadstore_chunk));
// Trailing bytes: leave immediately when a2 == 0, otherwise copy byte by
// byte (pointer increments are in lines not shown).
528 __ bind(&ua_smallCopy);
529 __ beq(a2, zero_reg, &leave);
532 __ bind(&ua_smallCopy_loop);
533 __ lb(v1, MemOperand(a1));
536 __ bne(a0, a3, &ua_smallCopy_loop);
537 __ sb(v1, MemOperand(a0, -1));
// Finalize: fetch the code descriptor (desc is declared in a line not
// shown), assert it needs no relocation after codegen, flush the instruction
// cache for the page, then make the page read+execute. SetPermissions
// failure is fatal (CHECK).
543 masm.GetCode(
nullptr, &desc);
544 DCHECK(!RelocInfo::RequiresRelocationAfterCodegen(desc));
546 Assembler::FlushICache(buffer, allocated);
547 CHECK(SetPermissions(page_allocator, buffer, allocated,
548 PageAllocator::kReadExecute));
549 return FUNCTION_CAST<MemCopyUint8Function>(buffer);
// CreateSqrtFunction: allocates a page, assembles a small stub into it and
// returns the page cast to UnaryMathFunction. Returns nullptr if the page
// allocation fails.
// NOTE(review): the embedded line numbers skip. The body of the
// USE_SIMULATOR #if, the instruction between MovFromFloatParameter and
// MovToFloatResult (presumably the square root itself), the return sequence,
// the declaration of desc and the closing braces are not shown.
554 UnaryMathFunction CreateSqrtFunction() {
555 #if defined(USE_SIMULATOR) 559 size_t allocated = 0;
560 byte* buffer = AllocatePage(page_allocator,
// Allocation failure: there is no page to assemble into.
562 if (buffer ==
nullptr)
return nullptr;
// The assembler writes directly into the allocated page.
564 MacroAssembler masm(AssemblerOptions{}, buffer,
static_cast<int>(allocated));
// Move the floating-point argument into f12; the result is handed back
// from f0.
566 __ MovFromFloatParameter(f12);
568 __ MovToFloatResult(f0);
// Finalize: fetch the code descriptor, assert it needs no relocation after
// codegen, flush the instruction cache for the page, then make the page
// read+execute. SetPermissions failure is fatal (CHECK).
572 masm.GetCode(
nullptr, &desc);
573 DCHECK(!RelocInfo::RequiresRelocationAfterCodegen(desc));
575 Assembler::FlushICache(buffer, allocated);
576 CHECK(SetPermissions(page_allocator, buffer, allocated,
577 PageAllocator::kReadExecute));
578 return FUNCTION_CAST<UnaryMathFunction>(buffer);
587 #endif // V8_TARGET_ARCH_MIPS
// NOTE(review): stray pure-virtual declaration placed after the file's final
// #endif, with no enclosing class visible and no terminating semicolon.
// Presumably residue from an allocator interface header rather than part of
// this file; confirm before keeping.
virtual void * GetRandomMmapAddr()=0