311 __ mov(r19_sender_sp, sp);
312 __ blr(c_rarg4);
313
314 // we do this here because the notify will already have been done
315 // if we get to the next instruction via an exception
316 //
317 // n.b. adding this instruction here affects the calculation of
318 // whether or not a routine returns to the call stub (used when
319 // doing stack walks) since the normal test is to check the return
320 // pc against the address saved below. so we may need to allow for
321 // this extra instruction in the check.
322
323 // save current address for use by exception handling code
324
325 return_address = __ pc();
326
327 // store result depending on type (everything that is not
328 // T_OBJECT, T_LONG, T_FLOAT or T_DOUBLE is treated as T_INT)
329 // n.b. this assumes Java returns an integral result in r0
330 // and a floating result in j_farg0
331 __ ldr(j_rarg2, result);
332 Label is_long, is_float, is_double, exit;
333 __ ldr(j_rarg1, result_type);
334 __ cmp(j_rarg1, (u1)T_OBJECT);
335 __ br(Assembler::EQ, is_long);
336 __ cmp(j_rarg1, (u1)T_LONG);
337 __ br(Assembler::EQ, is_long);
338 __ cmp(j_rarg1, (u1)T_FLOAT);
339 __ br(Assembler::EQ, is_float);
340 __ cmp(j_rarg1, (u1)T_DOUBLE);
341 __ br(Assembler::EQ, is_double);
342
343 // handle T_INT case
344 __ strw(r0, Address(j_rarg2));
345
346 __ BIND(exit);
347
348 // pop parameters
349 __ sub(esp, rfp, -sp_after_call_off * wordSize);
350
351 #ifdef ASSERT
352 // verify that threads correspond
353 {
354 Label L, S;
355 __ ldr(rscratch1, thread);
356 __ cmp(rthread, rscratch1);
357 __ br(Assembler::NE, S);
358 __ get_thread(rscratch1);
359 __ cmp(rthread, rscratch1);
360 __ br(Assembler::EQ, L);
361 __ BIND(S);
362 __ stop("StubRoutines::call_stub: threads must correspond");
363 __ BIND(L);
364 }
376 __ ldp(r26, r25, r26_save);
377 __ ldp(r24, r23, r24_save);
378 __ ldp(r22, r21, r22_save);
379 __ ldp(r20, r19, r20_save);
380
381 // restore fpcr
382 __ ldr(rscratch1, fpcr_save);
383 __ set_fpcr(rscratch1);
384
385 __ ldp(c_rarg0, c_rarg1, call_wrapper);
386 __ ldrw(c_rarg2, result_type);
387 __ ldr(c_rarg3, method);
388 __ ldp(c_rarg4, c_rarg5, entry_point);
389 __ ldp(c_rarg6, c_rarg7, parameter_size);
390
391 // leave frame and return to caller
392 __ leave();
393 __ ret(lr);
394
395 // handle return types different from T_INT
396
397 __ BIND(is_long);
398 __ str(r0, Address(j_rarg2, 0));
399 __ br(Assembler::AL, exit);
400
401 __ BIND(is_float);
402 __ strs(j_farg0, Address(j_rarg2, 0));
403 __ br(Assembler::AL, exit);
404
405 __ BIND(is_double);
406 __ strd(j_farg0, Address(j_rarg2, 0));
407 __ br(Assembler::AL, exit);
408
409 return start;
410 }
411
412 // Return point for a Java call if there's an exception thrown in
413 // Java code. The exception is caught and transformed into a
414 // pending exception stored in JavaThread that can be tested from
415 // within the VM.
416 //
417 // Note: Usually the parameters are removed by the callee. In case
418 // of an exception crossing an activation frame boundary, that is
419 // not the case if the callee is compiled code => need to setup the
420 // rsp.
421 //
422 // r0: exception oop
423
424 address generate_catch_exception() {
425 StubGenStubId stub_id = StubGenStubId::catch_exception_id;
426 StubCodeMark mark(this, stub_id);
2207 // |array_tag| | header_size | element_type | |log2_element_size|
2208 // 32 30 24 16 8 2 0
2209 //
2210 // array_tag: typeArray = 0x3, objArray = 0x2, non-array = 0x0
2211 //
2212
2213 const int lh_offset = in_bytes(Klass::layout_helper_offset());
2214
2215 // Handle objArrays completely differently...
2216 const jint objArray_lh = Klass::array_layout_helper(T_OBJECT);
2217 __ ldrw(lh, Address(scratch_src_klass, lh_offset));
2218 __ movw(rscratch1, objArray_lh);
2219 __ eorw(rscratch2, lh, rscratch1);
2220 __ cbzw(rscratch2, L_objArray);
2221
2222 // if (src->klass() != dst->klass()) return -1;
2223 __ load_klass(rscratch2, dst);
2224 __ eor(rscratch2, rscratch2, scratch_src_klass);
2225 __ cbnz(rscratch2, L_failed);
2226
2227 // if (!src->is_Array()) return -1;
2228 __ tbz(lh, 31, L_failed); // i.e. (lh >= 0)
2229
2230 // At this point, it is known to be a typeArray (array_tag 0x3).
2231 #ifdef ASSERT
2232 {
2233 BLOCK_COMMENT("assert primitive array {");
2234 Label L;
2235 __ movw(rscratch2, Klass::_lh_array_tag_type_value << Klass::_lh_array_tag_shift);
2236 __ cmpw(lh, rscratch2);
2237 __ br(Assembler::GE, L);
2238 __ stop("must be a primitive array");
2239 __ bind(L);
2240 BLOCK_COMMENT("} assert primitive array done");
2241 }
2242 #endif
2243
2244 arraycopy_range_checks(src, src_pos, dst, dst_pos, scratch_length,
2245 rscratch2, L_failed);
2246
10441 gen_cas_entry(MacroAssembler::xword, memory_order_relaxed);
10442
10443 AtomicStubMark mark_cmpxchg_4_release
10444 (_masm, &aarch64_atomic_cmpxchg_4_release_impl);
10445 gen_cas_entry(MacroAssembler::word, memory_order_release);
10446 AtomicStubMark mark_cmpxchg_8_release
10447 (_masm, &aarch64_atomic_cmpxchg_8_release_impl);
10448 gen_cas_entry(MacroAssembler::xword, memory_order_release);
10449
10450 AtomicStubMark mark_cmpxchg_4_seq_cst
10451 (_masm, &aarch64_atomic_cmpxchg_4_seq_cst_impl);
10452 gen_cas_entry(MacroAssembler::word, memory_order_seq_cst);
10453 AtomicStubMark mark_cmpxchg_8_seq_cst
10454 (_masm, &aarch64_atomic_cmpxchg_8_seq_cst_impl);
10455 gen_cas_entry(MacroAssembler::xword, memory_order_seq_cst);
10456
10457 ICache::invalidate_range(first_entry, __ pc() - first_entry);
10458 }
10459 #endif // LINUX
10460
10461 address generate_cont_thaw(Continuation::thaw_kind kind) {
10462 bool return_barrier = Continuation::is_thaw_return_barrier(kind);
10463 bool return_barrier_exception = Continuation::is_thaw_return_barrier_exception(kind);
10464
10465 address start = __ pc();
10466
10467 if (return_barrier) {
10468 __ ldr(rscratch1, Address(rthread, JavaThread::cont_entry_offset()));
10469 __ mov(sp, rscratch1);
10470 }
10471 assert_asm(_masm, (__ ldr(rscratch1, Address(rthread, JavaThread::cont_entry_offset())), __ cmp(sp, rscratch1)), Assembler::EQ, "incorrect sp");
10472
10473 if (return_barrier) {
10474 // preserve possible return value from a method returning to the return barrier
10475 __ fmovd(rscratch1, v0);
10476 __ stp(rscratch1, r0, Address(__ pre(sp, -2 * wordSize)));
10477 }
10478
10479 __ movw(c_rarg1, (return_barrier ? 1 : 0));
10480 __ call_VM_leaf(CAST_FROM_FN_PTR(address, Continuation::prepare_thaw), rthread, c_rarg1);
10481 __ mov(rscratch2, r0); // r0 contains the size of the frames to thaw, 0 if overflow or no more frames
10482
10483 if (return_barrier) {
10484 // restore return value (no safepoint in the call to thaw, so even an oop return value should be OK)
10485 __ ldp(rscratch1, r0, Address(__ post(sp, 2 * wordSize)));
10486 __ fmovd(v0, rscratch1);
10487 }
10488 assert_asm(_masm, (__ ldr(rscratch1, Address(rthread, JavaThread::cont_entry_offset())), __ cmp(sp, rscratch1)), Assembler::EQ, "incorrect sp");
10489
10490
10491 Label thaw_success;
10492 // rscratch2 contains the size of the frames to thaw, 0 if overflow or no more frames
10493 __ cbnz(rscratch2, thaw_success);
10494 __ lea(rscratch1, RuntimeAddress(SharedRuntime::throw_StackOverflowError_entry()));
10495 __ br(rscratch1);
10496 __ bind(thaw_success);
10497
10498 // make room for the thawed frames
10499 __ sub(rscratch1, sp, rscratch2);
10500 __ andr(rscratch1, rscratch1, -16); // align
10501 __ mov(sp, rscratch1);
10502
10503 if (return_barrier) {
10504 // save original return value -- again
10505 __ fmovd(rscratch1, v0);
10506 __ stp(rscratch1, r0, Address(__ pre(sp, -2 * wordSize)));
10507 }
10508
10509 // If we want, we can templatize thaw by kind, and have three different entries
10510 __ movw(c_rarg1, (uint32_t)kind);
10511
10512 __ call_VM_leaf(Continuation::thaw_entry(), rthread, c_rarg1);
10513 __ mov(rscratch2, r0); // r0 is the sp of the yielding frame
10514
10515 if (return_barrier) {
10516 // restore return value (no safepoint in the call to thaw, so even an oop return value should be OK)
10517 __ ldp(rscratch1, r0, Address(__ post(sp, 2 * wordSize)));
10518 __ fmovd(v0, rscratch1);
10519 } else {
10520 __ mov(r0, zr); // return 0 (success) from doYield
10521 }
10522
10523 // we're now on the yield frame (which is in an address above us b/c rsp has been pushed down)
10524 __ sub(sp, rscratch2, 2*wordSize); // now pointing to rfp spill
10525 __ mov(rfp, sp);
10526
10527 if (return_barrier_exception) {
10528 __ ldr(c_rarg1, Address(rfp, wordSize)); // return address
10529 __ authenticate_return_address(c_rarg1);
10530 __ verify_oop(r0);
10531 // save return value containing the exception oop in callee-saved R19
10532 __ mov(r19, r0);
10533
10534 __ call_VM_leaf(CAST_FROM_FN_PTR(address, SharedRuntime::exception_handler_for_return_address), rthread, c_rarg1);
10535
10536 // Reinitialize the ptrue predicate register, in case the external runtime call clobbers ptrue reg, as we may return to SVE compiled code.
10537 // __ reinitialize_ptrue();
10538
11635 // assert(Ra == Pa_base[j], "must be");
11636 // MACC(Ra, Ra, t0, t1, t2);
11637 // }
11638 // iters = (2*len-i)/2;
11639 // assert(iters == len-j, "must be");
11640 // for (; iters--; j++) {
11641 // assert(Rm == Pm_base[j] && Rn == Pn_base[i-j], "must be");
11642 // MACC(Rm, Rn, t0, t1, t2);
11643 // Rm = *++Pm;
11644 // Rn = *--Pn;
11645 // }
11646 // Pm_base[i-len] = t0;
11647 // t0 = t1; t1 = t2; t2 = 0;
11648 // }
11649
11650 // while (t0)
11651 // t0 = sub(Pm_base, Pn_base, t0, len);
11652 // }
11653 };
11654
11655 // Initialization
11656 void generate_preuniverse_stubs() {
11657 // preuniverse stubs are not needed for aarch64
11658 }
11659
11660 void generate_initial_stubs() {
11661 // Generate initial stubs and initializes the entry points
11662
11663 // entry points that exist in all platforms Note: This is code
11664 // that could be shared among different platforms - however the
11665 // benefit seems to be smaller than the disadvantage of having a
11666 // much more complicated generator structure. See also comment in
11667 // stubRoutines.hpp.
11668
11669 StubRoutines::_forward_exception_entry = generate_forward_exception();
11670
11671 StubRoutines::_call_stub_entry =
11672 generate_call_stub(StubRoutines::_call_stub_return_address);
11673
11674 // is referenced by megamorphic call
11685 StubRoutines::_updateBytesCRC32 = generate_updateBytesCRC32();
11686 }
11687
11688 if (UseCRC32CIntrinsics) {
11689 StubRoutines::_updateBytesCRC32C = generate_updateBytesCRC32C();
11690 }
11691
11692 if (vmIntrinsics::is_intrinsic_available(vmIntrinsics::_dsin)) {
11693 StubRoutines::_dsin = generate_dsin_dcos(/* isCos = */ false);
11694 }
11695
11696 if (vmIntrinsics::is_intrinsic_available(vmIntrinsics::_dcos)) {
11697 StubRoutines::_dcos = generate_dsin_dcos(/* isCos = */ true);
11698 }
11699
11700 if (vmIntrinsics::is_intrinsic_available(vmIntrinsics::_float16ToFloat) &&
11701 vmIntrinsics::is_intrinsic_available(vmIntrinsics::_floatToFloat16)) {
11702 StubRoutines::_hf2f = generate_float16ToFloat();
11703 StubRoutines::_f2hf = generate_floatToFloat16();
11704 }
11705 }
11706
11707 void generate_continuation_stubs() {
11708 // Continuation stubs:
11709 StubRoutines::_cont_thaw = generate_cont_thaw();
11710 StubRoutines::_cont_returnBarrier = generate_cont_returnBarrier();
11711 StubRoutines::_cont_returnBarrierExc = generate_cont_returnBarrier_exception();
11712 StubRoutines::_cont_preempt_stub = generate_cont_preempt_stub();
11713 }
11714
11715 void generate_final_stubs() {
11716 // support for verify_oop (must happen after universe_init)
11717 if (VerifyOops) {
11718 StubRoutines::_verify_oop_subroutine_entry = generate_verify_oop();
11719 }
11720
11721 // arraycopy stubs used by compilers
11722 generate_arraycopy_stubs();
11723
11724 StubRoutines::_method_entry_barrier = generate_method_entry_barrier();
|
311 __ mov(r19_sender_sp, sp);
312 __ blr(c_rarg4);
313
314 // we do this here because the notify will already have been done
315 // if we get to the next instruction via an exception
316 //
317 // n.b. adding this instruction here affects the calculation of
318 // whether or not a routine returns to the call stub (used when
319 // doing stack walks) since the normal test is to check the return
320 // pc against the address saved below. so we may need to allow for
321 // this extra instruction in the check.
322
323 // save current address for use by exception handling code
324
325 return_address = __ pc();
326
327 // store result depending on type (everything that is not
328 // T_OBJECT, T_LONG, T_FLOAT or T_DOUBLE is treated as T_INT)
329 // n.b. this assumes Java returns an integral result in r0
330 // and a floating result in j_farg0
331 // All of j_rargN may be used to return inline type fields so be careful
332 // not to clobber those.
333 // SharedRuntime::generate_buffered_inline_type_adapter() knows the register
334 // assignment of Rresult below.
335 Register Rresult = r14, Rresult_type = r15;
336 __ ldr(Rresult, result);
337 Label is_long, is_float, is_double, check_prim, exit;
338 __ ldr(Rresult_type, result_type);
339 __ cmp(Rresult_type, (u1)T_OBJECT);
340 __ br(Assembler::EQ, check_prim);
341 __ cmp(Rresult_type, (u1)T_LONG);
342 __ br(Assembler::EQ, is_long);
343 __ cmp(Rresult_type, (u1)T_FLOAT);
344 __ br(Assembler::EQ, is_float);
345 __ cmp(Rresult_type, (u1)T_DOUBLE);
346 __ br(Assembler::EQ, is_double);
347
348 // handle T_INT case
349 __ strw(r0, Address(Rresult));
350
351 __ BIND(exit);
352
353 // pop parameters
354 __ sub(esp, rfp, -sp_after_call_off * wordSize);
355
356 #ifdef ASSERT
357 // verify that threads correspond
358 {
359 Label L, S;
360 __ ldr(rscratch1, thread);
361 __ cmp(rthread, rscratch1);
362 __ br(Assembler::NE, S);
363 __ get_thread(rscratch1);
364 __ cmp(rthread, rscratch1);
365 __ br(Assembler::EQ, L);
366 __ BIND(S);
367 __ stop("StubRoutines::call_stub: threads must correspond");
368 __ BIND(L);
369 }
381 __ ldp(r26, r25, r26_save);
382 __ ldp(r24, r23, r24_save);
383 __ ldp(r22, r21, r22_save);
384 __ ldp(r20, r19, r20_save);
385
386 // restore fpcr
387 __ ldr(rscratch1, fpcr_save);
388 __ set_fpcr(rscratch1);
389
390 __ ldp(c_rarg0, c_rarg1, call_wrapper);
391 __ ldrw(c_rarg2, result_type);
392 __ ldr(c_rarg3, method);
393 __ ldp(c_rarg4, c_rarg5, entry_point);
394 __ ldp(c_rarg6, c_rarg7, parameter_size);
395
396 // leave frame and return to caller
397 __ leave();
398 __ ret(lr);
399
400 // handle return types different from T_INT
401 __ BIND(check_prim);
402 if (InlineTypeReturnedAsFields) {
403 // Check for scalarized return value
404 __ tbz(r0, 0, is_long);
405 // Load pack handler address
406 __ andr(rscratch1, r0, -2);
407 __ ldr(rscratch1, Address(rscratch1, InstanceKlass::adr_inlineklass_fixed_block_offset()));
408 __ ldr(rscratch1, Address(rscratch1, InlineKlass::pack_handler_jobject_offset()));
409 __ blr(rscratch1);
410 __ b(exit);
411 }
412
413 __ BIND(is_long);
414 __ str(r0, Address(Rresult, 0));
415 __ br(Assembler::AL, exit);
416
417 __ BIND(is_float);
418 __ strs(j_farg0, Address(Rresult, 0));
419 __ br(Assembler::AL, exit);
420
421 __ BIND(is_double);
422 __ strd(j_farg0, Address(Rresult, 0));
423 __ br(Assembler::AL, exit);
424
425 return start;
426 }
427
428 // Return point for a Java call if there's an exception thrown in
429 // Java code. The exception is caught and transformed into a
430 // pending exception stored in JavaThread that can be tested from
431 // within the VM.
432 //
433 // Note: Usually the parameters are removed by the callee. In case
434 // of an exception crossing an activation frame boundary, that is
435 // not the case if the callee is compiled code => need to setup the
436 // rsp.
437 //
438 // r0: exception oop
439
440 address generate_catch_exception() {
441 StubGenStubId stub_id = StubGenStubId::catch_exception_id;
442 StubCodeMark mark(this, stub_id);
2223 // |array_tag| | header_size | element_type | |log2_element_size|
2224 // 32 30 24 16 8 2 0
2225 //
2226 // array_tag: typeArray = 0x3, objArray = 0x2, non-array = 0x0
2227 //
2228
2229 const int lh_offset = in_bytes(Klass::layout_helper_offset());
2230
2231 // Handle objArrays completely differently...
2232 const jint objArray_lh = Klass::array_layout_helper(T_OBJECT);
2233 __ ldrw(lh, Address(scratch_src_klass, lh_offset));
2234 __ movw(rscratch1, objArray_lh);
2235 __ eorw(rscratch2, lh, rscratch1);
2236 __ cbzw(rscratch2, L_objArray);
2237
2238 // if (src->klass() != dst->klass()) return -1;
2239 __ load_klass(rscratch2, dst);
2240 __ eor(rscratch2, rscratch2, scratch_src_klass);
2241 __ cbnz(rscratch2, L_failed);
2242
2243 // Check for flat inline type array -> return -1
2244 __ test_flat_array_oop(src, rscratch2, L_failed);
2245
2246 // Check for null-free (non-flat) inline type array -> handle as object array
2247 __ test_null_free_array_oop(src, rscratch2, L_objArray);
2248
2249 // if (!src->is_Array()) return -1;
2250 __ tbz(lh, 31, L_failed); // i.e. (lh >= 0)
2251
2252 // At this point, it is known to be a typeArray (array_tag 0x3).
2253 #ifdef ASSERT
2254 {
2255 BLOCK_COMMENT("assert primitive array {");
2256 Label L;
2257 __ movw(rscratch2, Klass::_lh_array_tag_type_value << Klass::_lh_array_tag_shift);
2258 __ cmpw(lh, rscratch2);
2259 __ br(Assembler::GE, L);
2260 __ stop("must be a primitive array");
2261 __ bind(L);
2262 BLOCK_COMMENT("} assert primitive array done");
2263 }
2264 #endif
2265
2266 arraycopy_range_checks(src, src_pos, dst, dst_pos, scratch_length,
2267 rscratch2, L_failed);
2268
10463 gen_cas_entry(MacroAssembler::xword, memory_order_relaxed);
10464
10465 AtomicStubMark mark_cmpxchg_4_release
10466 (_masm, &aarch64_atomic_cmpxchg_4_release_impl);
10467 gen_cas_entry(MacroAssembler::word, memory_order_release);
10468 AtomicStubMark mark_cmpxchg_8_release
10469 (_masm, &aarch64_atomic_cmpxchg_8_release_impl);
10470 gen_cas_entry(MacroAssembler::xword, memory_order_release);
10471
10472 AtomicStubMark mark_cmpxchg_4_seq_cst
10473 (_masm, &aarch64_atomic_cmpxchg_4_seq_cst_impl);
10474 gen_cas_entry(MacroAssembler::word, memory_order_seq_cst);
10475 AtomicStubMark mark_cmpxchg_8_seq_cst
10476 (_masm, &aarch64_atomic_cmpxchg_8_seq_cst_impl);
10477 gen_cas_entry(MacroAssembler::xword, memory_order_seq_cst);
10478
10479 ICache::invalidate_range(first_entry, __ pc() - first_entry);
10480 }
10481 #endif // LINUX
10482
10483 static void save_return_registers(MacroAssembler* masm) {
10484 if (InlineTypeReturnedAsFields) {
10485 masm->push(RegSet::range(r0, r7), sp);
10486 masm->sub(sp, sp, 4 * wordSize);
10487 masm->st1(v0, v1, v2, v3, masm->T1D, Address(sp));
10488 masm->sub(sp, sp, 4 * wordSize);
10489 masm->st1(v4, v5, v6, v7, masm->T1D, Address(sp));
10490 } else {
10491 masm->fmovd(rscratch1, v0);
10492 masm->stp(rscratch1, r0, Address(masm->pre(sp, -2 * wordSize)));
10493 }
10494 }
10495
10496 static void restore_return_registers(MacroAssembler* masm) {
10497 if (InlineTypeReturnedAsFields) {
10498 masm->ld1(v4, v5, v6, v7, masm->T1D, Address(masm->post(sp, 4 * wordSize)));
10499 masm->ld1(v0, v1, v2, v3, masm->T1D, Address(masm->post(sp, 4 * wordSize)));
10500 masm->pop(RegSet::range(r0, r7), sp);
10501 } else {
10502 masm->ldp(rscratch1, r0, Address(masm->post(sp, 2 * wordSize)));
10503 masm->fmovd(v0, rscratch1);
10504 }
10505 }
10506
10507 address generate_cont_thaw(Continuation::thaw_kind kind) {
10508 bool return_barrier = Continuation::is_thaw_return_barrier(kind);
10509 bool return_barrier_exception = Continuation::is_thaw_return_barrier_exception(kind);
10510
10511 address start = __ pc();
10512
10513 if (return_barrier) {
10514 __ ldr(rscratch1, Address(rthread, JavaThread::cont_entry_offset()));
10515 __ mov(sp, rscratch1);
10516 }
10517 assert_asm(_masm, (__ ldr(rscratch1, Address(rthread, JavaThread::cont_entry_offset())), __ cmp(sp, rscratch1)), Assembler::EQ, "incorrect sp");
10518
10519 if (return_barrier) {
10520 // preserve possible return value from a method returning to the return barrier
10521 save_return_registers(_masm);
10522 }
10523
10524 __ movw(c_rarg1, (return_barrier ? 1 : 0));
10525 __ call_VM_leaf(CAST_FROM_FN_PTR(address, Continuation::prepare_thaw), rthread, c_rarg1);
10526 __ mov(rscratch2, r0); // r0 contains the size of the frames to thaw, 0 if overflow or no more frames
10527
10528 if (return_barrier) {
10529 // restore return value (no safepoint in the call to thaw, so even an oop return value should be OK)
10530 restore_return_registers(_masm);
10531 }
10532 assert_asm(_masm, (__ ldr(rscratch1, Address(rthread, JavaThread::cont_entry_offset())), __ cmp(sp, rscratch1)), Assembler::EQ, "incorrect sp");
10533
10534
10535 Label thaw_success;
10536 // rscratch2 contains the size of the frames to thaw, 0 if overflow or no more frames
10537 __ cbnz(rscratch2, thaw_success);
10538 __ lea(rscratch1, RuntimeAddress(SharedRuntime::throw_StackOverflowError_entry()));
10539 __ br(rscratch1);
10540 __ bind(thaw_success);
10541
10542 // make room for the thawed frames
10543 __ sub(rscratch1, sp, rscratch2);
10544 __ andr(rscratch1, rscratch1, -16); // align
10545 __ mov(sp, rscratch1);
10546
10547 if (return_barrier) {
10548 // save original return value -- again
10549 save_return_registers(_masm);
10550 }
10551
10552 // If we want, we can templatize thaw by kind, and have three different entries
10553 __ movw(c_rarg1, (uint32_t)kind);
10554
10555 __ call_VM_leaf(Continuation::thaw_entry(), rthread, c_rarg1);
10556 __ mov(rscratch2, r0); // r0 is the sp of the yielding frame
10557
10558 if (return_barrier) {
10559 // restore return value (no safepoint in the call to thaw, so even an oop return value should be OK)
10560 restore_return_registers(_masm);
10561 } else {
10562 __ mov(r0, zr); // return 0 (success) from doYield
10563 }
10564
10565 // we're now on the yield frame (which is in an address above us b/c rsp has been pushed down)
10566 __ sub(sp, rscratch2, 2*wordSize); // now pointing to rfp spill
10567 __ mov(rfp, sp);
10568
10569 if (return_barrier_exception) {
10570 __ ldr(c_rarg1, Address(rfp, wordSize)); // return address
10571 __ authenticate_return_address(c_rarg1);
10572 __ verify_oop(r0);
10573 // save return value containing the exception oop in callee-saved R19
10574 __ mov(r19, r0);
10575
10576 __ call_VM_leaf(CAST_FROM_FN_PTR(address, SharedRuntime::exception_handler_for_return_address), rthread, c_rarg1);
10577
10578 // Reinitialize the ptrue predicate register, in case the external runtime call clobbers ptrue reg, as we may return to SVE compiled code.
10579 // __ reinitialize_ptrue();
10580
11677 // assert(Ra == Pa_base[j], "must be");
11678 // MACC(Ra, Ra, t0, t1, t2);
11679 // }
11680 // iters = (2*len-i)/2;
11681 // assert(iters == len-j, "must be");
11682 // for (; iters--; j++) {
11683 // assert(Rm == Pm_base[j] && Rn == Pn_base[i-j], "must be");
11684 // MACC(Rm, Rn, t0, t1, t2);
11685 // Rm = *++Pm;
11686 // Rn = *--Pn;
11687 // }
11688 // Pm_base[i-len] = t0;
11689 // t0 = t1; t1 = t2; t2 = 0;
11690 // }
11691
11692 // while (t0)
11693 // t0 = sub(Pm_base, Pn_base, t0, len);
11694 // }
11695 };
11696
11697 // Call here from the interpreter or compiled code to either load
11698 // multiple returned values from the inline type instance being
11699 // returned to registers or to store returned values to a newly
11700 // allocated inline type instance.
11701 address generate_return_value_stub(address destination, const char* name, bool has_res) {
11702 // We need to save all registers the calling convention may use so
11703 // the runtime calls read or update those registers. This needs to
11704 // be in sync with SharedRuntime::java_return_convention().
11705 // n.b. aarch64 asserts that frame::arg_reg_save_area_bytes == 0
11706 enum layout {
11707 j_rarg7_off = 0, j_rarg7_2, // j_rarg7 is r0
11708 j_rarg6_off, j_rarg6_2,
11709 j_rarg5_off, j_rarg5_2,
11710 j_rarg4_off, j_rarg4_2,
11711 j_rarg3_off, j_rarg3_2,
11712 j_rarg2_off, j_rarg2_2,
11713 j_rarg1_off, j_rarg1_2,
11714 j_rarg0_off, j_rarg0_2,
11715
11716 j_farg7_off, j_farg7_2,
11717 j_farg6_off, j_farg6_2,
11718 j_farg5_off, j_farg5_2,
11719 j_farg4_off, j_farg4_2,
11720 j_farg3_off, j_farg3_2,
11721 j_farg2_off, j_farg2_2,
11722 j_farg1_off, j_farg1_2,
11723 j_farg0_off, j_farg0_2,
11724
11725 rfp_off, rfp_off2,
11726 return_off, return_off2,
11727
11728 framesize // inclusive of return address
11729 };
11730
11731 CodeBuffer code(name, 512, 64);
11732 MacroAssembler* masm = new MacroAssembler(&code);
11733
11734 int frame_size_in_bytes = align_up(framesize*BytesPerInt, 16);
11735 assert(frame_size_in_bytes == framesize*BytesPerInt, "misaligned");
11736 int frame_size_in_slots = frame_size_in_bytes / BytesPerInt;
11737 int frame_size_in_words = frame_size_in_bytes / wordSize;
11738
11739 OopMapSet* oop_maps = new OopMapSet();
11740 OopMap* map = new OopMap(frame_size_in_slots, 0);
11741
11742 map->set_callee_saved(VMRegImpl::stack2reg(j_rarg7_off), j_rarg7->as_VMReg());
11743 map->set_callee_saved(VMRegImpl::stack2reg(j_rarg6_off), j_rarg6->as_VMReg());
11744 map->set_callee_saved(VMRegImpl::stack2reg(j_rarg5_off), j_rarg5->as_VMReg());
11745 map->set_callee_saved(VMRegImpl::stack2reg(j_rarg4_off), j_rarg4->as_VMReg());
11746 map->set_callee_saved(VMRegImpl::stack2reg(j_rarg3_off), j_rarg3->as_VMReg());
11747 map->set_callee_saved(VMRegImpl::stack2reg(j_rarg2_off), j_rarg2->as_VMReg());
11748 map->set_callee_saved(VMRegImpl::stack2reg(j_rarg1_off), j_rarg1->as_VMReg());
11749 map->set_callee_saved(VMRegImpl::stack2reg(j_rarg0_off), j_rarg0->as_VMReg());
11750
11751 map->set_callee_saved(VMRegImpl::stack2reg(j_farg0_off), j_farg0->as_VMReg());
11752 map->set_callee_saved(VMRegImpl::stack2reg(j_farg1_off), j_farg1->as_VMReg());
11753 map->set_callee_saved(VMRegImpl::stack2reg(j_farg2_off), j_farg2->as_VMReg());
11754 map->set_callee_saved(VMRegImpl::stack2reg(j_farg3_off), j_farg3->as_VMReg());
11755 map->set_callee_saved(VMRegImpl::stack2reg(j_farg4_off), j_farg4->as_VMReg());
11756 map->set_callee_saved(VMRegImpl::stack2reg(j_farg5_off), j_farg5->as_VMReg());
11757 map->set_callee_saved(VMRegImpl::stack2reg(j_farg6_off), j_farg6->as_VMReg());
11758 map->set_callee_saved(VMRegImpl::stack2reg(j_farg7_off), j_farg7->as_VMReg());
11759
11760 address start = __ pc();
11761
11762 __ enter(); // Save FP and LR before call
11763
11764 __ stpd(j_farg1, j_farg0, Address(__ pre(sp, -2 * wordSize)));
11765 __ stpd(j_farg3, j_farg2, Address(__ pre(sp, -2 * wordSize)));
11766 __ stpd(j_farg5, j_farg4, Address(__ pre(sp, -2 * wordSize)));
11767 __ stpd(j_farg7, j_farg6, Address(__ pre(sp, -2 * wordSize)));
11768
11769 __ stp(j_rarg1, j_rarg0, Address(__ pre(sp, -2 * wordSize)));
11770 __ stp(j_rarg3, j_rarg2, Address(__ pre(sp, -2 * wordSize)));
11771 __ stp(j_rarg5, j_rarg4, Address(__ pre(sp, -2 * wordSize)));
11772 __ stp(j_rarg7, j_rarg6, Address(__ pre(sp, -2 * wordSize)));
11773
11774 int frame_complete = __ offset();
11775
11776 // Set up last_Java_sp and last_Java_fp
11777 address the_pc = __ pc();
11778 __ set_last_Java_frame(sp, noreg, the_pc, rscratch1);
11779
11780 // Call runtime
11781 __ mov(c_rarg1, r0);
11782 __ mov(c_rarg0, rthread);
11783
11784 __ mov(rscratch1, destination);
11785 __ blr(rscratch1);
11786
11787 oop_maps->add_gc_map(the_pc - start, map);
11788
11789 __ reset_last_Java_frame(false);
11790
11791 __ ldp(j_rarg7, j_rarg6, Address(__ post(sp, 2 * wordSize)));
11792 __ ldp(j_rarg5, j_rarg4, Address(__ post(sp, 2 * wordSize)));
11793 __ ldp(j_rarg3, j_rarg2, Address(__ post(sp, 2 * wordSize)));
11794 __ ldp(j_rarg1, j_rarg0, Address(__ post(sp, 2 * wordSize)));
11795
11796 __ ldpd(j_farg7, j_farg6, Address(__ post(sp, 2 * wordSize)));
11797 __ ldpd(j_farg5, j_farg4, Address(__ post(sp, 2 * wordSize)));
11798 __ ldpd(j_farg3, j_farg2, Address(__ post(sp, 2 * wordSize)));
11799 __ ldpd(j_farg1, j_farg0, Address(__ post(sp, 2 * wordSize)));
11800
11801 __ leave();
11802
11803 // check for pending exceptions
11804 Label pending;
11805 __ ldr(rscratch1, Address(rthread, in_bytes(Thread::pending_exception_offset())));
11806 __ cbnz(rscratch1, pending);
11807
11808 if (has_res) {
11809 __ get_vm_result_oop(r0, rthread);
11810 }
11811
11812 __ ret(lr);
11813
11814 __ bind(pending);
11815 __ far_jump(RuntimeAddress(StubRoutines::forward_exception_entry()));
11816
11817 // -------------
11818 // make sure all code is generated
11819 masm->flush();
11820
11821 RuntimeStub* stub = RuntimeStub::new_runtime_stub(name, &code, frame_complete, frame_size_in_words, oop_maps, false);
11822 return stub->entry_point();
11823 }
11824
11825 // Initialization
11826 void generate_preuniverse_stubs() {
11827 // preuniverse stubs are not needed for aarch64
11828 }
11829
11830 void generate_initial_stubs() {
11831 // Generate initial stubs and initializes the entry points
11832
11833 // entry points that exist in all platforms Note: This is code
11834 // that could be shared among different platforms - however the
11835 // benefit seems to be smaller than the disadvantage of having a
11836 // much more complicated generator structure. See also comment in
11837 // stubRoutines.hpp.
11838
11839 StubRoutines::_forward_exception_entry = generate_forward_exception();
11840
11841 StubRoutines::_call_stub_entry =
11842 generate_call_stub(StubRoutines::_call_stub_return_address);
11843
11844 // is referenced by megamorphic call
11855 StubRoutines::_updateBytesCRC32 = generate_updateBytesCRC32();
11856 }
11857
11858 if (UseCRC32CIntrinsics) {
11859 StubRoutines::_updateBytesCRC32C = generate_updateBytesCRC32C();
11860 }
11861
11862 if (vmIntrinsics::is_intrinsic_available(vmIntrinsics::_dsin)) {
11863 StubRoutines::_dsin = generate_dsin_dcos(/* isCos = */ false);
11864 }
11865
11866 if (vmIntrinsics::is_intrinsic_available(vmIntrinsics::_dcos)) {
11867 StubRoutines::_dcos = generate_dsin_dcos(/* isCos = */ true);
11868 }
11869
11870 if (vmIntrinsics::is_intrinsic_available(vmIntrinsics::_float16ToFloat) &&
11871 vmIntrinsics::is_intrinsic_available(vmIntrinsics::_floatToFloat16)) {
11872 StubRoutines::_hf2f = generate_float16ToFloat();
11873 StubRoutines::_f2hf = generate_floatToFloat16();
11874 }
11875
11876 if (InlineTypeReturnedAsFields) {
11877 StubRoutines::_load_inline_type_fields_in_regs =
11878 generate_return_value_stub(CAST_FROM_FN_PTR(address, SharedRuntime::load_inline_type_fields_in_regs), "load_inline_type_fields_in_regs", false);
11879 StubRoutines::_store_inline_type_fields_to_buf =
11880 generate_return_value_stub(CAST_FROM_FN_PTR(address, SharedRuntime::store_inline_type_fields_to_buf), "store_inline_type_fields_to_buf", true);
11881 }
11882
11883 }
11884
11885 void generate_continuation_stubs() {
11886 // Continuation stubs:
11887 StubRoutines::_cont_thaw = generate_cont_thaw();
11888 StubRoutines::_cont_returnBarrier = generate_cont_returnBarrier();
11889 StubRoutines::_cont_returnBarrierExc = generate_cont_returnBarrier_exception();
11890 StubRoutines::_cont_preempt_stub = generate_cont_preempt_stub();
11891 }
11892
11893 void generate_final_stubs() {
11894 // support for verify_oop (must happen after universe_init)
11895 if (VerifyOops) {
11896 StubRoutines::_verify_oop_subroutine_entry = generate_verify_oop();
11897 }
11898
11899 // arraycopy stubs used by compilers
11900 generate_arraycopy_stubs();
11901
11902 StubRoutines::_method_entry_barrier = generate_method_entry_barrier();
|