/*
 * Copyright (c) 1999, 2020, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 *
 */

#include "precompiled.hpp"
#include "c1/c1_CodeStubs.hpp"
#include "c1/c1_FrameMap.hpp"
#include "c1/c1_LIRAssembler.hpp"
#include "c1/c1_MacroAssembler.hpp"
#include "c1/c1_Runtime1.hpp"
#include "classfile/javaClasses.hpp"
#include "nativeInst_x86.hpp"
#include "runtime/sharedRuntime.hpp"
#include "utilities/align.hpp"
#include "utilities/macros.hpp"
#include "vmreg_x86.inline.hpp"


#define __ ce->masm()->

#ifndef _LP64
float ConversionStub::float_zero = 0.0;
double ConversionStub::double_zero = 0.0;

void ConversionStub::emit_code(LIR_Assembler* ce) {
  __ bind(_entry);
  assert(bytecode() == Bytecodes::_f2i || bytecode() == Bytecodes::_d2i, "other conversions do not require stub");


  if (input()->is_single_xmm()) {
    __ comiss(input()->as_xmm_float_reg(),
              ExternalAddress((address)&float_zero));
  } else if (input()->is_double_xmm()) {
    __ comisd(input()->as_xmm_double_reg(),
              ExternalAddress((address)&double_zero));
  } else {
    __ push(rax);
    __ ftst();
    __ fnstsw_ax();
    __ sahf();
    __ pop(rax);
  }

  Label NaN, do_return;
  __ jccb(Assembler::parity, NaN);
  __ jccb(Assembler::below, do_return);

  // input is > 0 -> return maxInt
  // result register already contains 0x80000000, so subtracting 1 gives 0x7fffffff
  __ decrement(result()->as_register());
  __ jmpb(do_return);

  // input is NaN -> return 0
  __ bind(NaN);
  __ xorptr(result()->as_register(), result()->as_register());

  __ bind(do_return);
  __ jmp(_continuation);
}
#endif // !_LP64

void C1SafepointPollStub::emit_code(LIR_Assembler* ce) {
  __ bind(_entry);
  InternalAddress safepoint_pc(ce->masm()->pc() - ce->masm()->offset() + safepoint_offset());
#ifdef _LP64
  __ lea(rscratch1, safepoint_pc);
  __ movptr(Address(r15_thread, JavaThread::saved_exception_pc_offset()), rscratch1);
#else
  const Register tmp1 = rcx;
  const Register tmp2 = rdx;
  __ push(tmp1);
  __ push(tmp2);

  __ lea(tmp1, safepoint_pc);
  __ get_thread(tmp2);
  __ movptr(Address(tmp2, JavaThread::saved_exception_pc_offset()), tmp1);

  __ pop(tmp2);
  __ pop(tmp1);
#endif /* _LP64 */
  assert(SharedRuntime::polling_page_return_handler_blob() != NULL,
         "polling page return stub not created yet");

  address stub = SharedRuntime::polling_page_return_handler_blob()->entry_point();
  __ jump(RuntimeAddress(stub));
}
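
// A reading note on C1SafepointPollStub above (a sketch of the mechanism, not
// authoritative): masm->pc() - masm->offset() is the start of the current code
// buffer, so safepoint_pc resolves to code_begin + safepoint_offset(), i.e.,
// the address of the poll instruction itself. That address is stashed in
// JavaThread::saved_exception_pc so the shared polling-page return handler
// blob can identify the poll site it is handling.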

void CounterOverflowStub::emit_code(LIR_Assembler* ce) {
  __ bind(_entry);
  Metadata *m = _method->as_constant_ptr()->as_metadata();
  ce->store_parameter(m, 1);
  ce->store_parameter(_bci, 0);
  __ call(RuntimeAddress(Runtime1::entry_for(Runtime1::counter_overflow_id)));
  ce->add_call_info_here(_info);
  ce->verify_oop_map(_info);
  __ jmp(_continuation);
}

RangeCheckStub::RangeCheckStub(CodeEmitInfo* info, LIR_Opr index, LIR_Opr array)
  : _index(index), _array(array), _throw_index_out_of_bounds_exception(false) {
  assert(info != NULL, "must have info");
  _info = new CodeEmitInfo(info);
}

RangeCheckStub::RangeCheckStub(CodeEmitInfo* info, LIR_Opr index)
  : _index(index), _array(NULL), _throw_index_out_of_bounds_exception(true) {
  assert(info != NULL, "must have info");
  _info = new CodeEmitInfo(info);
}

void RangeCheckStub::emit_code(LIR_Assembler* ce) {
  __ bind(_entry);
  if (_info->deoptimize_on_exception()) {
    address a = Runtime1::entry_for(Runtime1::predicate_failed_trap_id);
    __ call(RuntimeAddress(a));
    ce->add_call_info_here(_info);
    ce->verify_oop_map(_info);
    debug_only(__ should_not_reach_here());
    return;
  }

  // pass the array index on stack because all registers must be preserved
  if (_index->is_cpu_register()) {
    ce->store_parameter(_index->as_register(), 0);
  } else {
    ce->store_parameter(_index->as_jint(), 0);
  }
  Runtime1::StubID stub_id;
  if (_throw_index_out_of_bounds_exception) {
    stub_id = Runtime1::throw_index_exception_id;
  } else {
    stub_id = Runtime1::throw_range_check_failed_id;
    ce->store_parameter(_array->as_pointer_register(), 1);
  }
  __ call(RuntimeAddress(Runtime1::entry_for(stub_id)));
  ce->add_call_info_here(_info);
  ce->verify_oop_map(_info);
  debug_only(__ should_not_reach_here());
}

PredicateFailedStub::PredicateFailedStub(CodeEmitInfo* info) {
  _info = new CodeEmitInfo(info);
}

void PredicateFailedStub::emit_code(LIR_Assembler* ce) {
  __ bind(_entry);
  address a = Runtime1::entry_for(Runtime1::predicate_failed_trap_id);
  __ call(RuntimeAddress(a));
  ce->add_call_info_here(_info);
  ce->verify_oop_map(_info);
  debug_only(__ should_not_reach_here());
}

void DivByZeroStub::emit_code(LIR_Assembler* ce) {
  if (_offset != -1) {
    ce->compilation()->implicit_exception_table()->append(_offset, __ offset());
  }
  __ bind(_entry);
  __ call(RuntimeAddress(Runtime1::entry_for(Runtime1::throw_div0_exception_id)));
  ce->add_call_info_here(_info);
  debug_only(__ should_not_reach_here());
}


// Implementation of NewInstanceStub

NewInstanceStub::NewInstanceStub(LIR_Opr klass_reg, LIR_Opr result, ciInstanceKlass* klass, CodeEmitInfo* info, Runtime1::StubID stub_id) {
  _result = result;
  _klass = klass;
  _klass_reg = klass_reg;
  _info = new CodeEmitInfo(info);
  assert(stub_id == Runtime1::new_instance_id                 ||
         stub_id == Runtime1::fast_new_instance_id            ||
         stub_id == Runtime1::fast_new_instance_init_check_id,
         "need new_instance id");
  _stub_id = stub_id;
}


void NewInstanceStub::emit_code(LIR_Assembler* ce) {
  assert(__ rsp_offset() == 0, "frame size should be fixed");
  __ bind(_entry);
  __ movptr(rdx, _klass_reg->as_register());
  __ call(RuntimeAddress(Runtime1::entry_for(_stub_id)));
  ce->add_call_info_here(_info);
  ce->verify_oop_map(_info);
  assert(_result->as_register() == rax, "result must be in rax");
  __ jmp(_continuation);
}
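
// Register contract shared by the allocation stubs in this file (inferred
// from the asserts in these stubs, not a definitive spec): the klass is
// expected in rdx, an array length in rbx, and the Runtime1 entry returns
// the newly allocated object in rax before the stub jumps back to
// _continuation.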

// Implementation of NewTypeArrayStub

NewTypeArrayStub::NewTypeArrayStub(LIR_Opr klass_reg, LIR_Opr length, LIR_Opr result, CodeEmitInfo* info) {
  _klass_reg = klass_reg;
  _length = length;
  _result = result;
  _info = new CodeEmitInfo(info);
}


void NewTypeArrayStub::emit_code(LIR_Assembler* ce) {
  assert(__ rsp_offset() == 0, "frame size should be fixed");
  __ bind(_entry);
  assert(_length->as_register() == rbx, "length must be in rbx");
  assert(_klass_reg->as_register() == rdx, "klass_reg must be in rdx");
  __ call(RuntimeAddress(Runtime1::entry_for(Runtime1::new_type_array_id)));
  ce->add_call_info_here(_info);
  ce->verify_oop_map(_info);
  assert(_result->as_register() == rax, "result must be in rax");
  __ jmp(_continuation);
}


// Implementation of NewObjectArrayStub

NewObjectArrayStub::NewObjectArrayStub(LIR_Opr klass_reg, LIR_Opr length, LIR_Opr result, CodeEmitInfo* info) {
  _klass_reg = klass_reg;
  _result = result;
  _length = length;
  _info = new CodeEmitInfo(info);
}


void NewObjectArrayStub::emit_code(LIR_Assembler* ce) {
  assert(__ rsp_offset() == 0, "frame size should be fixed");
  __ bind(_entry);
  assert(_length->as_register() == rbx, "length must be in rbx");
  assert(_klass_reg->as_register() == rdx, "klass_reg must be in rdx");
  __ call(RuntimeAddress(Runtime1::entry_for(Runtime1::new_object_array_id)));
  ce->add_call_info_here(_info);
  ce->verify_oop_map(_info);
  assert(_result->as_register() == rax, "result must be in rax");
  __ jmp(_continuation);
}


// Implementation of MonitorAccessStubs

MonitorEnterStub::MonitorEnterStub(LIR_Opr obj_reg, LIR_Opr lock_reg, CodeEmitInfo* info)
: MonitorAccessStub(obj_reg, lock_reg)
{
  _info = new CodeEmitInfo(info);
}


void MonitorEnterStub::emit_code(LIR_Assembler* ce) {
  assert(__ rsp_offset() == 0, "frame size should be fixed");
  __ bind(_entry);
  ce->store_parameter(_obj_reg->as_register(),  1);
  ce->store_parameter(_lock_reg->as_register(), 0);
  Runtime1::StubID enter_id;
  if (ce->compilation()->has_fpu_code()) {
    enter_id = Runtime1::monitorenter_id;
  } else {
    enter_id = Runtime1::monitorenter_nofpu_id;
  }
  __ call(RuntimeAddress(Runtime1::entry_for(enter_id)));
  ce->add_call_info_here(_info);
  ce->verify_oop_map(_info);
  __ jmp(_continuation);
}


void MonitorExitStub::emit_code(LIR_Assembler* ce) {
  __ bind(_entry);
  if (_compute_lock) {
    // lock_reg was destroyed by fast unlocking attempt => recompute it
    ce->monitor_address(_monitor_ix, _lock_reg);
  }
  ce->store_parameter(_lock_reg->as_register(), 0);
  // note: non-blocking leaf routine => no call info needed
  Runtime1::StubID exit_id;
  if (ce->compilation()->has_fpu_code()) {
    exit_id = Runtime1::monitorexit_id;
  } else {
    exit_id = Runtime1::monitorexit_nofpu_id;
  }
  __ call(RuntimeAddress(Runtime1::entry_for(exit_id)));
  __ jmp(_continuation);
}


// Implementation of patching:
// - Copy the code at the given offset to an inlined buffer (first the bytes, then the number of bytes)
// - Replace the original code with a call to the stub
// At Runtime:
// - call to stub, jump to runtime
// - in runtime: preserve all registers (especially objects, i.e., source and destination object)
// - in runtime: after initializing class, restore original code, reexecute instruction
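//
// The patch record that PatchingStub::emit_code emits below is disguised as a
// 5-byte "movl reg, imm32" so disassembly stays readable. A sketch of its
// byte layout, read off the emit_int8 calls below:
//   byte 0: 0xB8 (movl opcode)
//   byte 1: 0    (unused)
//   byte 2: being_initialized_entry_offset -- distance back to the patch template
//   byte 3: bytes_to_skip                  -- stub bytes to skip when resuming
//   byte 4: _bytes_to_copy                 -- length of the copied original code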

int PatchingStub::_patch_info_offset = -NativeGeneralJump::instruction_size;

void PatchingStub::align_patch_site(MacroAssembler* masm) {
  // We're patching a 5-7 byte instruction on Intel and we need to
  // make sure that we don't see a piece of the instruction. It
  // appears mostly impossible on Intel to simply invalidate other
  // processors' caches, and since they may do aggressive prefetching it's
  // very hard to make a guess about what code might be in the icache.
  // Force the instruction to be double-word aligned so that it
  // doesn't span a cache line.
  masm->align(align_up((int)NativeGeneralJump::instruction_size, wordSize));
}

void PatchingStub::emit_code(LIR_Assembler* ce) {
  assert(NativeCall::instruction_size <= _bytes_to_copy && _bytes_to_copy <= 0xFF, "not enough room for call");

  Label call_patch;

  // static field accesses have special semantics while the class
  // initializer is being run, so we emit a test which can be used to
  // check that this code is being executed by the initializing
  // thread.
  address being_initialized_entry = __ pc();
  if (CommentedAssembly) {
    __ block_comment(" patch template");
  }
  if (_id == load_klass_id) {
    // produce a copy of the load klass instruction for use by the being initialized case
#ifdef ASSERT
    address start = __ pc();
#endif
    Metadata* o = NULL;
    __ mov_metadata(_obj, o);
#ifdef ASSERT
    for (int i = 0; i < _bytes_to_copy; i++) {
      address ptr = (address)(_pc_start + i);
      int a_byte = (*ptr) & 0xFF;
      assert(a_byte == *start++, "should be the same code");
    }
#endif
  } else if (_id == load_mirror_id) {
    // produce a copy of the load mirror instruction for use by the being
    // initialized case
#ifdef ASSERT
    address start = __ pc();
#endif
    jobject o = NULL;
    __ movoop(_obj, o);
#ifdef ASSERT
    for (int i = 0; i < _bytes_to_copy; i++) {
      address ptr = (address)(_pc_start + i);
      int a_byte = (*ptr) & 0xFF;
      assert(a_byte == *start++, "should be the same code");
    }
#endif
  } else {
    // make a copy of the code which is going to be patched.
    for (int i = 0; i < _bytes_to_copy; i++) {
      address ptr = (address)(_pc_start + i);
      int a_byte = (*ptr) & 0xFF;
      __ emit_int8(a_byte);
      *ptr = 0x90; // make the site look like a nop
    }
  }

  address end_of_patch = __ pc();
  int bytes_to_skip = 0;
  if (_id == load_mirror_id) {
    int offset = __ offset();
    if (CommentedAssembly) {
      __ block_comment(" being_initialized check");
    }
    assert(_obj != noreg, "must be a valid register");
    Register tmp = rax;
    Register tmp2 = rbx;
    __ push(tmp);
    __ push(tmp2);
    // Load without verification to keep code size small. We need it because
    // being_initialized_entry_offset has to fit in a byte. Also, we know it's not null.
    __ movptr(tmp2, Address(_obj, java_lang_Class::klass_offset()));
    __ get_thread(tmp);
    __ cmpptr(tmp, Address(tmp2, InstanceKlass::init_thread_offset()));
    __ pop(tmp2);
    __ pop(tmp);
    __ jcc(Assembler::notEqual, call_patch);

    // access_field patches may execute the patched code before it's
    // copied back into place so we need to jump back into the main
    // code of the nmethod to continue execution.
    __ jmp(_patch_site_continuation);

    // make sure this extra code gets skipped
    bytes_to_skip += __ offset() - offset;
  }
  if (CommentedAssembly) {
    __ block_comment("patch data encoded as movl");
  }
  // Now emit the patch record telling the runtime how to find the
  // pieces of the patch.  We only need 3 bytes but for readability of
  // the disassembly we make the data look like a movl reg, imm32,
  // which requires 5 bytes
  int sizeof_patch_record = 5;
  bytes_to_skip += sizeof_patch_record;

  // emit the offsets needed to find the code to patch
  int being_initialized_entry_offset = __ pc() - being_initialized_entry + sizeof_patch_record;

  __ emit_int8((unsigned char)0xB8);
  __ emit_int8(0);
  __ emit_int8(being_initialized_entry_offset);
  __ emit_int8(bytes_to_skip);
  __ emit_int8(_bytes_to_copy);
  address patch_info_pc = __ pc();
  assert(patch_info_pc - end_of_patch == bytes_to_skip, "incorrect patch info");

  address entry = __ pc();
  NativeGeneralJump::insert_unconditional((address)_pc_start, entry);
  address target = NULL;
  relocInfo::relocType reloc_type = relocInfo::none;
  switch (_id) {
    case access_field_id:  target = Runtime1::entry_for(Runtime1::access_field_patching_id); break;
    case load_klass_id:    target = Runtime1::entry_for(Runtime1::load_klass_patching_id); reloc_type = relocInfo::metadata_type; break;
    case load_mirror_id:   target = Runtime1::entry_for(Runtime1::load_mirror_patching_id); reloc_type = relocInfo::oop_type; break;
    case load_appendix_id: target = Runtime1::entry_for(Runtime1::load_appendix_patching_id); reloc_type = relocInfo::oop_type; break;
    default: ShouldNotReachHere();
  }
  __ bind(call_patch);

  if (CommentedAssembly) {
    __ block_comment("patch entry point");
  }
  __ call(RuntimeAddress(target));
  assert(_patch_info_offset == (patch_info_pc - __ pc()), "must not change");
  ce->add_call_info_here(_info);
  int jmp_off = __ offset();
  __ jmp(_patch_site_entry);
  // Add enough nops so deoptimization can overwrite the jmp above with a call
  // and not destroy the world. We cannot use fat nops here, since the concurrent
  // code rewrite may transiently create the illegal instruction sequence.
  for (int j = __ offset() ; j < jmp_off + 5 ; j++ ) {
    __ nop();
  }
  if (_id == load_klass_id || _id == load_mirror_id || _id == load_appendix_id) {
    CodeSection* cs = __ code_section();
    RelocIterator iter(cs, (address)_pc_start, (address)(_pc_start + 1));
    relocInfo::change_reloc_info_for_address(&iter, (address) _pc_start, reloc_type, relocInfo::none);
  }
}


void DeoptimizeStub::emit_code(LIR_Assembler* ce) {
  __ bind(_entry);
  ce->store_parameter(_trap_request, 0);
  __ call(RuntimeAddress(Runtime1::entry_for(Runtime1::deoptimize_id)));
  ce->add_call_info_here(_info);
  DEBUG_ONLY(__ should_not_reach_here());
}


void ImplicitNullCheckStub::emit_code(LIR_Assembler* ce) {
  address a;
  if (_info->deoptimize_on_exception()) {
    // Deoptimize, do not throw the exception, because it is probably wrong to do it here.
    a = Runtime1::entry_for(Runtime1::predicate_failed_trap_id);
  } else {
    a = Runtime1::entry_for(Runtime1::throw_null_pointer_exception_id);
  }

  ce->compilation()->implicit_exception_table()->append(_offset, __ offset());
  __ bind(_entry);
  __ call(RuntimeAddress(a));
  ce->add_call_info_here(_info);
  ce->verify_oop_map(_info);
  debug_only(__ should_not_reach_here());
}


void SimpleExceptionStub::emit_code(LIR_Assembler* ce) {
  assert(__ rsp_offset() == 0, "frame size should be fixed");

  __ bind(_entry);
  // pass the object on stack because all registers must be preserved
  if (_obj->is_cpu_register()) {
    ce->store_parameter(_obj->as_register(), 0);
  }
  __ call(RuntimeAddress(Runtime1::entry_for(_stub)));
  ce->add_call_info_here(_info);
  debug_only(__ should_not_reach_here());
}


void ArrayCopyStub::emit_code(LIR_Assembler* ce) {
  //---------------slow case: call to native-----------------
  __ bind(_entry);
  // Figure out where the args should go
  // This should really convert the IntrinsicID to the Method* and signature
  // but I don't know how to do that.
  //
  VMRegPair args[5];
  BasicType signature[5] = { T_OBJECT, T_INT, T_OBJECT, T_INT, T_INT };
  SharedRuntime::java_calling_convention(signature, args, 5);

  // push parameters
  // (src, src_pos, dst, dst_pos, length)
  Register r[5];
  r[0] = src()->as_register();
  r[1] = src_pos()->as_register();
  r[2] = dst()->as_register();
  r[3] = dst_pos()->as_register();
  r[4] = length()->as_register();

  // any argument assigned to a stack slot gets stored now
  for (int i = 0; i < 5 ; i++ ) {
    VMReg r_1 = args[i].first();
    if (r_1->is_stack()) {
      int st_off = r_1->reg2stack() * wordSize;
      __ movptr (Address(rsp, st_off), r[i]);
    } else {
      assert(r[i] == args[i].first()->as_Register(), "Wrong register for arg");
    }
  }

  ce->align_call(lir_static_call);

  ce->emit_static_call_stub();
  if (ce->compilation()->bailed_out()) {
    return; // CodeCache is full
  }
  AddressLiteral resolve(SharedRuntime::get_resolve_static_call_stub(),
                         relocInfo::static_call_type);
  __ call(resolve);
  ce->add_call_info_here(info());

#ifndef PRODUCT
  __ incrementl(ExternalAddress((address)&Runtime1::_arraycopy_slowcase_cnt));
#endif

  __ jmp(_continuation);
}

#undef __