< prev index next >

src/hotspot/cpu/x86/interp_masm_x86.cpp

Print this page

   1 /*
   2  * Copyright (c) 1997, 2024, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  *
  23  */
  24 
  25 #include "precompiled.hpp"
  26 #include "compiler/compiler_globals.hpp"
  27 #include "interp_masm_x86.hpp"
  28 #include "interpreter/interpreter.hpp"
  29 #include "interpreter/interpreterRuntime.hpp"
  30 #include "logging/log.hpp"
  31 #include "oops/arrayOop.hpp"

  32 #include "oops/markWord.hpp"
  33 #include "oops/methodData.hpp"
  34 #include "oops/method.hpp"

  35 #include "oops/resolvedFieldEntry.hpp"
  36 #include "oops/resolvedIndyEntry.hpp"
  37 #include "oops/resolvedMethodEntry.hpp"
  38 #include "prims/jvmtiExport.hpp"
  39 #include "prims/jvmtiThreadState.hpp"
  40 #include "runtime/basicLock.hpp"
  41 #include "runtime/frame.inline.hpp"
  42 #include "runtime/javaThread.hpp"
  43 #include "runtime/safepointMechanism.hpp"
  44 #include "runtime/sharedRuntime.hpp"
  45 #include "utilities/powerOfTwo.hpp"
  46 
  47 // Implementation of InterpreterMacroAssembler
  48 
  49 void InterpreterMacroAssembler::jump_to_entry(address entry) {
       // Jumps to `entry` by calling jump() on a RuntimeAddress that wraps it.
       // `entry` must be non-null; the assert below checks this before the
       // jump is generated.
  50   assert(entry, "Entry must have been generated by now");
  51   jump(RuntimeAddress(entry));
  52 }
  53 
  54 void InterpreterMacroAssembler::profile_obj_type(Register obj, const Address& mdo_addr) {

 156         Address mdo_arg_addr(mdp, in_bytes(TypeEntriesAtCall::argument_type_offset(i))-off_to_args);
 157         profile_obj_type(tmp, mdo_arg_addr);
 158 
 159         int to_add = in_bytes(TypeStackSlotEntries::per_arg_size());
 160         addptr(mdp, to_add);
 161         off_to_args += to_add;
 162       }
 163 
 164       if (MethodData::profile_return()) {
 165         movptr(tmp, Address(mdp, in_bytes(TypeEntriesAtCall::cell_count_offset())-off_to_args));
 166         subl(tmp, TypeProfileArgsLimit*TypeStackSlotEntries::per_arg_count());
 167       }
 168 
 169       bind(done);
 170 
 171       if (MethodData::profile_return()) {
 172         // We're right after the type profile for the last
 173         // argument. tmp is the number of cells left in the
 174         // CallTypeData/VirtualCallTypeData to reach its end. Non null
 175         // if there's a return to profile.
 176         assert(ReturnTypeEntry::static_cell_count() < TypeStackSlotEntries::per_arg_count(), "can't move past ret type");
 177         shll(tmp, log2i_exact((int)DataLayout::cell_size));
 178         addptr(mdp, tmp);
 179       }
 180       movptr(Address(rbp, frame::interpreter_frame_mdp_offset * wordSize), mdp);
 181     } else {
 182       assert(MethodData::profile_return(), "either profile call args or call ret");
 183       update_mdp_by_constant(mdp, in_bytes(TypeEntriesAtCall::return_only_size()));
 184     }
 185 
 186     // mdp points right after the end of the
 187     // CallTypeData/VirtualCallTypeData, right after the cells for the
 188     // return value type if there's one
 189 
 190     bind(profile_continue);
 191   }
 192 }
 193 
 194 void InterpreterMacroAssembler::profile_return_type(Register mdp, Register ret, Register tmp) {
 195   assert_different_registers(mdp, ret, tmp, _bcp_register);
 196   if (ProfileInterpreter && MethodData::profile_return()) {

 201     if (MethodData::profile_return_jsr292_only()) {
 202       assert(Method::intrinsic_id_size_in_bytes() == 2, "assuming Method::_intrinsic_id is u2");
 203 
 204       // If we don't profile all invoke bytecodes we must make sure
 205       // it's a bytecode we indeed profile. We can't go back to the
 206       // beginning of the ProfileData we intend to update to check its
 207       // type because we're right after it and we don't know its
 208       // length
 209       Label do_profile;
 210       cmpb(Address(_bcp_register, 0), Bytecodes::_invokedynamic);
 211       jcc(Assembler::equal, do_profile);
 212       cmpb(Address(_bcp_register, 0), Bytecodes::_invokehandle);
 213       jcc(Assembler::equal, do_profile);
 214       get_method(tmp);
 215       cmpw(Address(tmp, Method::intrinsic_id_offset()), static_cast<int>(vmIntrinsics::_compiledLambdaForm));
 216       jcc(Assembler::notEqual, profile_continue);
 217 
 218       bind(do_profile);
 219     }
 220 
 221     Address mdo_ret_addr(mdp, -in_bytes(ReturnTypeEntry::size()));
 222     mov(tmp, ret);
 223     profile_obj_type(tmp, mdo_ret_addr);
 224 
 225     bind(profile_continue);
 226   }
 227 }
 228 
 229 void InterpreterMacroAssembler::profile_parameters_type(Register mdp, Register tmp1, Register tmp2) {
 230   if (ProfileInterpreter && MethodData::profile_parameters()) {
 231     Label profile_continue;
 232 
 233     test_method_data_pointer(mdp, profile_continue);
 234 
 235     // Load the offset of the area within the MDO used for
 236     // parameters. If it's negative we're not profiling any parameters
 237     movl(tmp1, Address(mdp, in_bytes(MethodData::parameters_type_data_di_offset()) - in_bytes(MethodData::data_offset())));
 238     testl(tmp1, tmp1);
 239     jcc(Assembler::negative, profile_continue);
 240 
 241     // Compute a pointer to the area for parameters from the offset

 491                                                              Register cpool,
 492                                                              Register index) {
 493   assert_different_registers(cpool, index);
 494 
 495   movw(index, Address(cpool, index, Address::times_ptr, sizeof(ConstantPool)));
 496   Register resolved_klasses = cpool;
 497   movptr(resolved_klasses, Address(cpool, ConstantPool::resolved_klasses_offset()));
 498   movptr(klass, Address(resolved_klasses, index, Address::times_ptr, Array<Klass*>::base_offset_in_bytes()));
 499 }
 500 
 501 // Generate a subtype check: branch to ok_is_subtype if sub_klass is a
 502 // subtype of super_klass.
 503 //
 504 // Args:
 505 //      rax: superklass
 506 //      Rsub_klass: subklass
     //      ok_is_subtype: label passed on to check_klass_subtype as the
     //                     target for a successful check
 507 //
 508 // Kills:
 509 //      rcx, rdi
     //
     // Rsub_klass must not alias rax, rcx or rdi (nor r13/r14 on 64-bit);
     // the asserts at the top of the body enforce this because each of those
     // registers already has a role here.
 510 void InterpreterMacroAssembler::gen_subtype_check(Register Rsub_klass,
 511                                                   Label& ok_is_subtype) {

 512   assert(Rsub_klass != rax, "rax holds superklass");
 513   LP64_ONLY(assert(Rsub_klass != r14, "r14 holds locals");)
 514   LP64_ONLY(assert(Rsub_klass != r13, "r13 holds bcp");)
 515   assert(Rsub_klass != rcx, "rcx holds 2ndary super array length");
 516   assert(Rsub_klass != rdi, "rdi holds 2ndary super array scan ptr");
 517 
 518   // Profile the not-null value's klass.
       // profile_typecheck receives rcx as its mdp register, Rsub_klass as the
       // klass to record and rdi as its scratch register (reg2).
 519   profile_typecheck(rcx, Rsub_klass, rdi); // blows rcx, reloads rdi


 520 
 521   // Do the check.
       // Sub klass first, super klass (rax) second, rcx as temporary.
 522   check_klass_subtype(Rsub_klass, rax, rcx, ok_is_subtype); // blows rcx
 523 }
 524 
 525 
 526 #ifndef _LP64
 527 void InterpreterMacroAssembler::f2ieee() {
       // Only built when _LP64 is not defined (see the enclosing #ifndef).
       // When IEEEPrecision is set, emits fstp_s followed by fld_s on
       // Address(rsp, 0): the value is stored in single-precision form at the
       // stack-top slot and immediately loaded back (presumably to round an
       // x87 value to float precision -- TODO confirm). Emits nothing when
       // IEEEPrecision is off.
       // NOTE(review): the store overwrites the word at Address(rsp, 0);
       // callers presumably guarantee that slot is free -- confirm.
 528   if (IEEEPrecision) {
 529     fstp_s(Address(rsp, 0));
 530     fld_s(Address(rsp, 0));
 531   }
 532 }
 533 
 534 
 535 void InterpreterMacroAssembler::d2ieee() {
 536   if (IEEEPrecision) {
 537     fstp_d(Address(rsp, 0));
 538     fld_d(Address(rsp, 0));
 539   }

 951   // the stack, will call InterpreterRuntime::at_unwind.
 952   Label slow_path;
 953   Label fast_path;
 954   safepoint_poll(slow_path, rthread, true /* at_return */, false /* in_nmethod */);
 955   jmp(fast_path);
 956   bind(slow_path);
 957   push(state);
 958   set_last_Java_frame(rthread, noreg, rbp, (address)pc(), rscratch1);
 959   super_call_VM_leaf(CAST_FROM_FN_PTR(address, InterpreterRuntime::at_unwind), rthread);
 960   NOT_LP64(get_thread(rthread);) // call_VM clobbered it, restore
 961   reset_last_Java_frame(rthread, true);
 962   pop(state);
 963   bind(fast_path);
 964 
 965   // get the value of _do_not_unlock_if_synchronized into rbx
 966   const Address do_not_unlock_if_synchronized(rthread,
 967     in_bytes(JavaThread::do_not_unlock_if_synchronized_offset()));
 968   movbool(rbx, do_not_unlock_if_synchronized);
 969   movbool(do_not_unlock_if_synchronized, false); // reset the flag
 970 
 971  // get method access flags
 972   movptr(rcx, Address(rbp, frame::interpreter_frame_method_offset * wordSize));
 973   movl(rcx, Address(rcx, Method::access_flags_offset()));
 974   testl(rcx, JVM_ACC_SYNCHRONIZED);
 975   jcc(Assembler::zero, unlocked);
 976 
 977   // Don't unlock anything if the _do_not_unlock_if_synchronized flag
 978   // is set.
 979   testbool(rbx);
 980   jcc(Assembler::notZero, no_unlock);
 981 
 982   // unlock monitor
 983   push(state); // save result
 984 
 985   // BasicObjectLock will be first in list, since this is a
 986   // synchronized method. However, need to check that the object has
 987   // not been unlocked by an explicit monitorexit bytecode.
 988   const Address monitor(rbp, frame::interpreter_frame_initial_sp_offset *
 989                         wordSize - (int) sizeof(BasicObjectLock));
 990   // We use c_rarg1/rdx so that if we go slow path it will be the correct
 991   // register for unlock_object to pass to VM directly

1077     bind(loop);
1078     // check if current entry is used
1079     cmpptr(Address(rmon, BasicObjectLock::obj_offset()), NULL_WORD);
1080     jcc(Assembler::notEqual, exception);
1081 
1082     addptr(rmon, entry_size); // otherwise advance to next entry
1083     bind(entry);
1084     cmpptr(rmon, rbx); // check if bottom reached
1085     jcc(Assembler::notEqual, loop); // if not at bottom then check this entry
1086   }
1087 
1088   bind(no_unlock);
1089 
1090   // jvmti support
1091   if (notify_jvmdi) {
1092     notify_method_exit(state, NotifyJVMTI);    // preserve TOSCA
1093   } else {
1094     notify_method_exit(state, SkipNotifyJVMTI); // preserve TOSCA
1095   }
1096 
1097   // remove activation
1098   // get sender sp
1099   movptr(rbx,
1100          Address(rbp, frame::interpreter_frame_sender_sp_offset * wordSize));
1101   if (StackReservedPages > 0) {


1102     // testing if reserved zone needs to be re-enabled
1103     Register rthread = LP64_ONLY(r15_thread) NOT_LP64(rcx);
1104     Label no_reserved_zone_enabling;
1105 
1106     NOT_LP64(get_thread(rthread);)
1107 
1108     // check if already enabled - if so no re-enabling needed
1109     assert(sizeof(StackOverflow::StackGuardState) == 4, "unexpected size");
1110     cmpl(Address(rthread, JavaThread::stack_guard_state_offset()), StackOverflow::stack_guard_enabled);
1111     jcc(Assembler::equal, no_reserved_zone_enabling);
1112 
1113     cmpptr(rbx, Address(rthread, JavaThread::reserved_stack_activation_offset()));
1114     jcc(Assembler::lessEqual, no_reserved_zone_enabling);
1115 
1116     call_VM_leaf(
1117       CAST_FROM_FN_PTR(address, SharedRuntime::enable_stack_reserved_zone), rthread);
1118     call_VM(noreg, CAST_FROM_FN_PTR(address,
1119                    InterpreterRuntime::throw_delayed_StackOverflowError));
1120     should_not_reach_here();
1121 
1122     bind(no_reserved_zone_enabling);
1123   }








































1124   leave();                           // remove frame anchor
1125   pop(ret_addr);                     // get return address
1126   mov(rsp, rbx);                     // set sp to sender sp
1127   pop_cont_fastpath();
1128 }
1129 
1130 void InterpreterMacroAssembler::get_method_counters(Register method,
1131                                                     Register mcs, Label& skip) {
       // Loads the MethodCounters pointer of `method` into `mcs`.
       //
       //   method: register holding the Method*
       //   mcs:    receives the value read at Method::method_counters_offset()
       //   skip:   branch target taken when the pointer is still null after
       //           the runtime call
       //
       // On fall-through (label has_counters) `mcs` is non-null.
1132   Label has_counters;
       // Fast path: the counters already exist.
1133   movptr(mcs, Address(method, Method::method_counters_offset()));
1134   testptr(mcs, mcs);
1135   jcc(Assembler::notZero, has_counters);
       // Slow path: ask the runtime to build them, then reload the field.
1136   call_VM(noreg, CAST_FROM_FN_PTR(address,
1137           InterpreterRuntime::build_method_counters), method);
1138   movptr(mcs, Address(method,Method::method_counters_offset()));
1139   testptr(mcs, mcs);
1140   jcc(Assembler::zero, skip); // No MethodCounters allocated, OutOfMemory
1141   bind(has_counters);
1142 }
1143 





























































1144 
1145 // Lock object
1146 //
1147 // Args:
1148 //      rdx, c_rarg1: BasicObjectLock to be used for locking
1149 //
1150 // Kills:
1151 //      rax, rbx
1152 void InterpreterMacroAssembler::lock_object(Register lock_reg) {
1153   assert(lock_reg == LP64_ONLY(c_rarg1) NOT_LP64(rdx),
1154          "The argument is only for looks. It must be c_rarg1");
1155 
1156   if (LockingMode == LM_MONITOR) {
1157     call_VM(noreg,
1158             CAST_FROM_FN_PTR(address, InterpreterRuntime::monitorenter),
1159             lock_reg);
1160   } else {
1161     Label count_locking, done, slow_case;
1162 
1163     const Register swap_reg = rax; // Must use rax for cmpxchg instruction

1176     if (DiagnoseSyncOnValueBasedClasses != 0) {
1177       load_klass(tmp_reg, obj_reg, rklass_decode_tmp);
1178       testb(Address(tmp_reg, Klass::misc_flags_offset()), KlassFlags::_misc_is_value_based_class);
1179       jcc(Assembler::notZero, slow_case);
1180     }
1181 
1182     if (LockingMode == LM_LIGHTWEIGHT) {
1183 #ifdef _LP64
1184       const Register thread = r15_thread;
1185       lightweight_lock(lock_reg, obj_reg, swap_reg, thread, tmp_reg, slow_case);
1186 #else
1187       // Lacking registers and thread on x86_32. Always take slow path.
1188       jmp(slow_case);
1189 #endif
1190     } else if (LockingMode == LM_LEGACY) {
1191       // Load immediate 1 into swap_reg %rax
1192       movl(swap_reg, 1);
1193 
1194       // Load (object->mark() | 1) into swap_reg %rax
1195       orptr(swap_reg, Address(obj_reg, oopDesc::mark_offset_in_bytes()));




1196 
1197       // Save (object->mark() | 1) into BasicLock's displaced header
1198       movptr(Address(lock_reg, mark_offset), swap_reg);
1199 
1200       assert(lock_offset == 0,
1201              "displaced header must be first word in BasicObjectLock");
1202 
1203       lock();
1204       cmpxchgptr(lock_reg, Address(obj_reg, oopDesc::mark_offset_in_bytes()));
1205       jcc(Assembler::zero, count_locking);
1206 
1207       const int zero_bits = LP64_ONLY(7) NOT_LP64(3);
1208 
1209       // Fast check for recursive lock.
1210       //
1211       // Can apply the optimization only if this is a stack lock
1212       // allocated in this thread. For efficiency, we can focus on
1213       // recently allocated stack locks (instead of reading the stack
1214       // base and checking whether 'mark' points inside the current
1215       // thread stack):

1533     test_method_data_pointer(mdp, profile_continue);
1534 
1535     // We are taking a branch.  Increment the taken count.
1536     // We inline increment_mdp_data_at to return bumped_count in a register
1537     //increment_mdp_data_at(mdp, in_bytes(JumpData::taken_offset()));
1538     Address data(mdp, in_bytes(JumpData::taken_offset()));
1539     movptr(bumped_count, data);
1540     assert(DataLayout::counter_increment == 1,
1541             "flow-free idiom only works with 1");
1542     addptr(bumped_count, DataLayout::counter_increment);
1543     sbbptr(bumped_count, 0);
1544     movptr(data, bumped_count); // Store back out
1545 
1546     // The method data pointer needs to be updated to reflect the new target.
1547     update_mdp_by_offset(mdp, in_bytes(JumpData::displacement_offset()));
1548     bind(profile_continue);
1549   }
1550 }
1551 
1552 
1553 void InterpreterMacroAssembler::profile_not_taken_branch(Register mdp) {
       // Profiling for a branch that is not taken: bumps the not-taken
       // counter of the current BranchData and advances the method data
       // pointer past it. Generates nothing unless ProfileInterpreter is set.
       //
       //   mdp: register used for the method data pointer; set up by
       //        test_method_data_pointer below
1554   if (ProfileInterpreter) {
1555     Label profile_continue;
1556 
1557     // If no method data exists, go to profile_continue.
1558     test_method_data_pointer(mdp, profile_continue);
1559 
1560     // We are not taking the branch.  Increment the not taken count.
1561     increment_mdp_data_at(mdp, in_bytes(BranchData::not_taken_offset()));
1562 
1563     // The method data pointer needs to be updated to correspond to
1564     // the next bytecode
1565     update_mdp_by_constant(mdp, in_bytes(BranchData::branch_data_size()));
1566     bind(profile_continue);
1567   }
1568 }
1569 
1570 void InterpreterMacroAssembler::profile_call(Register mdp) {
       // Profiling for a call: bumps the CounterData count at the current
       // method data pointer and advances the pointer by the size of one
       // CounterData. Generates nothing unless ProfileInterpreter is set.
       //
       //   mdp: register used for the method data pointer; set up by
       //        test_method_data_pointer below
1571   if (ProfileInterpreter) {
1572     Label profile_continue;
1573 
1574     // If no method data exists, go to profile_continue.
1575     test_method_data_pointer(mdp, profile_continue);
1576 
1577     // We are making a call.  Increment the count.
1578     increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset()));
1579 
1580     // The method data pointer needs to be updated to reflect the new target.
1581     update_mdp_by_constant(mdp, in_bytes(CounterData::counter_data_size()));
1582     bind(profile_continue);
1583   }
1584 }
1585 

1608                                                      Register reg2,
1609                                                      bool receiver_can_be_null) {
1610   if (ProfileInterpreter) {
1611     Label profile_continue;
1612 
1613     // If no method data exists, go to profile_continue.
1614     test_method_data_pointer(mdp, profile_continue);
1615 
1616     Label skip_receiver_profile;
1617     if (receiver_can_be_null) {
1618       Label not_null;
1619       testptr(receiver, receiver);
1620       jccb(Assembler::notZero, not_null);
1621       // We are making a call.  Increment the count for null receiver.
1622       increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset()));
1623       jmp(skip_receiver_profile);
1624       bind(not_null);
1625     }
1626 
1627     // Record the receiver type.
1628     record_klass_in_profile(receiver, mdp, reg2, true);
1629     bind(skip_receiver_profile);
1630 
1631     // The method data pointer needs to be updated to reflect the new target.
1632     update_mdp_by_constant(mdp, in_bytes(VirtualCallData::virtual_call_data_size()));
1633     bind(profile_continue);
1634   }
1635 }
1636 
1637 // This routine creates a state machine for updating the multi-row
1638 // type profile at a virtual call site (or other type-sensitive bytecode).
1639 // The machine visits each row (of receiver/count) until the receiver type
1640 // is found, or until it runs out of rows.  At the same time, it remembers
1641 // the location of the first empty row.  (An empty row records null for its
1642 // receiver, and can be allocated for a newly-observed receiver type.)
1643 // Because there are two degrees of freedom in the state, a simple linear
1644 // search will not work; it must be a decision tree.  Hence this helper
1645 // function is recursive, to generate the required tree structured code.
1646 // It's the interpreter, so we are trading off code space for speed.
1647 // See below for example code.
     //
     // In this body the row-by-row work is delegated to
     // record_item_in_profile_helper, using the VirtualCallData receiver and
     // receiver-count offset functions and TypeProfileWidth rows.
1648 void InterpreterMacroAssembler::record_klass_in_profile_helper(
1649                                         Register receiver, Register mdp,
1650                                         Register reg2, int start_row,
1651                                         Label& done, bool is_virtual_call) {
       // NOTE(review): `start_row` and `is_virtual_call` are not read in this
       // body; the delegation below always starts at row 0. Confirm that no
       // caller relies on a non-zero start_row.
1652   if (TypeProfileWidth == 0) {
         // No receiver rows configured: only bump the CounterData count.
1653     increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset()));
1654   } else {
1655     record_item_in_profile_helper(receiver, mdp, reg2, 0, done, TypeProfileWidth,
1656                                   &VirtualCallData::receiver_offset, &VirtualCallData::receiver_count_offset);
1657   }
1658 }
1659 
1660 void InterpreterMacroAssembler::record_item_in_profile_helper(Register item, Register mdp, Register reg2, int start_row,
1661                                                               Label& done, int total_rows,
1662                                                               OffsetFunction item_offset_fn,
1663                                                               OffsetFunction item_count_offset_fn) {
1664   int last_row = total_rows - 1;
1665   assert(start_row <= last_row, "must be work left to do");
1666   // Test this row for both the item and for null.
1667   // Take any of three different outcomes:
1668   //   1. found item => increment count and goto done
1669   //   2. found null => keep looking for case 1, maybe allocate this cell
1670   //   3. found something else => keep looking for cases 1 and 2
1671   // Case 3 is handled by a recursive call.

1735 //     // inner copy of decision tree, rooted at row[1]
1736 //     if (row[1].rec == rec) { row[1].incr(); goto done; }
1737 //     if (row[1].rec != nullptr) {
1738 //       // degenerate decision tree, rooted at row[2]
1739 //       if (row[2].rec == rec) { row[2].incr(); goto done; }
1740 //       if (row[2].rec != nullptr) { count.incr(); goto done; } // overflow
1741 //       row[2].init(rec); goto done;
1742 //     } else {
1743 //       // remember row[1] is empty
1744 //       if (row[2].rec == rec) { row[2].incr(); goto done; }
1745 //       row[1].init(rec); goto done;
1746 //     }
1747 //   } else {
1748 //     // remember row[0] is empty
1749 //     if (row[1].rec == rec) { row[1].incr(); goto done; }
1750 //     if (row[2].rec == rec) { row[2].incr(); goto done; }
1751 //     row[0].init(rec); goto done;
1752 //   }
1753 //   done:
1754 
1755 void InterpreterMacroAssembler::record_klass_in_profile(Register receiver,
1756                                                         Register mdp, Register reg2,
1757                                                         bool is_virtual_call) {
       // Entry point for recording `receiver` in the type profile at `mdp`.
       // Declares the local `done` label, lets
       // record_klass_in_profile_helper generate the update code starting at
       // row 0, and binds `done` right after it.
       //
       //   receiver:        register holding the klass to record
       //   mdp:             method data pointer register
       //   reg2:            scratch register handed to the helper
       //   is_virtual_call: forwarded unchanged to the helper
       //
       // Must only be called when ProfileInterpreter is set (asserted).
1758   assert(ProfileInterpreter, "must be profiling");
1759   Label done;
1760 
1761   record_klass_in_profile_helper(receiver, mdp, reg2, 0, done, is_virtual_call);
1762 
1763   bind (done);
1764 }
1765 
1766 void InterpreterMacroAssembler::profile_ret(Register return_bci,
1767                                             Register mdp) {
1768   if (ProfileInterpreter) {
1769     Label profile_continue;
1770     uint row;
1771 
1772     // If no method data exists, go to profile_continue.
1773     test_method_data_pointer(mdp, profile_continue);
1774 
1775     // Update the total ret count.
1776     increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset()));
1777 
1778     for (row = 0; row < RetData::row_limit(); row++) {
1779       Label next_test;
1780 
1781       // See if return_bci is equal to bci[n]:

1818     update_mdp_by_constant(mdp, mdp_delta);
1819 
1820     bind(profile_continue);
1821   }
1822 }
1823 
1824 
1825 void InterpreterMacroAssembler::profile_typecheck(Register mdp, Register klass, Register reg2) {
       // Profiling for a type check. Generates nothing unless
       // ProfileInterpreter is set.
       //
       //   mdp:   method data pointer register; set up by
       //          test_method_data_pointer below
       //   klass: register holding the klass being checked
       //   reg2:  scratch register for record_klass_in_profile; on 32-bit it
       //          must be rdi (asserted), which is restored afterwards via
       //          restore_locals()
       //
       // With TypeProfileCasts the klass is recorded and mdp advances by the
       // size of a VirtualCallData; otherwise nothing is recorded and mdp
       // advances by the size of a BitData.
1826   if (ProfileInterpreter) {
1827     Label profile_continue;
1828 
1829     // If no method data exists, go to profile_continue.
1830     test_method_data_pointer(mdp, profile_continue);
1831 
1832     // The method data pointer needs to be updated.
1833     int mdp_delta = in_bytes(BitData::bit_data_size());
1834     if (TypeProfileCasts) {
1835       mdp_delta = in_bytes(VirtualCallData::virtual_call_data_size());
1836 
1837       // Record the object type.
1838       record_klass_in_profile(klass, mdp, reg2, false);
1839       NOT_LP64(assert(reg2 == rdi, "we know how to fix this blown reg");)
1840       NOT_LP64(restore_locals();)         // Restore EDI
1841     }
1842     update_mdp_by_constant(mdp, mdp_delta);
1843 
1844     bind(profile_continue);
1845   }
1846 }
1847 
1848 
1849 void InterpreterMacroAssembler::profile_switch_default(Register mdp) {
1850   if (ProfileInterpreter) {
1851     Label profile_continue;
1852 
1853     // If no method data exists, go to profile_continue.
1854     test_method_data_pointer(mdp, profile_continue);
1855 
1856     // Update the default case count
1857     increment_mdp_data_at(mdp,
1858                           in_bytes(MultiBranchData::default_count_offset()));

1880     // case_array_offset_in_bytes()
1881     movl(reg2, in_bytes(MultiBranchData::per_case_size()));
1882     imulptr(index, reg2); // XXX l ?
1883     addptr(index, in_bytes(MultiBranchData::case_array_offset())); // XXX l ?
1884 
1885     // Update the case count
1886     increment_mdp_data_at(mdp,
1887                           index,
1888                           in_bytes(MultiBranchData::relative_count_offset()));
1889 
1890     // The method data pointer needs to be updated.
1891     update_mdp_by_offset(mdp,
1892                          index,
1893                          in_bytes(MultiBranchData::
1894                                   relative_displacement_offset()));
1895 
1896     bind(profile_continue);
1897   }
1898 }
1899 


















































































































1900 
1901 
1902 void InterpreterMacroAssembler::_interp_verify_oop(Register reg, TosState state, const char* file, int line) {
       // Calls MacroAssembler::_verify_oop_checked on `reg` only when `state`
       // is atos; for every other TosState nothing is generated. `file` and
       // `line` are forwarded unchanged together with the fixed message
       // "broken oop".
1903   if (state == atos) {
1904     MacroAssembler::_verify_oop_checked(reg, "broken oop", file, line);
1905   }
1906 }
1907 
1908 void InterpreterMacroAssembler::verify_FPU(int stack_depth, TosState state) {
       // When _LP64 is defined the body is empty. Otherwise
       // MacroAssembler::verify_FPU(stack_depth) is called only for
       //   - state == ftos with UseSSE < 1, or
       //   - state == dtos with UseSSE < 2
       // (presumably the cases where the value lives on the x87 stack --
       // TODO confirm).
1909 #ifndef _LP64
1910   if ((state == ftos && UseSSE < 1) ||
1911       (state == dtos && UseSSE < 2)) {
1912     MacroAssembler::verify_FPU(stack_depth);
1913   }
1914 #endif
1915 }
1916 
1917 // Jump if ((*counter_addr += increment) & mask) == 0
1918 void InterpreterMacroAssembler::increment_mask_and_jump(Address counter_addr, Address mask,
1919                                                         Register scratch, Label* where) {

   1 /*
   2  * Copyright (c) 1997, 2025, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  *
  23  */
  24 
  25 #include "precompiled.hpp"
  26 #include "compiler/compiler_globals.hpp"
  27 #include "interp_masm_x86.hpp"
  28 #include "interpreter/interpreter.hpp"
  29 #include "interpreter/interpreterRuntime.hpp"
  30 #include "logging/log.hpp"
  31 #include "oops/arrayOop.hpp"
  32 #include "oops/constMethodFlags.hpp"
  33 #include "oops/markWord.hpp"
  34 #include "oops/methodData.hpp"
  35 #include "oops/method.hpp"
  36 #include "oops/inlineKlass.hpp"
  37 #include "oops/resolvedFieldEntry.hpp"
  38 #include "oops/resolvedIndyEntry.hpp"
  39 #include "oops/resolvedMethodEntry.hpp"
  40 #include "prims/jvmtiExport.hpp"
  41 #include "prims/jvmtiThreadState.hpp"
  42 #include "runtime/basicLock.hpp"
  43 #include "runtime/frame.inline.hpp"
  44 #include "runtime/javaThread.hpp"
  45 #include "runtime/safepointMechanism.hpp"
  46 #include "runtime/sharedRuntime.hpp"
  47 #include "utilities/powerOfTwo.hpp"
  48 
  49 // Implementation of InterpreterMacroAssembler
  50 
  51 void InterpreterMacroAssembler::jump_to_entry(address entry) {
       // Jumps to `entry` by calling jump() on a RuntimeAddress that wraps it.
       // `entry` must be non-null; the assert below checks this before the
       // jump is generated.
  52   assert(entry, "Entry must have been generated by now");
  53   jump(RuntimeAddress(entry));
  54 }
  55 
  56 void InterpreterMacroAssembler::profile_obj_type(Register obj, const Address& mdo_addr) {

 158         Address mdo_arg_addr(mdp, in_bytes(TypeEntriesAtCall::argument_type_offset(i))-off_to_args);
 159         profile_obj_type(tmp, mdo_arg_addr);
 160 
 161         int to_add = in_bytes(TypeStackSlotEntries::per_arg_size());
 162         addptr(mdp, to_add);
 163         off_to_args += to_add;
 164       }
 165 
 166       if (MethodData::profile_return()) {
 167         movptr(tmp, Address(mdp, in_bytes(TypeEntriesAtCall::cell_count_offset())-off_to_args));
 168         subl(tmp, TypeProfileArgsLimit*TypeStackSlotEntries::per_arg_count());
 169       }
 170 
 171       bind(done);
 172 
 173       if (MethodData::profile_return()) {
 174         // We're right after the type profile for the last
 175         // argument. tmp is the number of cells left in the
 176         // CallTypeData/VirtualCallTypeData to reach its end. Non null
 177         // if there's a return to profile.
 178         assert(SingleTypeEntry::static_cell_count() < TypeStackSlotEntries::per_arg_count(), "can't move past ret type");
 179         shll(tmp, log2i_exact((int)DataLayout::cell_size));
 180         addptr(mdp, tmp);
 181       }
 182       movptr(Address(rbp, frame::interpreter_frame_mdp_offset * wordSize), mdp);
 183     } else {
 184       assert(MethodData::profile_return(), "either profile call args or call ret");
 185       update_mdp_by_constant(mdp, in_bytes(TypeEntriesAtCall::return_only_size()));
 186     }
 187 
 188     // mdp points right after the end of the
 189     // CallTypeData/VirtualCallTypeData, right after the cells for the
 190     // return value type if there's one
 191 
 192     bind(profile_continue);
 193   }
 194 }
 195 
 196 void InterpreterMacroAssembler::profile_return_type(Register mdp, Register ret, Register tmp) {
 197   assert_different_registers(mdp, ret, tmp, _bcp_register);
 198   if (ProfileInterpreter && MethodData::profile_return()) {

 203     if (MethodData::profile_return_jsr292_only()) {
 204       assert(Method::intrinsic_id_size_in_bytes() == 2, "assuming Method::_intrinsic_id is u2");
 205 
 206       // If we don't profile all invoke bytecodes we must make sure
 207       // it's a bytecode we indeed profile. We can't go back to the
 208       // beginning of the ProfileData we intend to update to check its
 209       // type because we're right after it and we don't know its
 210       // length
 211       Label do_profile;
 212       cmpb(Address(_bcp_register, 0), Bytecodes::_invokedynamic);
 213       jcc(Assembler::equal, do_profile);
 214       cmpb(Address(_bcp_register, 0), Bytecodes::_invokehandle);
 215       jcc(Assembler::equal, do_profile);
 216       get_method(tmp);
 217       cmpw(Address(tmp, Method::intrinsic_id_offset()), static_cast<int>(vmIntrinsics::_compiledLambdaForm));
 218       jcc(Assembler::notEqual, profile_continue);
 219 
 220       bind(do_profile);
 221     }
 222 
 223     Address mdo_ret_addr(mdp, -in_bytes(SingleTypeEntry::size()));
 224     mov(tmp, ret);
 225     profile_obj_type(tmp, mdo_ret_addr);
 226 
 227     bind(profile_continue);
 228   }
 229 }
 230 
 231 void InterpreterMacroAssembler::profile_parameters_type(Register mdp, Register tmp1, Register tmp2) {
 232   if (ProfileInterpreter && MethodData::profile_parameters()) {
 233     Label profile_continue;
 234 
 235     test_method_data_pointer(mdp, profile_continue);
 236 
 237     // Load the offset of the area within the MDO used for
 238     // parameters. If it's negative we're not profiling any parameters
 239     movl(tmp1, Address(mdp, in_bytes(MethodData::parameters_type_data_di_offset()) - in_bytes(MethodData::data_offset())));
 240     testl(tmp1, tmp1);
 241     jcc(Assembler::negative, profile_continue);
 242 
 243     // Compute a pointer to the area for parameters from the offset

 493                                                              Register cpool,
 494                                                              Register index) {
 495   assert_different_registers(cpool, index);
 496 
 497   movw(index, Address(cpool, index, Address::times_ptr, sizeof(ConstantPool)));
 498   Register resolved_klasses = cpool;
 499   movptr(resolved_klasses, Address(cpool, ConstantPool::resolved_klasses_offset()));
 500   movptr(klass, Address(resolved_klasses, index, Address::times_ptr, Array<Klass*>::base_offset_in_bytes()));
 501 }
 502 
 503 // Generate a subtype check: branch to ok_is_subtype if sub_klass is a
 504 // subtype of super_klass.
 505 //
 506 // Args:
 507 //      rax: superklass
 508 //      Rsub_klass: subklass
     //      ok_is_subtype: label handed to check_klass_subtype as the success target
     //      profile: when true, profile_typecheck is emitted for Rsub_klass
     //               before the actual check
 509 //
 510 // Kills:
 511 //      rcx, rdi
 512 void InterpreterMacroAssembler::gen_subtype_check(Register Rsub_klass,
 513                                                   Label& ok_is_subtype,
 514                                                   bool profile) {
       // Rsub_klass must not alias rax (the superklass), the registers this
       // routine uses as temporaries (rcx, rdi) or, on 64-bit, r13/r14.
 515   assert(Rsub_klass != rax, "rax holds superklass");
 516   LP64_ONLY(assert(Rsub_klass != r14, "r14 holds locals");)
 517   LP64_ONLY(assert(Rsub_klass != r13, "r13 holds bcp");)
 518   assert(Rsub_klass != rcx, "rcx holds 2ndary super array length");
 519   assert(Rsub_klass != rdi, "rdi holds 2ndary super array scan ptr");
 520
 521   // Profile the not-null value's klass.
 522   if (profile) {
         // rcx is passed as the mdp register and rdi as the scratch register.
 523     profile_typecheck(rcx, Rsub_klass, rdi); // blows rcx, reloads rdi
 524   }
 525
 526   // Do the check.
 527   check_klass_subtype(Rsub_klass, rax, rcx, ok_is_subtype); // blows rcx
 528 }
 529 
 530 
 531 #ifndef _LP64
 532 void InterpreterMacroAssembler::f2ieee() {
       // 32-bit only (this definition sits inside #ifndef _LP64).
       // Emits code only when IEEEPrecision is set: the x87 top-of-stack is
       // stored (and popped) as a single-precision value at [rsp] and then
       // loaded straight back. Presumably this forces rounding to float
       // precision -- confirm against the callers.
       // NOTE(review): the word at Address(rsp, 0) is overwritten.
 533   if (IEEEPrecision) {
 534     fstp_s(Address(rsp, 0));
 535     fld_s(Address(rsp, 0));
 536   }
 537 }
 538 
 539 
 540 void InterpreterMacroAssembler::d2ieee() {
 541   if (IEEEPrecision) {
 542     fstp_d(Address(rsp, 0));
 543     fld_d(Address(rsp, 0));
 544   }

 956   // the stack, will call InterpreterRuntime::at_unwind.
 957   Label slow_path;
 958   Label fast_path;
 959   safepoint_poll(slow_path, rthread, true /* at_return */, false /* in_nmethod */);
 960   jmp(fast_path);
 961   bind(slow_path);
 962   push(state);
 963   set_last_Java_frame(rthread, noreg, rbp, (address)pc(), rscratch1);
 964   super_call_VM_leaf(CAST_FROM_FN_PTR(address, InterpreterRuntime::at_unwind), rthread);
 965   NOT_LP64(get_thread(rthread);) // call_VM clobbered it, restore
 966   reset_last_Java_frame(rthread, true);
 967   pop(state);
 968   bind(fast_path);
 969 
 970   // get the value of _do_not_unlock_if_synchronized into rbx
 971   const Address do_not_unlock_if_synchronized(rthread,
 972     in_bytes(JavaThread::do_not_unlock_if_synchronized_offset()));
 973   movbool(rbx, do_not_unlock_if_synchronized);
 974   movbool(do_not_unlock_if_synchronized, false); // reset the flag
 975 
 976   // get method access flags
 977   movptr(rcx, Address(rbp, frame::interpreter_frame_method_offset * wordSize));
 978   movl(rcx, Address(rcx, Method::access_flags_offset()));
 979   testl(rcx, JVM_ACC_SYNCHRONIZED);
 980   jcc(Assembler::zero, unlocked);
 981 
 982   // Don't unlock anything if the _do_not_unlock_if_synchronized flag
 983   // is set.
 984   testbool(rbx);
 985   jcc(Assembler::notZero, no_unlock);
 986 
 987   // unlock monitor
 988   push(state); // save result
 989 
 990   // BasicObjectLock will be first in list, since this is a
 991   // synchronized method. However, need to check that the object has
 992   // not been unlocked by an explicit monitorexit bytecode.
 993   const Address monitor(rbp, frame::interpreter_frame_initial_sp_offset *
 994                         wordSize - (int) sizeof(BasicObjectLock));
 995   // We use c_rarg1/rdx so that if we go slow path it will be the correct
 996   // register for unlock_object to pass to VM directly

1082     bind(loop);
1083     // check if current entry is used
1084     cmpptr(Address(rmon, BasicObjectLock::obj_offset()), NULL_WORD);
1085     jcc(Assembler::notEqual, exception);
1086 
1087     addptr(rmon, entry_size); // otherwise advance to next entry
1088     bind(entry);
1089     cmpptr(rmon, rbx); // check if bottom reached
1090     jcc(Assembler::notEqual, loop); // if not at bottom then check this entry
1091   }
1092 
1093   bind(no_unlock);
1094 
1095   // jvmti support
1096   if (notify_jvmdi) {
1097     notify_method_exit(state, NotifyJVMTI);    // preserve TOSCA
1098   } else {
1099     notify_method_exit(state, SkipNotifyJVMTI); // preserve TOSCA
1100   }
1101 




1102   if (StackReservedPages > 0) {
1103     movptr(rbx,
1104                Address(rbp, frame::interpreter_frame_sender_sp_offset * wordSize));
1105     // testing if reserved zone needs to be re-enabled
1106     Register rthread = LP64_ONLY(r15_thread) NOT_LP64(rcx);
1107     Label no_reserved_zone_enabling;
1108 
1109     NOT_LP64(get_thread(rthread);)
1110 
1111     // check if already enabled - if so no re-enabling needed
1112     assert(sizeof(StackOverflow::StackGuardState) == 4, "unexpected size");
1113     cmpl(Address(rthread, JavaThread::stack_guard_state_offset()), StackOverflow::stack_guard_enabled);
1114     jcc(Assembler::equal, no_reserved_zone_enabling);
1115 
1116     cmpptr(rbx, Address(rthread, JavaThread::reserved_stack_activation_offset()));
1117     jcc(Assembler::lessEqual, no_reserved_zone_enabling);
1118 
1119     call_VM_leaf(
1120       CAST_FROM_FN_PTR(address, SharedRuntime::enable_stack_reserved_zone), rthread);
1121     call_VM(noreg, CAST_FROM_FN_PTR(address,
1122                    InterpreterRuntime::throw_delayed_StackOverflowError));
1123     should_not_reach_here();
1124 
1125     bind(no_reserved_zone_enabling);
1126   }
1127 
1128   // remove activation
1129   // get sender sp
1130   movptr(rbx,
1131          Address(rbp, frame::interpreter_frame_sender_sp_offset * wordSize));
1132 
1133   if (state == atos && InlineTypeReturnedAsFields) {
1134     // Check if we are returning an non-null inline type and load its fields into registers
1135     Label skip;
1136     test_oop_is_not_inline_type(rax, rscratch1, skip);
1137 
1138 #ifndef _LP64
1139     super_call_VM_leaf(StubRoutines::load_inline_type_fields_in_regs());
1140 #else
1141     // Load fields from a buffered value with an inline class specific handler
1142     load_klass(rdi, rax, rscratch1);
1143     movptr(rdi, Address(rdi, InstanceKlass::adr_inlineklass_fixed_block_offset()));
1144     movptr(rdi, Address(rdi, InlineKlass::unpack_handler_offset()));
1145     // Unpack handler can be null if inline type is not scalarizable in returns
1146     testptr(rdi, rdi);
1147     jcc(Assembler::zero, skip);
1148     call(rdi);
1149 #endif
1150 #ifdef ASSERT
1151     // TODO 8284443 Enable
1152     if (StressCallingConvention && false) {
1153       Label skip_stress;
1154       movptr(rscratch1, Address(rbp, frame::interpreter_frame_method_offset * wordSize));
1155       movl(rscratch1, Address(rscratch1, Method::flags_offset()));
1156       testl(rcx, MethodFlags::has_scalarized_return_flag());
1157       jcc(Assembler::zero, skip_stress);
1158       load_klass(rax, rax, rscratch1);
1159       orptr(rax, 1);
1160       bind(skip_stress);
1161     }
1162 #endif
1163     // call above kills the value in rbx. Reload it.
1164     movptr(rbx, Address(rbp, frame::interpreter_frame_sender_sp_offset * wordSize));
1165     bind(skip);
1166   }
1167   leave();                           // remove frame anchor
1168   pop(ret_addr);                     // get return address
1169   mov(rsp, rbx);                     // set sp to sender sp
1170   pop_cont_fastpath();
1171 }
1172
     // Load the MethodCounters pointer of 'method' into 'mcs', asking the
     // runtime to build the counters when the pointer is still null.
     //
     // Args:
     //      method: base register for the Method::method_counters_offset() load
     //      mcs:    receives the loaded pointer
     //      skip:   branched to when the pointer is still null after the
     //              runtime call
1173 void InterpreterMacroAssembler::get_method_counters(Register method,
1174                                                     Register mcs, Label& skip) {
1175   Label has_counters;
       // Fast path: the counters already exist.
1176   movptr(mcs, Address(method, Method::method_counters_offset()));
1177   testptr(mcs, mcs);
1178   jcc(Assembler::notZero, has_counters);
       // Slow path: let the runtime build them, then reload and test again.
1179   call_VM(noreg, CAST_FROM_FN_PTR(address,
1180           InterpreterRuntime::build_method_counters), method);
1181   movptr(mcs, Address(method,Method::method_counters_offset()));
1182   testptr(mcs, mcs);
1183   jcc(Assembler::zero, skip); // No MethodCounters allocated, OutOfMemory
1184   bind(has_counters);
1185 }
1186
     // Interpreter wrapper around MacroAssembler::allocate_instance. All
     // arguments are forwarded unchanged; when DTraceMethodProbes is enabled the
     // new object is additionally reported to SharedRuntime::dtrace_object_alloc.
1187 void InterpreterMacroAssembler::allocate_instance(Register klass, Register new_obj,
1188                                                   Register t1, Register t2,
1189                                                   bool clear_fields, Label& alloc_failed) {
1190   MacroAssembler::allocate_instance(klass, new_obj, t1, t2, clear_fields, alloc_failed);
1191   if (DTraceMethodProbes) {
1192     // Trigger dtrace event for fastpath
         // push(atos)/pop(atos) bracket the leaf call, presumably to preserve the
         // top-of-stack oop register across it -- confirm.
1193     push(atos);
         // The static_cast pins the int (*)(oopDesc*) signature of dtrace_object_alloc.
1194     call_VM_leaf(CAST_FROM_FN_PTR(address, static_cast<int (*)(oopDesc*)>(SharedRuntime::dtrace_object_alloc)), new_obj);
1195     pop(atos);
1196   }
1197 }
1198
     // Emit code that reads the flat field described by 'entry' out of 'obj'
     // and leaves the resulting oop in 'obj'.
     //
     // Three paths are generated:
     //   - empty inline klass: get_empty_inline_type_oop is used, no copy is made;
     //   - buffer allocation succeeds: the field payload is copied into the
     //     freshly allocated instance with flat_field_copy;
     //   - buffer allocation fails: InterpreterRuntime::read_flat_field is
     //     called and its result is fetched with get_vm_result.
     //
     // Args:
     //      entry: base register for the ResolvedFieldEntry loads (field index,
     //             field holder and field offset are read from it)
     //      tmp1:  scratch; holds the field's inline klass (field_klass)
     //      tmp2:  scratch; holds the field index, later the source address
     //      obj:   in: object being read from; out: result oop
     //
     // Also uses alloc_temp, dst_temp, r8 and r9 as temporaries.
1199 void InterpreterMacroAssembler::read_flat_field(Register entry, Register tmp1, Register tmp2, Register obj) {
1200   Label alloc_failed, empty_value, done;
1201   const Register alloc_temp = LP64_ONLY(rscratch1) NOT_LP64(rsi);
1202   const Register dst_temp   = LP64_ONLY(rscratch2) NOT_LP64(rdi);
       // NOTE(review): alloc_temp is not part of this check -- confirm that is intended.
1203   assert_different_registers(obj, entry, tmp1, tmp2, dst_temp, r8, r9);
1204
1205   // FIXME: code below could be re-written to better use InlineLayoutInfo data structure
1206   // see aarch64 version
1207
1208   // Grab the inline field klass
1209   const Register field_klass = tmp1;
1210   load_unsigned_short(tmp2, Address(entry, in_bytes(ResolvedFieldEntry::field_index_offset())));
1211   movptr(tmp1, Address(entry, ResolvedFieldEntry::field_holder_offset()));
1212   get_inline_type_field_klass(tmp1, tmp2, field_klass);
1213
1214   // check for empty value klass
1215   test_klass_is_empty_inline_type(field_klass, dst_temp, empty_value);
1216
1217   // allocate buffer
       // The pushed object is popped again either below into alloc_temp
       // (allocation succeeded) or at alloc_failed into obj.
1218   push(obj);  // push object being read from     // FIXME spilling on stack could probably be avoided by using tmp2
       // obj is reused as the register receiving the new buffer.
1219   allocate_instance(field_klass, obj, alloc_temp, dst_temp, false, alloc_failed);
1220
1221   // Have an oop instance buffer, copy into it
1222   load_unsigned_short(r9, Address(entry, in_bytes(ResolvedFieldEntry::field_index_offset())));
1223   movptr(r8, Address(entry, in_bytes(ResolvedFieldEntry::field_holder_offset())));
1224   inline_layout_info(r8, r9, r8); // holder, index, info => InlineLayoutInfo into r8
1225
1226   data_for_oop(obj, dst_temp, field_klass);
1227   pop(alloc_temp);             // restore object being read from
       // tmp2 = address of the field inside the object being read from
       // (object base + sign-extended field offset).
1228   load_sized_value(tmp2, Address(entry, in_bytes(ResolvedFieldEntry::field_offset_offset())), sizeof(int), true /*is_signed*/);
1229   lea(tmp2, Address(alloc_temp, tmp2));
1230   // call_VM_leaf, clobbers a few regs, save restore new obj
1231   push(obj);
1232   // access_value_copy(IS_DEST_UNINITIALIZED, tmp2, dst_temp, field_klass);
1233   flat_field_copy(IS_DEST_UNINITIALIZED, tmp2, dst_temp, r8);
1234   pop(obj);
1235   jmp(done);
1236
1237   bind(empty_value);
1238   get_empty_inline_type_oop(field_klass, dst_temp, obj);
1239   jmp(done);
1240
1241   bind(alloc_failed);
       // Balance the push(obj) done before the allocation attempt.
1242   pop(obj);
1243   call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::read_flat_field),
1244           obj, entry);
1245   get_vm_result(obj, r15_thread);
1246   bind(done);
1247 }
1248 
1249 // Lock object
1250 //
1251 // Args:
1252 //      rdx, c_rarg1: BasicObjectLock to be used for locking
1253 //
1254 // Kills:
1255 //      rax, rbx
1256 void InterpreterMacroAssembler::lock_object(Register lock_reg) {
1257   assert(lock_reg == LP64_ONLY(c_rarg1) NOT_LP64(rdx),
1258          "The argument is only for looks. It must be c_rarg1");
1259 
1260   if (LockingMode == LM_MONITOR) {
1261     call_VM(noreg,
1262             CAST_FROM_FN_PTR(address, InterpreterRuntime::monitorenter),
1263             lock_reg);
1264   } else {
1265     Label count_locking, done, slow_case;
1266 
1267     const Register swap_reg = rax; // Must use rax for cmpxchg instruction

1280     if (DiagnoseSyncOnValueBasedClasses != 0) {
1281       load_klass(tmp_reg, obj_reg, rklass_decode_tmp);
1282       testb(Address(tmp_reg, Klass::misc_flags_offset()), KlassFlags::_misc_is_value_based_class);
1283       jcc(Assembler::notZero, slow_case);
1284     }
1285 
1286     if (LockingMode == LM_LIGHTWEIGHT) {
1287 #ifdef _LP64
1288       const Register thread = r15_thread;
1289       lightweight_lock(lock_reg, obj_reg, swap_reg, thread, tmp_reg, slow_case);
1290 #else
1291       // Lacking registers and thread on x86_32. Always take slow path.
1292       jmp(slow_case);
1293 #endif
1294     } else if (LockingMode == LM_LEGACY) {
1295       // Load immediate 1 into swap_reg %rax
1296       movl(swap_reg, 1);
1297 
1298       // Load (object->mark() | 1) into swap_reg %rax
1299       orptr(swap_reg, Address(obj_reg, oopDesc::mark_offset_in_bytes()));
1300       if (EnableValhalla) {
1301         // Mask inline_type bit such that we go to the slow path if object is an inline type
1302         andptr(swap_reg, ~((int) markWord::inline_type_bit_in_place));
1303       }
1304 
1305       // Save (object->mark() | 1) into BasicLock's displaced header
1306       movptr(Address(lock_reg, mark_offset), swap_reg);
1307 
1308       assert(lock_offset == 0,
1309              "displaced header must be first word in BasicObjectLock");
1310 
1311       lock();
1312       cmpxchgptr(lock_reg, Address(obj_reg, oopDesc::mark_offset_in_bytes()));
1313       jcc(Assembler::zero, count_locking);
1314 
1315       const int zero_bits = LP64_ONLY(7) NOT_LP64(3);
1316 
1317       // Fast check for recursive lock.
1318       //
1319       // Can apply the optimization only if this is a stack lock
1320       // allocated in this thread. For efficiency, we can focus on
1321       // recently allocated stack locks (instead of reading the stack
1322       // base and checking whether 'mark' points inside the current
1323       // thread stack):

1641     test_method_data_pointer(mdp, profile_continue);
1642 
1643     // We are taking a branch.  Increment the taken count.
1644     // We inline increment_mdp_data_at to return bumped_count in a register
1645     //increment_mdp_data_at(mdp, in_bytes(JumpData::taken_offset()));
1646     Address data(mdp, in_bytes(JumpData::taken_offset()));
1647     movptr(bumped_count, data);
1648     assert(DataLayout::counter_increment == 1,
1649             "flow-free idiom only works with 1");
1650     addptr(bumped_count, DataLayout::counter_increment);
1651     sbbptr(bumped_count, 0);
1652     movptr(data, bumped_count); // Store back out
1653 
1654     // The method data pointer needs to be updated to reflect the new target.
1655     update_mdp_by_offset(mdp, in_bytes(JumpData::displacement_offset()));
1656     bind(profile_continue);
1657   }
1658 }
1659 
1660
     // Profile a branch that was not taken: bump the not-taken counter and
     // advance mdp past the current profile entry.
     //
     // Args:
     //      mdp:  method data pointer register
     //      acmp: when true the entry is skipped using ACmpData::acmp_data_size(),
     //            otherwise using BranchData::branch_data_size()
1661 void InterpreterMacroAssembler::profile_not_taken_branch(Register mdp, bool acmp) {
1662   if (ProfileInterpreter) {
1663     Label profile_continue;
1664
1665     // If no method data exists, go to profile_continue.
1666     test_method_data_pointer(mdp, profile_continue);
1667
1668     // We are not taking the branch.  Increment the not taken count.
1669     increment_mdp_data_at(mdp, in_bytes(BranchData::not_taken_offset()));
1670
1671     // The method data pointer needs to be updated to correspond to
1672     // the next bytecode
1673     update_mdp_by_constant(mdp, acmp ? in_bytes(ACmpData::acmp_data_size()): in_bytes(BranchData::branch_data_size()));
1674     bind(profile_continue);
1675   }
1676 }
1677
     // Profile a call: bump the CounterData count and advance mdp by
     // CounterData::counter_data_size(). Emits nothing unless ProfileInterpreter
     // is set.
     //
     // Args:
     //      mdp: method data pointer register
1678 void InterpreterMacroAssembler::profile_call(Register mdp) {
1679   if (ProfileInterpreter) {
1680     Label profile_continue;
1681
1682     // If no method data exists, go to profile_continue.
1683     test_method_data_pointer(mdp, profile_continue);
1684
1685     // We are making a call.  Increment the count.
1686     increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset()));
1687
1688     // The method data pointer needs to be updated to reflect the new target.
1689     update_mdp_by_constant(mdp, in_bytes(CounterData::counter_data_size()));
1690     bind(profile_continue);
1691   }
1692 }
1693 

1716                                                      Register reg2,
1717                                                      bool receiver_can_be_null) {
1718   if (ProfileInterpreter) {
1719     Label profile_continue;
1720 
1721     // If no method data exists, go to profile_continue.
1722     test_method_data_pointer(mdp, profile_continue);
1723 
1724     Label skip_receiver_profile;
1725     if (receiver_can_be_null) {
1726       Label not_null;
1727       testptr(receiver, receiver);
1728       jccb(Assembler::notZero, not_null);
1729       // We are making a call.  Increment the count for null receiver.
1730       increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset()));
1731       jmp(skip_receiver_profile);
1732       bind(not_null);
1733     }
1734 
1735     // Record the receiver type.
1736     record_klass_in_profile(receiver, mdp, reg2);
1737     bind(skip_receiver_profile);
1738 
1739     // The method data pointer needs to be updated to reflect the new target.
1740     update_mdp_by_constant(mdp, in_bytes(VirtualCallData::virtual_call_data_size()));
1741     bind(profile_continue);
1742   }
1743 }
1744 
1745 // This routine creates a state machine for updating the multi-row
1746 // type profile at a virtual call site (or other type-sensitive bytecode).
1747 // The machine visits each row (of receiver/count) until the receiver type
1748 // is found, or until it runs out of rows.  At the same time, it remembers
1749 // the location of the first empty row.  (An empty row records null for its
1750 // receiver, and can be allocated for a newly-observed receiver type.)
1751 // Because there are two degrees of freedom in the state, a simple linear
1752 // search will not work; it must be a decision tree.  Hence this helper
1753 // function is recursive, to generate the required tree structured code.
1754 // It's the interpreter, so we are trading off code space for speed.
1755 // See below for example code.
     //
     // In this function the row handling itself is delegated to
     // record_item_in_profile_helper, using the VirtualCallData receiver and
     // receiver-count offsets and TypeProfileWidth rows.
     // NOTE(review): start_row is not used here; row 0 is always passed on.
1756 void InterpreterMacroAssembler::record_klass_in_profile_helper(Register receiver, Register mdp,
1757                                                                Register reg2, int start_row,
1758                                                                Label& done) {

1759   if (TypeProfileWidth == 0) {
         // No receiver rows to search: only bump the total count.
1760     increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset()));
1761   } else {
1762     record_item_in_profile_helper(receiver, mdp, reg2, 0, done, TypeProfileWidth,
1763                                   &VirtualCallData::receiver_offset, &VirtualCallData::receiver_count_offset);
1764   }
1765 }
1766 
1767 void InterpreterMacroAssembler::record_item_in_profile_helper(Register item, Register mdp, Register reg2, int start_row,
1768                                                               Label& done, int total_rows,
1769                                                               OffsetFunction item_offset_fn,
1770                                                               OffsetFunction item_count_offset_fn) {
1771   int last_row = total_rows - 1;
1772   assert(start_row <= last_row, "must be work left to do");
1773   // Test this row for both the item and for null.
1774   // Take any of three different outcomes:
1775   //   1. found item => increment count and goto done
1776   //   2. found null => keep looking for case 1, maybe allocate this cell
1777   //   3. found something else => keep looking for cases 1 and 2
1778   // Case 3 is handled by a recursive call.

1842 //     // inner copy of decision tree, rooted at row[1]
1843 //     if (row[1].rec == rec) { row[1].incr(); goto done; }
1844 //     if (row[1].rec != nullptr) {
1845 //       // degenerate decision tree, rooted at row[2]
1846 //       if (row[2].rec == rec) { row[2].incr(); goto done; }
1847 //       if (row[2].rec != nullptr) { count.incr(); goto done; } // overflow
1848 //       row[2].init(rec); goto done;
1849 //     } else {
1850 //       // remember row[1] is empty
1851 //       if (row[2].rec == rec) { row[2].incr(); goto done; }
1852 //       row[1].init(rec); goto done;
1853 //     }
1854 //   } else {
1855 //     // remember row[0] is empty
1856 //     if (row[1].rec == rec) { row[1].incr(); goto done; }
1857 //     if (row[2].rec == rec) { row[2].incr(); goto done; }
1858 //     row[0].init(rec); goto done;
1859 //   }
1860 //   done:
1861
     // Record 'receiver' in the type profile at 'mdp'. Emits the code produced by
     // record_klass_in_profile_helper (starting at row 0) and binds the shared
     // 'done' label right after it. Must only be called when ProfileInterpreter
     // is set (asserted).
     //
     // Args:
     //      receiver: register holding the klass to record
     //      mdp:      method data pointer register
     //      reg2:     scratch register handed to the helper
1862 void InterpreterMacroAssembler::record_klass_in_profile(Register receiver, Register mdp, Register reg2) {


1863   assert(ProfileInterpreter, "must be profiling");
1864   Label done;
1865
1866   record_klass_in_profile_helper(receiver, mdp, reg2, 0, done);
1867
1868   bind (done);
1869 }
1870 
1871 void InterpreterMacroAssembler::profile_ret(Register return_bci,
1872                                             Register mdp) {
1873   if (ProfileInterpreter) {
1874     Label profile_continue;
1875     uint row;
1876 
1877     // If no method data exists, go to profile_continue.
1878     test_method_data_pointer(mdp, profile_continue);
1879 
1880     // Update the total ret count.
1881     increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset()));
1882 
1883     for (row = 0; row < RetData::row_limit(); row++) {
1884       Label next_test;
1885 
1886       // See if return_bci is equal to bci[n]:

1923     update_mdp_by_constant(mdp, mdp_delta);
1924 
1925     bind(profile_continue);
1926   }
1927 }
1928 
1929
     // Profile a type check: optionally record 'klass' and advance mdp past the
     // profile entry. Emits nothing unless ProfileInterpreter is set.
     //
     // Args:
     //      mdp:   method data pointer register
     //      klass: register holding the klass to record
     //      reg2:  scratch register; on 32-bit it must be rdi, which is reloaded
     //             via restore_locals() after the klass has been recorded
1930 void InterpreterMacroAssembler::profile_typecheck(Register mdp, Register klass, Register reg2) {
1931   if (ProfileInterpreter) {
1932     Label profile_continue;
1933
1934     // If no method data exists, go to profile_continue.
1935     test_method_data_pointer(mdp, profile_continue);
1936
1937     // The method data pointer needs to be updated.
         // Default step is a BitData entry; with TypeProfileCasts the step is a
         // VirtualCallData entry instead.
1938     int mdp_delta = in_bytes(BitData::bit_data_size());
1939     if (TypeProfileCasts) {
1940       mdp_delta = in_bytes(VirtualCallData::virtual_call_data_size());
1941
1942       // Record the object type.
1943       record_klass_in_profile(klass, mdp, reg2);
1944       NOT_LP64(assert(reg2 == rdi, "we know how to fix this blown reg");)
1945       NOT_LP64(restore_locals();)         // Restore EDI
1946     }
1947     update_mdp_by_constant(mdp, mdp_delta);
1948
1949     bind(profile_continue);
1950   }
1951 }
1952 
1953 
1954 void InterpreterMacroAssembler::profile_switch_default(Register mdp) {
1955   if (ProfileInterpreter) {
1956     Label profile_continue;
1957 
1958     // If no method data exists, go to profile_continue.
1959     test_method_data_pointer(mdp, profile_continue);
1960 
1961     // Update the default case count
1962     increment_mdp_data_at(mdp,
1963                           in_bytes(MultiBranchData::default_count_offset()));

1985     // case_array_offset_in_bytes()
1986     movl(reg2, in_bytes(MultiBranchData::per_case_size()));
1987     imulptr(index, reg2); // XXX l ?
1988     addptr(index, in_bytes(MultiBranchData::case_array_offset())); // XXX l ?
1989 
1990     // Update the case count
1991     increment_mdp_data_at(mdp,
1992                           index,
1993                           in_bytes(MultiBranchData::relative_count_offset()));
1994 
1995     // The method data pointer needs to be updated.
1996     update_mdp_by_offset(mdp,
1997                          index,
1998                          in_bytes(MultiBranchData::
1999                                   relative_displacement_offset()));
2000 
2001     bind(profile_continue);
2002   }
2003 }
2004
     // Profile the type and properties of 'array' into the ArrayData entry at
     // mdp: the array's type is recorded at ArrayData::array_offset(), and the
     // flat-array / null-free-array flags are set unless the corresponding
     // test_non_* helper branches around them. This routine does not advance mdp.
     // Emits nothing unless ProfileInterpreter is set.
     //
     // Args:
     //      mdp:   method data pointer register
     //      array: register holding the array oop (not modified here directly)
     //      tmp:   scratch; receives a copy of 'array' for profile_obj_type and is
     //             then handed to the array tests as their temporary
2005 template <class ArrayData> void InterpreterMacroAssembler::profile_array_type(Register mdp,
2006                                                                               Register array,
2007                                                                               Register tmp) {
2008   if (ProfileInterpreter) {
2009     Label profile_continue;
2010
2011     // If no method data exists, go to profile_continue.
2012     test_method_data_pointer(mdp, profile_continue);
2013
         // profile_obj_type works on the copy in tmp, so 'array' stays available
         // for the tests below.
2014     mov(tmp, array);
2015     profile_obj_type(tmp, Address(mdp, in_bytes(ArrayData::array_offset())));
2016
2017     Label not_flat;
2018     test_non_flat_array_oop(array, tmp, not_flat);
2019
2020     set_mdp_flag_at(mdp, ArrayData::flat_array_byte_constant());
2021
2022     bind(not_flat);
2023
2024     Label not_null_free;
2025     test_non_null_free_array_oop(array, tmp, not_null_free);
2026
2027     set_mdp_flag_at(mdp, ArrayData::null_free_array_byte_constant());
2028
2029     bind(not_null_free);
2030
2031     bind(profile_continue);
2032   }
2033 }
2034
     // Explicit instantiations of profile_array_type for the two ArrayData
     // flavours named here: ArrayLoadData and ArrayStoreData.
2035 template void InterpreterMacroAssembler::profile_array_type<ArrayLoadData>(Register mdp,
2036                                                                            Register array,
2037                                                                            Register tmp);
2038 template void InterpreterMacroAssembler::profile_array_type<ArrayStoreData>(Register mdp,
2039                                                                             Register array,
2040                                                                             Register tmp);
2041 
2042
     // Profile the element of an array store: a null element sets the null_seen
     // flag, any other element has its klass recorded in the type profile. In
     // both cases mdp is then advanced by ArrayStoreData::array_store_data_size().
     // Emits nothing unless ProfileInterpreter is set.
     //
     // Args:
     //      mdp:     method data pointer register
     //      element: register holding the element oop (may be null)
     //      tmp:     scratch; receives the element's klass
     //      tmp2:    scratch handed to record_klass_in_profile
     //
     // rscratch1 is additionally used as the temporary of load_klass.
2043 void InterpreterMacroAssembler::profile_multiple_element_types(Register mdp, Register element, Register tmp, const Register tmp2) {
2044   if (ProfileInterpreter) {
2045     Label profile_continue;
2046
2047     // If no method data exists, go to profile_continue.
2048     test_method_data_pointer(mdp, profile_continue);
2049
2050     Label done, update;
         // Null element: only note that a null was seen.
2051     testptr(element, element);
2052     jccb(Assembler::notZero, update);
2053     set_mdp_flag_at(mdp, BitData::null_seen_byte_constant());
2054     jmp(done);
2055
2056     bind(update);
2057     load_klass(tmp, element, rscratch1);
2058
2059     // Record the object type.
2060     record_klass_in_profile(tmp, mdp, tmp2);
2061
2062     bind(done);
2063
2064     // The method data pointer needs to be updated.
2065     update_mdp_by_constant(mdp, in_bytes(ArrayStoreData::array_store_data_size()));
2066
2067     bind(profile_continue);
2068   }
2069 }
2070
     // Profile the element of an array load: record its type at
     // ArrayLoadData::element_offset() and advance mdp by
     // ArrayLoadData::array_load_data_size(). Emits nothing unless
     // ProfileInterpreter is set.
     //
     // Args:
     //      mdp:     method data pointer register
     //      element: register holding the loaded element
     //      tmp:     scratch; receives a copy of 'element' for profile_obj_type
2071 void InterpreterMacroAssembler::profile_element_type(Register mdp,
2072                                                      Register element,
2073                                                      Register tmp) {
2074   if (ProfileInterpreter) {
2075     Label profile_continue;
2076
2077     // If no method data exists, go to profile_continue.
2078     test_method_data_pointer(mdp, profile_continue);
2079
2080     mov(tmp, element);
2081     profile_obj_type(tmp, Address(mdp, in_bytes(ArrayLoadData::element_offset())));
2082
2083     // The method data pointer needs to be updated.
2084     update_mdp_by_constant(mdp, in_bytes(ArrayLoadData::array_load_data_size()));
2085
2086     bind(profile_continue);
2087   }
2088 }
2089
     // Profile both operands of a reference comparison into the ACmpData entry at
     // mdp. For each operand its type is recorded (left_offset / right_offset) and
     // the matching *_inline_type flag is set unless test_oop_is_not_inline_type
     // branches around it. This routine does not advance mdp. Emits nothing unless
     // ProfileInterpreter is set.
     //
     // Args:
     //      mdp:   method data pointer register
     //      left:  register holding the left operand
     //      right: register holding the right operand
     //      tmp:   scratch; receives a copy of each operand for profile_obj_type
     //             and serves as the temporary of the inline-type tests
2090 void InterpreterMacroAssembler::profile_acmp(Register mdp,
2091                                              Register left,
2092                                              Register right,
2093                                              Register tmp) {
2094   if (ProfileInterpreter) {
2095     Label profile_continue;
2096
2097     // If no method data exists, go to profile_continue.
2098     test_method_data_pointer(mdp, profile_continue);
2099
         // Left operand.
2100     mov(tmp, left);
2101     profile_obj_type(tmp, Address(mdp, in_bytes(ACmpData::left_offset())));
2102
2103     Label left_not_inline_type;
2104     test_oop_is_not_inline_type(left, tmp, left_not_inline_type);
2105     set_mdp_flag_at(mdp, ACmpData::left_inline_type_byte_constant());
2106     bind(left_not_inline_type);
2107
         // Right operand, handled the same way.
2108     mov(tmp, right);
2109     profile_obj_type(tmp, Address(mdp, in_bytes(ACmpData::right_offset())));
2110
2111     Label right_not_inline_type;
2112     test_oop_is_not_inline_type(right, tmp, right_not_inline_type);
2113     set_mdp_flag_at(mdp, ACmpData::right_inline_type_byte_constant());
2114     bind(right_not_inline_type);
2115
2116     bind(profile_continue);
2117   }
2118 }
2119 
2120
     // Emit an oop verification of 'reg' only when the tos state is atos; for
     // every other state nothing is emitted. 'file' and 'line' are forwarded to
     // MacroAssembler::_verify_oop_checked together with the "broken oop" message.
2121 void InterpreterMacroAssembler::_interp_verify_oop(Register reg, TosState state, const char* file, int line) {
2122   if (state == atos) {
2123     MacroAssembler::_verify_oop_checked(reg, "broken oop", file, line);
2124   }
2125 }
2126
     // Emit an FPU stack check via MacroAssembler::verify_FPU(stack_depth).
     // On 64-bit builds the body is compiled out and nothing is emitted. On 32-bit
     // the check is emitted only for ftos with UseSSE < 1 or dtos with UseSSE < 2;
     // presumably those are the cases where the value lives on the x87 stack --
     // confirm.
2127 void InterpreterMacroAssembler::verify_FPU(int stack_depth, TosState state) {
2128 #ifndef _LP64
2129   if ((state == ftos && UseSSE < 1) ||
2130       (state == dtos && UseSSE < 2)) {
2131     MacroAssembler::verify_FPU(stack_depth);
2132   }
2133 #endif
2134 }
2135 
2136 // Jump if ((*counter_addr += increment) & mask) == 0
2137 void InterpreterMacroAssembler::increment_mask_and_jump(Address counter_addr, Address mask,
2138                                                         Register scratch, Label* where) {
< prev index next >