1 /*
   2  * Copyright (c) 1998, 2024, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  *
  23  */
  24 
  25 #include "precompiled.hpp"
  26 #include "classfile/vmSymbols.hpp"
  27 #include "gc/shared/collectedHeap.hpp"
  28 #include "jfr/jfrEvents.hpp"
  29 #include "logging/log.hpp"
  30 #include "logging/logStream.hpp"
  31 #include "memory/allocation.inline.hpp"
  32 #include "memory/padded.hpp"
  33 #include "memory/resourceArea.hpp"
  34 #include "memory/universe.hpp"
  35 #include "oops/markWord.hpp"
  36 #include "oops/oop.inline.hpp"
  37 #include "runtime/atomic.hpp"
  38 #include "runtime/frame.inline.hpp"
  39 #include "runtime/globals.hpp"
  40 #include "runtime/handles.inline.hpp"
  41 #include "runtime/handshake.hpp"
  42 #include "runtime/interfaceSupport.inline.hpp"
  43 #include "runtime/javaThread.hpp"
  44 #include "runtime/lockStack.inline.hpp"
  45 #include "runtime/mutexLocker.hpp"
  46 #include "runtime/objectMonitor.hpp"
  47 #include "runtime/objectMonitor.inline.hpp"
  48 #include "runtime/os.inline.hpp"
  49 #include "runtime/osThread.hpp"
  50 #include "runtime/perfData.hpp"
  51 #include "runtime/safepointMechanism.inline.hpp"
  52 #include "runtime/safepointVerifiers.hpp"
  53 #include "runtime/sharedRuntime.hpp"
  54 #include "runtime/stubRoutines.hpp"
  55 #include "runtime/synchronizer.hpp"
  56 #include "runtime/threads.hpp"
  57 #include "runtime/timer.hpp"
  58 #include "runtime/trimNativeHeap.hpp"
  59 #include "runtime/vframe.hpp"
  60 #include "runtime/vmThread.hpp"
  61 #include "utilities/align.hpp"
  62 #include "utilities/dtrace.hpp"
  63 #include "utilities/events.hpp"
  64 #include "utilities/globalDefinitions.hpp"
  65 #include "utilities/linkedlist.hpp"
  66 #include "utilities/preserveException.hpp"
  67 
  68 class ObjectMonitorDeflationLogging;
  69 
  70 void MonitorList::add(ObjectMonitor* m) {
  71   ObjectMonitor* head;
  72   do {
  73     head = Atomic::load(&_head);
  74     m->set_next_om(head);
  75   } while (Atomic::cmpxchg(&_head, head, m) != head);
  76 
  77   size_t count = Atomic::add(&_count, 1u);
  78   if (count > max()) {
  79     Atomic::inc(&_max);
  80   }
  81 }
  82 
  83 size_t MonitorList::count() const {
  84   return Atomic::load(&_count);
  85 }
  86 
  87 size_t MonitorList::max() const {
  88   return Atomic::load(&_max);
  89 }
  90 
  91 class ObjectMonitorDeflationSafepointer : public StackObj {
  92   JavaThread* const                    _current;
  93   ObjectMonitorDeflationLogging* const _log;
  94 
  95 public:
  96   ObjectMonitorDeflationSafepointer(JavaThread* current, ObjectMonitorDeflationLogging* log)
  97     : _current(current), _log(log) {}
  98 
  99   void block_for_safepoint(const char* op_name, const char* count_name, size_t counter);
 100 };
 101 
// Walk the in-use list and unlink deflated ObjectMonitors.
// Returns the number of unlinked ObjectMonitors.
//
// deflated_count - upper bound on how many monitors are unlinked; the walk
//                  stops as soon as this many have been unlinked.
// unlinked_list  - every unlinked monitor is appended to this array.
// safepointer    - polled once per loop iteration so that a pending
//                  safepoint/handshake is honored during the walk.
//
// Deflated monitors are unlinked in batches of consecutive nodes so that the
// list is modified once per batch. On exit _count is reduced by the number of
// unlinked monitors.
size_t MonitorList::unlink_deflated(size_t deflated_count,
                                    GrowableArray<ObjectMonitor*>* unlinked_list,
                                    ObjectMonitorDeflationSafepointer* safepointer) {
  size_t unlinked_count = 0;
  // Last live (not deflated) monitor seen so far; nullptr while no live
  // monitor has been passed, i.e. while the current batch may start at head.
  ObjectMonitor* prev = nullptr;
  ObjectMonitor* m = Atomic::load_acquire(&_head);

  while (m != nullptr) {
    if (m->is_being_async_deflated()) {
      // Find next live ObjectMonitor. Batch up the unlinkable monitors, so we can
      // modify the list once per batch. The batch starts at "m".
      size_t unlinked_batch = 0;
      ObjectMonitor* next = m;
      // Look for at most MonitorUnlinkBatch monitors, or the number of
      // deflated and not unlinked monitors, whatever comes first.
      assert(deflated_count >= unlinked_count, "Sanity: underflow");
      size_t unlinked_batch_limit = MIN2<size_t>(deflated_count - unlinked_count, MonitorUnlinkBatch);
      do {
        // Read the successor before recording "next" as unlinked.
        ObjectMonitor* next_next = next->next_om();
        unlinked_batch++;
        unlinked_list->append(next);
        next = next_next;
        if (unlinked_batch >= unlinked_batch_limit) {
          // Reached the max batch, so bail out of the gathering loop.
          break;
        }
        if (prev == nullptr && Atomic::load(&_head) != m) {
          // Current batch used to be at head, but it is not at head anymore.
          // Bail out and figure out where we currently are. This avoids long
          // walks searching for new prev during unlink under heavy list inserts.
          break;
        }
      } while (next != nullptr && next->is_being_async_deflated());

      // Unlink the found batch. After the gathering loop "next" is the first
      // node following the batch (possibly nullptr).
      if (prev == nullptr) {
        // The current batch is the first batch, so there is a chance that it starts at head.
        // Optimistically assume no inserts happened, and try to unlink the entire batch from the head.
        ObjectMonitor* prev_head = Atomic::cmpxchg(&_head, m, next);
        if (prev_head != m) {
          // Something must have updated the head. Figure out the actual prev for this batch.
          // Walk from the head value returned by the failed cmpxchg until the
          // node whose successor is "m" is reached.
          for (ObjectMonitor* n = prev_head; n != m; n = n->next_om()) {
            prev = n;
          }
          assert(prev != nullptr, "Should have found the prev for the current batch");
          prev->set_next_om(next);
        }
      } else {
        // The current batch is preceded by another batch. This guarantees the current batch
        // does not start at head. Unlink the entire current batch without updating the head.
        assert(Atomic::load(&_head) != m, "Sanity");
        prev->set_next_om(next);
      }

      unlinked_count += unlinked_batch;
      if (unlinked_count >= deflated_count) {
        // Reached the max so bail out of the searching loop.
        // There should be no more deflated monitors left.
        break;
      }
      m = next;
    } else {
      // Live monitor: remember it as the predecessor for a later batch.
      prev = m;
      m = m->next_om();
    }

    // Must check for a safepoint/handshake and honor it.
    safepointer->block_for_safepoint("unlinking", "unlinked_count", unlinked_count);
  }

#ifdef ASSERT
  // Invariant: the code above should unlink all deflated monitors.
  // The code that runs after this unlinking does not expect deflated monitors.
  // Notably, attempting to deflate the already deflated monitor would break.
  {
    ObjectMonitor* m = Atomic::load_acquire(&_head);
    while (m != nullptr) {
      assert(!m->is_being_async_deflated(), "All deflated monitors should be unlinked");
      m = m->next_om();
    }
  }
#endif

  // Account for the removed monitors in the list's element counter.
  Atomic::sub(&_count, unlinked_count);
  return unlinked_count;
}
 190 
 191 MonitorList::Iterator MonitorList::iterator() const {
 192   return Iterator(Atomic::load_acquire(&_head));
 193 }
 194 
 195 ObjectMonitor* MonitorList::Iterator::next() {
 196   ObjectMonitor* current = _current;
 197   _current = current->next_om();
 198   return current;
 199 }
 200 
 201 // The "core" versions of monitor enter and exit reside in this file.
 202 // The interpreter and compilers contain specialized transliterated
 203 // variants of the enter-exit fast-path operations.  See c2_MacroAssembler_x86.cpp
 204 // fast_lock(...) for instance.  If you make changes here, make sure to modify the
 205 // interpreter, and both C1 and C2 fast-path inline locking code emission.
 206 //
 207 // -----------------------------------------------------------------------------
 208 
 209 #ifdef DTRACE_ENABLED
 210 
 211 // Only bother with this argument setup if dtrace is available
 212 // TODO-FIXME: probes should not fire when caller is _blocked.  assert() accordingly.
 213 
 214 #define DTRACE_MONITOR_PROBE_COMMON(obj, thread)                           \
 215   char* bytes = nullptr;                                                      \
 216   int len = 0;                                                             \
 217   jlong jtid = SharedRuntime::get_java_tid(thread);                        \
 218   Symbol* klassname = obj->klass()->name();                                \
 219   if (klassname != nullptr) {                                                 \
 220     bytes = (char*)klassname->bytes();                                     \
 221     len = klassname->utf8_length();                                        \
 222   }
 223 
 224 #define DTRACE_MONITOR_WAIT_PROBE(monitor, obj, thread, millis)            \
 225   {                                                                        \
 226     if (DTraceMonitorProbes) {                                             \
 227       DTRACE_MONITOR_PROBE_COMMON(obj, thread);                            \
 228       HOTSPOT_MONITOR_WAIT(jtid,                                           \
 229                            (uintptr_t)(monitor), bytes, len, (millis));    \
 230     }                                                                      \
 231   }
 232 
 233 #define HOTSPOT_MONITOR_PROBE_notify HOTSPOT_MONITOR_NOTIFY
 234 #define HOTSPOT_MONITOR_PROBE_notifyAll HOTSPOT_MONITOR_NOTIFYALL
 235 #define HOTSPOT_MONITOR_PROBE_waited HOTSPOT_MONITOR_WAITED
 236 
 237 #define DTRACE_MONITOR_PROBE(probe, monitor, obj, thread)                  \
 238   {                                                                        \
 239     if (DTraceMonitorProbes) {                                             \
 240       DTRACE_MONITOR_PROBE_COMMON(obj, thread);                            \
 241       HOTSPOT_MONITOR_PROBE_##probe(jtid, /* probe = waited */             \
 242                                     (uintptr_t)(monitor), bytes, len);     \
 243     }                                                                      \
 244   }
 245 
 246 #else //  ndef DTRACE_ENABLED
 247 
 248 #define DTRACE_MONITOR_WAIT_PROBE(obj, thread, millis, mon)    {;}
 249 #define DTRACE_MONITOR_PROBE(probe, obj, thread, mon)          {;}
 250 
 251 #endif // ndef DTRACE_ENABLED
 252 
// This exists only as a workaround of dtrace bug 6254741
//
// Wraps the "waited" monitor probe in a function of its own. When
// DTRACE_ENABLED is not defined the macro below expands to an empty block, so
// the function does nothing. Always returns 0.
static int dtrace_waited_probe(ObjectMonitor* monitor, Handle obj, JavaThread* thr) {
  DTRACE_MONITOR_PROBE(waited, monitor, obj(), thr);
  return 0;
}
 258 
 259 static constexpr size_t inflation_lock_count() {
 260   return 256;
 261 }
 262 
// Static storage for an array of PlatformMutex.
// These are raw bytes aligned for PlatformMutex, one sizeof(PlatformMutex)
// slot per lock; no PlatformMutex object is constructed by this definition.
// ObjectSynchronizer::initialize() constructs the mutexes in place.
alignas(PlatformMutex) static uint8_t _inflation_locks[inflation_lock_count()][sizeof(PlatformMutex)];
 265 
 266 static inline PlatformMutex* inflation_lock(size_t index) {
 267   return reinterpret_cast<PlatformMutex*>(_inflation_locks[index]);
 268 }
 269 
 270 void ObjectSynchronizer::initialize() {
 271   for (size_t i = 0; i < inflation_lock_count(); i++) {
 272     ::new(static_cast<void*>(inflation_lock(i))) PlatformMutex();
 273   }
 274   // Start the ceiling with the estimate for one thread.
 275   set_in_use_list_ceiling(AvgMonitorsPerThreadEstimate);
 276 
 277   // Start the timer for deflations, so it does not trigger immediately.
 278   _last_async_deflation_time_ns = os::javaTimeNanos();
 279 }
 280 
// The list of in-use ObjectMonitors (see MonitorList::add() and
// MonitorList::unlink_deflated()).
MonitorList ObjectSynchronizer::_in_use_list;
// monitors_used_above_threshold() policy is as follows:
//
// The ratio of the current _in_use_list count to the ceiling is used
// to determine if we are above MonitorUsedDeflationThreshold and need
// to do an async monitor deflation cycle. The ceiling is increased by
// AvgMonitorsPerThreadEstimate when a thread is added to the system
// and is decreased by AvgMonitorsPerThreadEstimate when a thread is
// removed from the system.
//
// Note: If the _in_use_list max exceeds the ceiling, then
// monitors_used_above_threshold() will use the in_use_list max instead
// of the thread count derived ceiling because we have used more
// ObjectMonitors than the estimated average.
//
// Note: If deflate_idle_monitors() has NoAsyncDeflationProgressMax
// no-progress async monitor deflation cycles in a row, then the ceiling
// is adjusted upwards by monitors_used_above_threshold().
//
// Start the ceiling with the estimate for one thread in initialize()
// which is called after cmd line options are processed.
static size_t _in_use_list_ceiling = 0;
// NOTE(review): presumably set when an async deflation cycle has been
// requested; the readers/writers are outside this part of the file.
bool volatile ObjectSynchronizer::_is_async_deflation_requested = false;
// NOTE(review): presumably marks the final audit phase; not used in the
// visible part of the file, confirm against its users.
bool volatile ObjectSynchronizer::_is_final_audit = false;
// Time stamp (os::javaTimeNanos()) used by the deflation timer; initialize()
// sets it to the current time so that deflation does not trigger immediately.
jlong ObjectSynchronizer::_last_async_deflation_time_ns = 0;
// NOTE(review): these two look like the bookkeeping for the "no-progress
// async monitor deflation cycles in a row" rule described above; confirm.
static uintx _no_progress_cnt = 0;
static bool _no_progress_skip_increment = false;
 308 
 309 // =====================> Quick functions
 310 
 311 // The quick_* forms are special fast-path variants used to improve
 312 // performance.  In the simplest case, a "quick_*" implementation could
 313 // simply return false, in which case the caller will perform the necessary
 314 // state transitions and call the slow-path form.
 315 // The fast-path is designed to handle frequently arising cases in an efficient
 316 // manner and is just a degenerate "optimistic" variant of the slow-path.
 317 // returns true  -- to indicate the call was satisfied.
 318 // returns false -- to indicate the call needs the services of the slow-path.
 319 // A no-loitering ordinance is in effect for code in the quick_* family
 320 // operators: safepoints or indefinite blocking (blocking that might span a
 321 // safepoint) are forbidden. Generally the thread_state() is _in_Java upon
 322 // entry.
 323 //
 324 // Consider: An interesting optimization is to have the JIT recognize the
 325 // following common idiom:
 326 //   synchronized (someobj) { .... ; notify(); }
 327 // That is, we find a notify() or notifyAll() call that immediately precedes
 328 // the monitorexit operation.  In that case the JIT could fuse the operations
 329 // into a single notifyAndExit() runtime primitive.
 330 
 331 bool ObjectSynchronizer::quick_notify(oopDesc* obj, JavaThread* current, bool all) {
 332   assert(current->thread_state() == _thread_in_Java, "invariant");
 333   NoSafepointVerifier nsv;
 334   if (obj == nullptr) return false;  // slow-path for invalid obj
 335   const markWord mark = obj->mark();
 336 
 337   if (LockingMode == LM_LIGHTWEIGHT) {
 338     if (mark.is_fast_locked() && current->lock_stack().contains(cast_to_oop(obj))) {
 339       // Degenerate notify
 340       // fast-locked by caller so by definition the implied waitset is empty.
 341       return true;
 342     }
 343   } else if (LockingMode == LM_LEGACY) {
 344     if (mark.has_locker() && current->is_lock_owned((address)mark.locker())) {
 345       // Degenerate notify
 346       // stack-locked by caller so by definition the implied waitset is empty.
 347       return true;
 348     }
 349   }
 350 
 351   if (mark.has_monitor()) {
 352     ObjectMonitor* const mon = mark.monitor();
 353     assert(mon->object() == oop(obj), "invariant");
 354     if (mon->owner() != current) return false;  // slow-path for IMS exception
 355 
 356     if (mon->first_waiter() != nullptr) {
 357       // We have one or more waiters. Since this is an inflated monitor
 358       // that we own, we can transfer one or more threads from the waitset
 359       // to the entrylist here and now, avoiding the slow-path.
 360       if (all) {
 361         DTRACE_MONITOR_PROBE(notifyAll, mon, obj, current);
 362       } else {
 363         DTRACE_MONITOR_PROBE(notify, mon, obj, current);
 364       }
 365       int free_count = 0;
 366       do {
 367         mon->INotify(current);
 368         ++free_count;
 369       } while (mon->first_waiter() != nullptr && all);
 370       OM_PERFDATA_OP(Notifications, inc(free_count));
 371     }
 372     return true;
 373   }
 374 
 375   // other IMS exception states take the slow-path
 376   return false;
 377 }
 378 
 379 
 380 // The LockNode emitted directly at the synchronization site would have
 381 // been too big if it were to have included support for the cases of inflated
 382 // recursive enter and exit, so they go here instead.
 383 // Note that we can't safely call AsyncPrintJavaStack() from within
 384 // quick_enter() as our thread state remains _in_Java.
 385 
 386 bool ObjectSynchronizer::quick_enter(oop obj, JavaThread* current,
 387                                      BasicLock * lock) {
 388   assert(current->thread_state() == _thread_in_Java, "invariant");
 389   NoSafepointVerifier nsv;
 390   if (obj == nullptr) return false;       // Need to throw NPE
 391 
 392   if (obj->klass()->is_value_based()) {
 393     return false;
 394   }
 395 
 396   if (LockingMode == LM_LIGHTWEIGHT) {
 397     LockStack& lock_stack = current->lock_stack();
 398     if (lock_stack.is_full()) {
 399       // Always go into runtime if the lock stack is full.
 400       return false;
 401     }
 402     if (lock_stack.try_recursive_enter(obj)) {
 403       // Recursive lock successful.
 404       current->inc_held_monitor_count();
 405       return true;
 406     }
 407   }
 408 
 409   const markWord mark = obj->mark();
 410 
 411   if (mark.has_monitor()) {
 412     ObjectMonitor* const m = mark.monitor();
 413     // An async deflation or GC can race us before we manage to make
 414     // the ObjectMonitor busy by setting the owner below. If we detect
 415     // that race we just bail out to the slow-path here.
 416     if (m->object_peek() == nullptr) {
 417       return false;
 418     }
 419     JavaThread* const owner = static_cast<JavaThread*>(m->owner_raw());
 420 
 421     // Lock contention and Transactional Lock Elision (TLE) diagnostics
 422     // and observability
 423     // Case: light contention possibly amenable to TLE
 424     // Case: TLE inimical operations such as nested/recursive synchronization
 425 
 426     if (owner == current) {
 427       m->_recursions++;
 428       current->inc_held_monitor_count();
 429       return true;
 430     }
 431 
 432     if (LockingMode != LM_LIGHTWEIGHT) {
 433       // This Java Monitor is inflated so obj's header will never be
 434       // displaced to this thread's BasicLock. Make the displaced header
 435       // non-null so this BasicLock is not seen as recursive nor as
 436       // being locked. We do this unconditionally so that this thread's
 437       // BasicLock cannot be mis-interpreted by any stack walkers. For
 438       // performance reasons, stack walkers generally first check for
 439       // stack-locking in the object's header, the second check is for
 440       // recursive stack-locking in the displaced header in the BasicLock,
 441       // and last are the inflated Java Monitor (ObjectMonitor) checks.
 442       lock->set_displaced_header(markWord::unused_mark());
 443     }
 444 
 445     if (owner == nullptr && m->try_set_owner_from(nullptr, current) == nullptr) {
 446       assert(m->_recursions == 0, "invariant");
 447       current->inc_held_monitor_count();
 448       return true;
 449     }
 450   }
 451 
 452   // Note that we could inflate in quick_enter.
 453   // This is likely a useful optimization
 454   // Critically, in quick_enter() we must not:
 455   // -- block indefinitely, or
 456   // -- reach a safepoint
 457 
 458   return false;        // revert to slow-path
 459 }
 460 
 461 // Handle notifications when synchronizing on value based classes
 462 void ObjectSynchronizer::handle_sync_on_value_based_class(Handle obj, JavaThread* locking_thread) {
 463   assert(locking_thread == Thread::current() || locking_thread->is_obj_deopt_suspend(), "must be");
 464   frame last_frame = locking_thread->last_frame();
 465   bool bcp_was_adjusted = false;
 466   // Don't decrement bcp if it points to the frame's first instruction.  This happens when
 467   // handle_sync_on_value_based_class() is called because of a synchronized method.  There
 468   // is no actual monitorenter instruction in the byte code in this case.
 469   if (last_frame.is_interpreted_frame() &&
 470       (last_frame.interpreter_frame_method()->code_base() < last_frame.interpreter_frame_bcp())) {
 471     // adjust bcp to point back to monitorenter so that we print the correct line numbers
 472     last_frame.interpreter_frame_set_bcp(last_frame.interpreter_frame_bcp() - 1);
 473     bcp_was_adjusted = true;
 474   }
 475 
 476   if (DiagnoseSyncOnValueBasedClasses == FATAL_EXIT) {
 477     ResourceMark rm;
 478     stringStream ss;
 479     locking_thread->print_active_stack_on(&ss);
 480     char* base = (char*)strstr(ss.base(), "at");
 481     char* newline = (char*)strchr(ss.base(), '\n');
 482     if (newline != nullptr) {
 483       *newline = '\0';
 484     }
 485     fatal("Synchronizing on object " INTPTR_FORMAT " of klass %s %s", p2i(obj()), obj->klass()->external_name(), base);
 486   } else {
 487     assert(DiagnoseSyncOnValueBasedClasses == LOG_WARNING, "invalid value for DiagnoseSyncOnValueBasedClasses");
 488     ResourceMark rm;
 489     Log(valuebasedclasses) vblog;
 490 
 491     vblog.info("Synchronizing on object " INTPTR_FORMAT " of klass %s", p2i(obj()), obj->klass()->external_name());
 492     if (locking_thread->has_last_Java_frame()) {
 493       LogStream info_stream(vblog.info());
 494       locking_thread->print_active_stack_on(&info_stream);
 495     } else {
 496       vblog.info("Cannot find the last Java frame");
 497     }
 498 
 499     EventSyncOnValueBasedClass event;
 500     if (event.should_commit()) {
 501       event.set_valueBasedClass(obj->klass());
 502       event.commit();
 503     }
 504   }
 505 
 506   if (bcp_was_adjusted) {
 507     last_frame.interpreter_frame_set_bcp(last_frame.interpreter_frame_bcp() + 1);
 508   }
 509 }
 510 
 511 static bool useHeavyMonitors() {
 512 #if defined(X86) || defined(AARCH64) || defined(PPC64) || defined(RISCV64) || defined(S390)
 513   return LockingMode == LM_MONITOR;
 514 #else
 515   return false;
 516 #endif
 517 }
 518 
 519 // -----------------------------------------------------------------------------
 520 // Monitor Enter/Exit
 521 
 522 void ObjectSynchronizer::enter_for(Handle obj, BasicLock* lock, JavaThread* locking_thread) {
 523   // When called with locking_thread != Thread::current() some mechanism must synchronize
 524   // the locking_thread with respect to the current thread. Currently only used when
 525   // deoptimizing and re-locking locks. See Deoptimization::relock_objects
 526   assert(locking_thread == Thread::current() || locking_thread->is_obj_deopt_suspend(), "must be");
 527   if (!enter_fast_impl(obj, lock, locking_thread)) {
 528     // Inflated ObjectMonitor::enter_for is required
 529 
 530     // An async deflation can race after the inflate_for() call and before
 531     // enter_for() can make the ObjectMonitor busy. enter_for() returns false
 532     // if we have lost the race to async deflation and we simply try again.
 533     while (true) {
 534       ObjectMonitor* monitor = inflate_for(locking_thread, obj(), inflate_cause_monitor_enter);
 535       if (monitor->enter_for(locking_thread)) {
 536         return;
 537       }
 538       assert(monitor->is_being_async_deflated(), "must be");
 539     }
 540   }
 541 }
 542 
 543 void ObjectSynchronizer::enter(Handle obj, BasicLock* lock, JavaThread* current) {
 544   assert(current == Thread::current(), "must be");
 545   if (!enter_fast_impl(obj, lock, current)) {
 546     // Inflated ObjectMonitor::enter is required
 547 
 548     // An async deflation can race after the inflate() call and before
 549     // enter() can make the ObjectMonitor busy. enter() returns false if
 550     // we have lost the race to async deflation and we simply try again.
 551     while (true) {
 552       ObjectMonitor* monitor = inflate(current, obj(), inflate_cause_monitor_enter);
 553       if (monitor->enter(current)) {
 554         return;
 555       }
 556     }
 557   }
 558 }
 559 
// The interpreter and compiler assembly code tries to lock using the fast path
// of this algorithm. Make sure to update that code if the following function is
// changed. The implementation is extremely sensitive to race condition. Be careful.
//
// Attempts to lock 'obj' for 'locking_thread' without entering an inflated
// ObjectMonitor.
//
// obj            - the object to lock.
// lock           - the BasicLock used by LM_LEGACY stack-locking; not used
//                  by LM_LIGHTWEIGHT.
// locking_thread - the thread that is to own the lock.
//
// Returns true if the lock was taken here (fast-locked, stack-locked or a
// recursive variant of either). Returns false if the caller has to enter via
// an inflated ObjectMonitor. The held monitor count of locking_thread is
// incremented in both cases.
bool ObjectSynchronizer::enter_fast_impl(Handle obj, BasicLock* lock, JavaThread* locking_thread) {

  if (obj->klass()->is_value_based()) {
    handle_sync_on_value_based_class(obj, locking_thread);
  }

  // Counted up front, regardless of whether the fast path succeeds below.
  locking_thread->inc_held_monitor_count();

  if (!useHeavyMonitors()) {
    if (LockingMode == LM_LIGHTWEIGHT) {
      // Fast-locking does not use the 'lock' argument.
      LockStack& lock_stack = locking_thread->lock_stack();
      if (lock_stack.is_full()) {
        // We unconditionally make room on the lock stack by inflating
        // the least recently locked object on the lock stack.

        // About the choice to inflate least recently locked object.
        // First we must choose to inflate a lock, either some lock on
        // the lock-stack or the lock that is currently being entered
        // (which may or may not be on the lock-stack).
        // Second the best lock to inflate is a lock which is entered
        // in a control flow where there are only a very few locks being
        // used, as the costly part of inflated locking is inflation,
        // not locking. But this property is entirely program dependent.
        // Third inflating the lock currently being entered on when it
        // is not present on the lock-stack will result in a still full
        // lock-stack. This creates a scenario where every deeper nested
        // monitorenter must call into the runtime.
        // The rationale here is as follows:
        // Because we cannot (currently) figure out the second, and want
        // to avoid the third, we inflate a lock on the lock-stack.
        // The least recently locked lock is chosen as it is the lock
        // with the longest critical section.

        log_info(monitorinflation)("LockStack capacity exceeded, inflating.");
        ObjectMonitor* monitor = inflate_for(locking_thread, lock_stack.bottom(), inflate_cause_vm_internal);
        // NOTE(review): the owner is compared against Thread::current() although
        // the lock stack belongs to locking_thread, which enter_for() allows to
        // be a different thread - confirm this is intended.
        assert(monitor->owner() == Thread::current(), "must be owner=" PTR_FORMAT " current=" PTR_FORMAT " mark=" PTR_FORMAT,
               p2i(monitor->owner()), p2i(Thread::current()), monitor->object()->mark_acquire().value());
        assert(!lock_stack.is_full(), "must have made room here");
      }

      markWord mark = obj()->mark_acquire();
      while (mark.is_unlocked()) {
        // Retry until a lock state change has been observed. cas_set_mark() may collide with non lock bits modifications.
        // Try to swing into 'fast-locked' state.
        assert(!lock_stack.contains(obj()), "thread must not already hold the lock");
        const markWord locked_mark = mark.set_fast_locked();
        const markWord old_mark = obj()->cas_set_mark(locked_mark, mark);
        if (old_mark == mark) {
          // Successfully fast-locked, push object to lock-stack and return.
          lock_stack.push(obj());
          return true;
        }
        // CAS failed: continue with the mark word that was actually found.
        mark = old_mark;
      }

      if (mark.is_fast_locked() && lock_stack.try_recursive_enter(obj())) {
        // Recursive lock successful.
        return true;
      }

      // Failed to fast lock.
      return false;
    } else if (LockingMode == LM_LEGACY) {
      markWord mark = obj->mark();
      if (mark.is_unlocked()) {
        // Anticipate successful CAS -- the ST of the displaced mark must
        // be visible <= the ST performed by the CAS.
        lock->set_displaced_header(mark);
        if (mark == obj()->cas_set_mark(markWord::from_pointer(lock), mark)) {
          return true;
        }
      } else if (mark.has_locker() &&
                 locking_thread->is_lock_owned((address) mark.locker())) {
        // Recursive stack-lock: recorded as a null displaced header.
        assert(lock != mark.locker(), "must not re-lock the same lock");
        assert(lock != (BasicLock*) obj->mark().value(), "don't relock with same BasicLock");
        lock->set_displaced_header(markWord::from_pointer(nullptr));
        return true;
      }

      // The object header will never be displaced to this lock,
      // so it does not matter what the value is, except that it
      // must be non-zero to avoid looking like a re-entrant lock,
      // and must not look locked either.
      lock->set_displaced_header(markWord::unused_mark());

      // Failed to fast lock.
      return false;
    }
  } else if (VerifyHeavyMonitors) {
    guarantee((obj->mark().value() & markWord::lock_mask_in_place) != markWord::locked_value, "must not be lightweight/stack-locked");
  }

  // Heavy monitors in use (or no fast-path mode matched): the caller must
  // enter via an inflated ObjectMonitor.
  return false;
}
 658 
// Releases one acquisition of 'object's monitor on behalf of 'current'.
//
// The held-monitor count of 'current' is decremented unconditionally. Unless
// heavy monitors are forced, a mode-specific fast path is attempted first:
//  - LM_LIGHTWEIGHT: pop a recursive entry off the lock stack, or CAS the
//    mark word back to unlocked and remove the object from the lock stack.
//    The 'lock' argument is not used in this mode.
//  - LM_LEGACY: a zero displaced header in 'lock' marks a recursive exit;
//    otherwise try to CAS the displaced header back into the mark word.
// Every case the fast path does not complete falls through to inflate()
// followed by ObjectMonitor::exit().
void ObjectSynchronizer::exit(oop object, BasicLock* lock, JavaThread* current) {
  current->dec_held_monitor_count();

  if (!useHeavyMonitors()) {
    markWord mark = object->mark();
    if (LockingMode == LM_LIGHTWEIGHT) {
      // Fast-locking does not use the 'lock' argument.
      LockStack& lock_stack = current->lock_stack();
      if (mark.is_fast_locked() && lock_stack.try_recursive_exit(object)) {
        // Recursively unlocked.
        return;
      }

      if (mark.is_fast_locked() && lock_stack.is_recursive(object)) {
        // This lock is recursive but is not at the top of the lock stack so we're
        // doing an unbalanced exit. We have to fall thru to inflation below and
        // let ObjectMonitor::exit() do the unlock.
      } else {
        while (mark.is_fast_locked()) {
          // Retry until a lock state change has been observed. cas_set_mark() may collide with non lock bits modifications.
          const markWord unlocked_mark = mark.set_unlocked();
          const markWord old_mark = object->cas_set_mark(unlocked_mark, mark);
          if (old_mark == mark) {
            // The CAS installed the unlocked mark; drop the lock-stack entry.
            size_t recursions = lock_stack.remove(object) - 1;
            assert(recursions == 0, "must not be recursive here");
            return;
          }
          // The CAS lost; continue with the mark word it observed.
          mark = old_mark;
        }
      }
    } else if (LockingMode == LM_LEGACY) {
      markWord dhw = lock->displaced_header();
      if (dhw.value() == 0) {
        // If the displaced header is null, then this exit matches up with
        // a recursive enter. No real work to do here except for diagnostics.
#ifndef PRODUCT
        if (mark != markWord::INFLATING()) {
          // Only do diagnostics if we are not racing an inflation. Simply
          // exiting a recursive enter of a Java Monitor that is being
          // inflated is safe; see the has_monitor() comment below.
          assert(!mark.is_unlocked(), "invariant");
          assert(!mark.has_locker() ||
                 current->is_lock_owned((address)mark.locker()), "invariant");
          if (mark.has_monitor()) {
            // The BasicLock's displaced_header is marked as a recursive
            // enter and we have an inflated Java Monitor (ObjectMonitor).
            // This is a special case where the Java Monitor was inflated
            // after this thread entered the stack-lock recursively. When a
            // Java Monitor is inflated, we cannot safely walk the Java
            // Monitor owner's stack and update the BasicLocks because a
            // Java Monitor can be asynchronously inflated by a thread that
            // does not own the Java Monitor.
            ObjectMonitor* m = mark.monitor();
            assert(m->object()->mark() == mark, "invariant");
            assert(m->is_entered(current), "invariant");
          }
        }
#endif
        return;
      }

      if (mark == markWord::from_pointer(lock)) {
        // If the object is stack-locked by the current thread, try to
        // swing the displaced header from the BasicLock back to the mark.
        assert(dhw.is_neutral(), "invariant");
        if (object->cas_set_mark(dhw, mark) == mark) {
          return;
        }
        // CAS failed: fall through to the inflation slow path below.
      }
    }
  } else if (VerifyHeavyMonitors) {
    guarantee((object->mark().value() & markWord::lock_mask_in_place) != markWord::locked_value, "must not be lightweight/stack-locked");
  }

  // We have to take the slow-path of possible inflation and then exit.
  // The ObjectMonitor* can't be async deflated until ownership is
  // dropped inside exit() and the ObjectMonitor* must be !is_busy().
  ObjectMonitor* monitor = inflate(current, object, inflate_cause_vm_internal);
  assert(!monitor->is_owner_anonymous(), "must not be");
  monitor->exit(current);
}
 740 
 741 // -----------------------------------------------------------------------------
 742 // JNI locks on java objects
 743 // NOTE: must use heavy weight monitor to handle jni monitor enter
 744 void ObjectSynchronizer::jni_enter(Handle obj, JavaThread* current) {
 745   if (obj->klass()->is_value_based()) {
 746     handle_sync_on_value_based_class(obj, current);
 747   }
 748 
 749   // the current locking is from JNI instead of Java code
 750   current->set_current_pending_monitor_is_from_java(false);
 751   // An async deflation can race after the inflate() call and before
 752   // enter() can make the ObjectMonitor busy. enter() returns false if
 753   // we have lost the race to async deflation and we simply try again.
 754   while (true) {
 755     ObjectMonitor* monitor = inflate(current, obj(), inflate_cause_jni_enter);
 756     if (monitor->enter(current)) {
 757       current->inc_held_monitor_count(1, true);
 758       break;
 759     }
 760   }
 761   current->set_current_pending_monitor_is_from_java(true);
 762 }
 763 
 764 // NOTE: must use heavy weight monitor to handle jni monitor exit
 765 void ObjectSynchronizer::jni_exit(oop obj, TRAPS) {
 766   JavaThread* current = THREAD;
 767 
 768   // The ObjectMonitor* can't be async deflated until ownership is
 769   // dropped inside exit() and the ObjectMonitor* must be !is_busy().
 770   ObjectMonitor* monitor = inflate(current, obj, inflate_cause_jni_exit);
 771   // If this thread has locked the object, exit the monitor. We
 772   // intentionally do not use CHECK on check_owner because we must exit the
 773   // monitor even if an exception was already pending.
 774   if (monitor->check_owner(THREAD)) {
 775     monitor->exit(current);
 776     current->dec_held_monitor_count(1, true);
 777   }
 778 }
 779 
 780 // -----------------------------------------------------------------------------
 781 // Internal VM locks on java objects
 782 // standard constructor, allows locking failures
 783 ObjectLocker::ObjectLocker(Handle obj, JavaThread* thread) {
 784   _thread = thread;
 785   _thread->check_for_valid_safepoint_state();
 786   _obj = obj;
 787 
 788   if (_obj() != nullptr) {
 789     ObjectSynchronizer::enter(_obj, &_lock, _thread);
 790   }
 791 }
 792 
 793 ObjectLocker::~ObjectLocker() {
 794   if (_obj() != nullptr) {
 795     ObjectSynchronizer::exit(_obj(), &_lock, _thread);
 796   }
 797 }
 798 
 799 
 800 // -----------------------------------------------------------------------------
 801 //  Wait/Notify/NotifyAll
 802 // NOTE: must use heavy weight monitor to handle wait()
 803 int ObjectSynchronizer::wait(Handle obj, jlong millis, TRAPS) {
 804   JavaThread* current = THREAD;
 805   if (millis < 0) {
 806     THROW_MSG_0(vmSymbols::java_lang_IllegalArgumentException(), "timeout value is negative");
 807   }
 808   // The ObjectMonitor* can't be async deflated because the _waiters
 809   // field is incremented before ownership is dropped and decremented
 810   // after ownership is regained.
 811   ObjectMonitor* monitor = inflate(current, obj(), inflate_cause_wait);
 812 
 813   DTRACE_MONITOR_WAIT_PROBE(monitor, obj(), current, millis);
 814   monitor->wait(millis, true, THREAD); // Not CHECK as we need following code
 815 
 816   // This dummy call is in place to get around dtrace bug 6254741.  Once
 817   // that's fixed we can uncomment the following line, remove the call
 818   // and change this function back into a "void" func.
 819   // DTRACE_MONITOR_PROBE(waited, monitor, obj(), THREAD);
 820   int ret_code = dtrace_waited_probe(monitor, obj, THREAD);
 821   return ret_code;
 822 }
 823 
 824 void ObjectSynchronizer::waitUninterruptibly(Handle obj, jlong millis, TRAPS) {
 825   if (millis < 0) {
 826     THROW_MSG(vmSymbols::java_lang_IllegalArgumentException(), "timeout value is negative");
 827   }
 828   ObjectSynchronizer::inflate(THREAD,
 829                               obj(),
 830                               inflate_cause_wait)->wait(millis, false, THREAD);
 831 }
 832 
 833 
 834 void ObjectSynchronizer::notify(Handle obj, TRAPS) {
 835   JavaThread* current = THREAD;
 836 
 837   markWord mark = obj->mark();
 838   if (LockingMode == LM_LIGHTWEIGHT) {
 839     if ((mark.is_fast_locked() && current->lock_stack().contains(obj()))) {
 840       // Not inflated so there can't be any waiters to notify.
 841       return;
 842     }
 843   } else if (LockingMode == LM_LEGACY) {
 844     if (mark.has_locker() && current->is_lock_owned((address)mark.locker())) {
 845       // Not inflated so there can't be any waiters to notify.
 846       return;
 847     }
 848   }
 849   // The ObjectMonitor* can't be async deflated until ownership is
 850   // dropped by the calling thread.
 851   ObjectMonitor* monitor = inflate(current, obj(), inflate_cause_notify);
 852   monitor->notify(CHECK);
 853 }
 854 
 855 // NOTE: see comment of notify()
 856 void ObjectSynchronizer::notifyall(Handle obj, TRAPS) {
 857   JavaThread* current = THREAD;
 858 
 859   markWord mark = obj->mark();
 860   if (LockingMode == LM_LIGHTWEIGHT) {
 861     if ((mark.is_fast_locked() && current->lock_stack().contains(obj()))) {
 862       // Not inflated so there can't be any waiters to notify.
 863       return;
 864     }
 865   } else if (LockingMode == LM_LEGACY) {
 866     if (mark.has_locker() && current->is_lock_owned((address)mark.locker())) {
 867       // Not inflated so there can't be any waiters to notify.
 868       return;
 869     }
 870   }
 871   // The ObjectMonitor* can't be async deflated until ownership is
 872   // dropped by the calling thread.
 873   ObjectMonitor* monitor = inflate(current, obj(), inflate_cause_notify);
 874   monitor->notifyAll(CHECK);
 875 }
 876 
 877 // -----------------------------------------------------------------------------
 878 // Hash Code handling
 879 
// Global state read by the hash code generator (get_next_hash()).
// The two int fields are separated by padding members sized from
// OM_CACHE_LINE_SIZE so they do not end up next to each other.
// NOTE(review): DEFINE_PAD_MINUS_SIZE presumably pads out the remainder of
// a cache line after the preceding field -- confirm against memory/padded.hpp.
struct SharedGlobals {
  // Leading pad so that stw_random does not share a line with whatever
  // precedes this struct in memory.
  char         _pad_prefix[OM_CACHE_LINE_SIZE];
  // This is a highly shared mostly-read variable.
  // To avoid false-sharing it needs to be the sole occupant of a cache line.
  volatile int stw_random;
  DEFINE_PAD_MINUS_SIZE(1, OM_CACHE_LINE_SIZE, sizeof(volatile int));
  // Hot RW variable -- Sequester to avoid false-sharing
  volatile int hc_sequence;
  DEFINE_PAD_MINUS_SIZE(2, OM_CACHE_LINE_SIZE, sizeof(volatile int));
};

// The single file-local instance of the shared hash code state.
static SharedGlobals GVars;
 892 
// Returns a mark word for 'obj' that is not in the transient "being
// inflated" state.
//
// With LM_LIGHTWEIGHT the first acquire-load is returned as is. Otherwise
// the mark is re-read in a loop until is_being_inflated() is false. While
// waiting, the loop uses SpinPause() for the first 10000 iterations on MP
// systems; after that (or always on non-MP systems) odd iterations yield
// and even iterations wait under an inflation lock selected by the object's
// address.
static markWord read_stable_mark(oop obj) {
  markWord mark = obj->mark_acquire();
  if (!mark.is_being_inflated() || LockingMode == LM_LIGHTWEIGHT) {
    // New lightweight locking does not use the markWord::INFLATING() protocol.
    return mark;       // normal fast-path return
  }

  // Number of loop iterations spent waiting for inflation to finish.
  int its = 0;
  for (;;) {
    markWord mark = obj->mark_acquire();
    if (!mark.is_being_inflated()) {
      return mark;    // normal fast-path return
    }

    // The object is being inflated by some other thread.
    // The caller of read_stable_mark() must wait for inflation to complete.
    // Avoid live-lock.

    ++its;
    if (its > 10000 || !os::is_MP()) {
      if (its & 1) {
        os::naked_yield();
      } else {
        // Note that the following code attenuates the livelock problem but is not
        // a complete remedy.  A more complete solution would require that the inflating
        // thread hold the associated inflation lock.  The following code simply restricts
        // the number of spinners to at most one.  We'll have N-2 threads blocked
        // on the inflationlock, 1 thread holding the inflation lock and using
        // a yield/park strategy, and 1 thread in the midst of inflation.
        // A more refined approach would be to change the encoding of INFLATING
        // to allow encapsulation of a native thread pointer.  Threads waiting for
        // inflation to complete would use CAS to push themselves onto a singly linked
        // list rooted at the markword.  Once enqueued, they'd loop, checking a per-thread flag
        // and calling park().  When inflation was complete the thread that accomplished inflation
        // would detach the list and set the markword to inflated with a single CAS and
        // then for each thread on the list, set the flag and unpark() the thread.

        // Index into the lock array based on the current object address.
        static_assert(is_power_of_2(inflation_lock_count()), "must be");
        size_t ix = (cast_from_oop<intptr_t>(obj) >> 5) & (inflation_lock_count() - 1);
        // Counts yields performed while holding the inflation lock; once it
        // reaches 16 the thread parks instead of yielding.
        int YieldThenBlock = 0;
        assert(ix < inflation_lock_count(), "invariant");
        inflation_lock(ix)->lock();
        while (obj->mark_acquire() == markWord::INFLATING()) {
          // Beware: naked_yield() is advisory and has almost no effect on some platforms
          // so we periodically call current->_ParkEvent->park(1).
          // We use a mixed spin/yield/block mechanism.
          if ((YieldThenBlock++) >= 16) {
            Thread::current()->_ParkEvent->park(1);
          } else {
            os::naked_yield();
          }
        }
        inflation_lock(ix)->unlock();
      }
    } else {
      SpinPause();       // SMP-polite spinning
    }
  }
}
 953 
 954 // hashCode() generation :
 955 //
 956 // Possibilities:
 957 // * MD5Digest of {obj,stw_random}
 958 // * CRC32 of {obj,stw_random} or any linear-feedback shift register function.
 959 // * A DES- or AES-style SBox[] mechanism
 960 // * One of the Phi-based schemes, such as:
//   2654435761 ~= 2^32 / Phi, where Phi = (1 + sqrt(5)) / 2 is the golden ratio
 962 //   HashCodeValue = ((uintptr_t(obj) >> 3) * 2654435761) ^ GVars.stw_random ;
 963 // * A variation of Marsaglia's shift-xor RNG scheme.
 964 // * (obj ^ stw_random) is appealing, but can result
 965 //   in undesirable regularity in the hashCode values of adjacent objects
 966 //   (objects allocated back-to-back, in particular).  This could potentially
 967 //   result in hashtable collisions and reduced hashtable efficiency.
 968 //   There are simple ways to "diffuse" the middle address bits over the
 969 //   generated hashCode values:
 970 
 971 static inline intptr_t get_next_hash(Thread* current, oop obj) {
 972   intptr_t value = 0;
 973   if (hashCode == 0) {
 974     // This form uses global Park-Miller RNG.
 975     // On MP system we'll have lots of RW access to a global, so the
 976     // mechanism induces lots of coherency traffic.
 977     value = os::random();
 978   } else if (hashCode == 1) {
 979     // This variation has the property of being stable (idempotent)
 980     // between STW operations.  This can be useful in some of the 1-0
 981     // synchronization schemes.
 982     intptr_t addr_bits = cast_from_oop<intptr_t>(obj) >> 3;
 983     value = addr_bits ^ (addr_bits >> 5) ^ GVars.stw_random;
 984   } else if (hashCode == 2) {
 985     value = 1;            // for sensitivity testing
 986   } else if (hashCode == 3) {
 987     value = ++GVars.hc_sequence;
 988   } else if (hashCode == 4) {
 989     value = cast_from_oop<intptr_t>(obj);
 990   } else {
 991     // Marsaglia's xor-shift scheme with thread-specific state
 992     // This is probably the best overall implementation -- we'll
 993     // likely make this the default in future releases.
 994     unsigned t = current->_hashStateX;
 995     t ^= (t << 11);
 996     current->_hashStateX = current->_hashStateY;
 997     current->_hashStateY = current->_hashStateZ;
 998     current->_hashStateZ = current->_hashStateW;
 999     unsigned v = current->_hashStateW;
1000     v = (v ^ (v >> 19)) ^ (t ^ (t >> 8));
1001     current->_hashStateW = v;
1002     value = v;
1003   }
1004 
1005   value &= markWord::hash_mask;
1006   if (value == 0) value = 0xBAD;
1007   assert(value != markWord::no_hash, "invariant");
1008   return value;
1009 }
1010 
// Returns the identity hash of 'obj', generating and installing one if the
// object does not have a hash yet.
//
// The hash is looked up in (and installed into) either the object's mark
// word or, once the object has an ObjectMonitor, the monitor's header/dmw
// field. The outer loop restarts whenever a lightweight-mode CAS on the mark
// word fails or an async deflation of the monitor is detected.
intptr_t ObjectSynchronizer::FastHashCode(Thread* current, oop obj) {

  while (true) {
    ObjectMonitor* monitor = nullptr;
    markWord temp, test;
    intptr_t hash;
    markWord mark = read_stable_mark(obj);
    if (VerifyHeavyMonitors) {
      assert(LockingMode == LM_MONITOR, "+VerifyHeavyMonitors requires LockingMode == 0 (LM_MONITOR)");
      guarantee((obj->mark().value() & markWord::lock_mask_in_place) != markWord::locked_value, "must not be lightweight/stack-locked");
    }
    if (mark.is_unlocked() || (LockingMode == LM_LIGHTWEIGHT && mark.is_fast_locked())) {
      // The hash lives directly in the mark word in these states.
      hash = mark.hash();
      if (hash != 0) {                     // if it has a hash, just return it
        return hash;
      }
      hash = get_next_hash(current, obj);  // get a new hash
      temp = mark.copy_set_hash(hash);     // merge the hash into header
                                           // try to install the hash
      test = obj->cas_set_mark(temp, mark);
      if (test == mark) {                  // if the hash was installed, return it
        return hash;
      }
      if (LockingMode == LM_LIGHTWEIGHT) {
        // CAS failed, retry
        continue;
      }
      // Failed to install the hash. It could be that another thread
      // installed the hash just before our attempt or inflation has
      // occurred or... so we fall thru to inflate the monitor for
      // stability and then install the hash.
    } else if (mark.has_monitor()) {
      monitor = mark.monitor();
      temp = monitor->header();
      assert(temp.is_neutral(), "invariant: header=" INTPTR_FORMAT, temp.value());
      hash = temp.hash();
      if (hash != 0) {
        // It has a hash.

        // Separate load of dmw/header above from the loads in
        // is_being_async_deflated().

        // dmw/header and _contentions may get written by different threads.
        // Make sure to observe them in the same order when having several observers.
        OrderAccess::loadload_for_IRIW();

        if (monitor->is_being_async_deflated()) {
          // But we can't safely use the hash if we detect that async
          // deflation has occurred. So we attempt to restore the
          // header/dmw to the object's header so that we only retry
          // once if the deflater thread happens to be slow.
          monitor->install_displaced_markword_in_object(obj);
          continue;
        }
        return hash;
      }
      // Fall thru so we only have one place that installs the hash in
      // the ObjectMonitor.
    } else if (LockingMode == LM_LEGACY && mark.has_locker()
               && current->is_Java_thread()
               && JavaThread::cast(current)->is_lock_owned((address)mark.locker())) {
      // This is a stack-lock owned by the calling thread so fetch the
      // displaced markWord from the BasicLock on the stack.
      temp = mark.displaced_mark_helper();
      assert(temp.is_neutral(), "invariant: header=" INTPTR_FORMAT, temp.value());
      hash = temp.hash();
      if (hash != 0) {                  // if it has a hash, just return it
        return hash;
      }
      // WARNING:
      // The displaced header in the BasicLock on a thread's stack
      // is strictly immutable. It CANNOT be changed in ANY cases.
      // So we have to inflate the stack-lock into an ObjectMonitor
      // even if the current thread owns the lock. The BasicLock on
      // a thread's stack can be asynchronously read by other threads
      // during an inflate() call so any change to that stack memory
      // may not propagate to other threads correctly.
    }

    // Inflate the monitor to set the hash.

    // There's no need to inflate if the mark has already got a monitor.
    // NOTE: an async deflation can race after we get the monitor and
    // before we can update the ObjectMonitor's header with the hash
    // value below.
    monitor = mark.has_monitor() ? mark.monitor() : inflate(current, obj, inflate_cause_hash_code);
    // Load ObjectMonitor's header/dmw field and see if it has a hash.
    mark = monitor->header();
    assert(mark.is_neutral(), "invariant: header=" INTPTR_FORMAT, mark.value());
    hash = mark.hash();
    if (hash == 0) {                       // if it does not have a hash
      hash = get_next_hash(current, obj);  // get a new hash
      temp = mark.copy_set_hash(hash)   ;  // merge the hash into header
      assert(temp.is_neutral(), "invariant: header=" INTPTR_FORMAT, temp.value());
      // Install the hashed header into the monitor; 'v' is the value the
      // cmpxchg found in the field.
      uintptr_t v = Atomic::cmpxchg((volatile uintptr_t*)monitor->header_addr(), mark.value(), temp.value());
      test = markWord(v);
      if (test != mark) {
        // The attempt to update the ObjectMonitor's header/dmw field
        // did not work. This can happen if another thread managed to
        // merge in the hash just before our cmpxchg().
        // If we add any new usages of the header/dmw field, this code
        // will need to be updated.
        hash = test.hash();
        assert(test.is_neutral(), "invariant: header=" INTPTR_FORMAT, test.value());
        assert(hash != 0, "should only have lost the race to a thread that set a non-zero hash");
      }
      if (monitor->is_being_async_deflated()) {
        // If we detect that async deflation has occurred, then we
        // attempt to restore the header/dmw to the object's header
        // so that we only retry once if the deflater thread happens
        // to be slow.
        monitor->install_displaced_markword_in_object(obj);
        continue;
      }
    }
    // We finally get the hash.
    return hash;
  }
}
1130 
1131 bool ObjectSynchronizer::current_thread_holds_lock(JavaThread* current,
1132                                                    Handle h_obj) {
1133   assert(current == JavaThread::current(), "Can only be called on current thread");
1134   oop obj = h_obj();
1135 
1136   markWord mark = read_stable_mark(obj);
1137 
1138   if (LockingMode == LM_LEGACY && mark.has_locker()) {
1139     // stack-locked case, header points into owner's stack
1140     return current->is_lock_owned((address)mark.locker());
1141   }
1142 
1143   if (LockingMode == LM_LIGHTWEIGHT && mark.is_fast_locked()) {
1144     // fast-locking case, see if lock is in current's lock stack
1145     return current->lock_stack().contains(h_obj());
1146   }
1147 
1148   if (mark.has_monitor()) {
1149     // Inflated monitor so header points to ObjectMonitor (tagged pointer).
1150     // The first stage of async deflation does not affect any field
1151     // used by this comparison so the ObjectMonitor* is usable here.
1152     ObjectMonitor* monitor = mark.monitor();
1153     return monitor->is_entered(current) != 0;
1154   }
1155   // Unlocked case, header in place
1156   assert(mark.is_unlocked(), "sanity check");
1157   return false;
1158 }
1159 
1160 JavaThread* ObjectSynchronizer::get_lock_owner(ThreadsList * t_list, Handle h_obj) {
1161   oop obj = h_obj();
1162   markWord mark = read_stable_mark(obj);
1163 
1164   if (LockingMode == LM_LEGACY && mark.has_locker()) {
1165     // stack-locked so header points into owner's stack.
1166     // owning_thread_from_monitor_owner() may also return null here:
1167     return Threads::owning_thread_from_monitor_owner(t_list, (address) mark.locker());
1168   }
1169 
1170   if (LockingMode == LM_LIGHTWEIGHT && mark.is_fast_locked()) {
1171     // fast-locked so get owner from the object.
1172     // owning_thread_from_object() may also return null here:
1173     return Threads::owning_thread_from_object(t_list, h_obj());
1174   }
1175 
1176   if (mark.has_monitor()) {
1177     // Inflated monitor so header points to ObjectMonitor (tagged pointer).
1178     // The first stage of async deflation does not affect any field
1179     // used by this comparison so the ObjectMonitor* is usable here.
1180     ObjectMonitor* monitor = mark.monitor();
1181     assert(monitor != nullptr, "monitor should be non-null");
1182     // owning_thread_from_monitor() may also return null here:
1183     return Threads::owning_thread_from_monitor(t_list, monitor);
1184   }
1185 
1186   // Unlocked case, header in place
1187   // Cannot have assertion since this object may have been
1188   // locked by another thread when reaching here.
1189   // assert(mark.is_unlocked(), "sanity check");
1190 
1191   return nullptr;
1192 }
1193 
1194 // Visitors ...
1195 
1196 // Iterate over all ObjectMonitors.
1197 template <typename Function>
1198 void ObjectSynchronizer::monitors_iterate(Function function) {
1199   MonitorList::Iterator iter = _in_use_list.iterator();
1200   while (iter.has_next()) {
1201     ObjectMonitor* monitor = iter.next();
1202     function(monitor);
1203   }
1204 }
1205 
1206 // Iterate ObjectMonitors owned by any thread and where the owner `filter`
1207 // returns true.
1208 template <typename OwnerFilter>
1209 void ObjectSynchronizer::owned_monitors_iterate_filtered(MonitorClosure* closure, OwnerFilter filter) {
1210   monitors_iterate([&](ObjectMonitor* monitor) {
1211     // This function is only called at a safepoint or when the
1212     // target thread is suspended or when the target thread is
1213     // operating on itself. The current closures in use today are
1214     // only interested in an owned ObjectMonitor and ownership
1215     // cannot be dropped under the calling contexts so the
1216     // ObjectMonitor cannot be async deflated.
1217     if (monitor->has_owner() && filter(monitor->owner_raw())) {
1218       assert(!monitor->is_being_async_deflated(), "Owned monitors should not be deflating");
1219 
1220       closure->do_monitor(monitor);
1221     }
1222   });
1223 }
1224 
1225 // Iterate ObjectMonitors where the owner == thread; this does NOT include
1226 // ObjectMonitors where owner is set to a stack-lock address in thread.
1227 void ObjectSynchronizer::owned_monitors_iterate(MonitorClosure* closure, JavaThread* thread) {
1228   auto thread_filter = [&](void* owner) { return owner == thread; };
1229   return owned_monitors_iterate_filtered(closure, thread_filter);
1230 }
1231 
1232 // Iterate ObjectMonitors owned by any thread.
1233 void ObjectSynchronizer::owned_monitors_iterate(MonitorClosure* closure) {
1234   auto all_filter = [&](void* owner) { return true; };
1235   return owned_monitors_iterate_filtered(closure, all_filter);
1236 }
1237 
1238 static bool monitors_used_above_threshold(MonitorList* list) {
1239   if (MonitorUsedDeflationThreshold == 0) {  // disabled case is easy
1240     return false;
1241   }
1242   // Start with ceiling based on a per-thread estimate:
1243   size_t ceiling = ObjectSynchronizer::in_use_list_ceiling();
1244   size_t old_ceiling = ceiling;
1245   if (ceiling < list->max()) {
1246     // The max used by the system has exceeded the ceiling so use that:
1247     ceiling = list->max();
1248   }
1249   size_t monitors_used = list->count();
1250   if (monitors_used == 0) {  // empty list is easy
1251     return false;
1252   }
1253   if (NoAsyncDeflationProgressMax != 0 &&
1254       _no_progress_cnt >= NoAsyncDeflationProgressMax) {
1255     double remainder = (100.0 - MonitorUsedDeflationThreshold) / 100.0;
1256     size_t new_ceiling = ceiling + (size_t)((double)ceiling * remainder) + 1;
1257     ObjectSynchronizer::set_in_use_list_ceiling(new_ceiling);
1258     log_info(monitorinflation)("Too many deflations without progress; "
1259                                "bumping in_use_list_ceiling from " SIZE_FORMAT
1260                                " to " SIZE_FORMAT, old_ceiling, new_ceiling);
1261     _no_progress_cnt = 0;
1262     ceiling = new_ceiling;
1263   }
1264 
1265   // Check if our monitor usage is above the threshold:
1266   size_t monitor_usage = (monitors_used * 100LL) / ceiling;
1267   if (int(monitor_usage) > MonitorUsedDeflationThreshold) {
1268     log_info(monitorinflation)("monitors_used=" SIZE_FORMAT ", ceiling=" SIZE_FORMAT
1269                                ", monitor_usage=" SIZE_FORMAT ", threshold=%d",
1270                                monitors_used, ceiling, monitor_usage, MonitorUsedDeflationThreshold);
1271     return true;
1272   }
1273 
1274   return false;
1275 }
1276 
// Returns the current value of the in-use list ceiling.
size_t ObjectSynchronizer::in_use_list_ceiling() {
  return _in_use_list_ceiling;
}
1280 
// Atomically lowers the in-use list ceiling by AvgMonitorsPerThreadEstimate.
void ObjectSynchronizer::dec_in_use_list_ceiling() {
  Atomic::sub(&_in_use_list_ceiling, AvgMonitorsPerThreadEstimate);
}
1284 
// Atomically raises the in-use list ceiling by AvgMonitorsPerThreadEstimate.
void ObjectSynchronizer::inc_in_use_list_ceiling() {
  Atomic::add(&_in_use_list_ceiling, AvgMonitorsPerThreadEstimate);
}
1288 
// Overwrites the in-use list ceiling with new_value (a plain store, unlike
// the Atomic::add/sub used by the inc/dec variants).
void ObjectSynchronizer::set_in_use_list_ceiling(size_t new_value) {
  _in_use_list_ceiling = new_value;
}
1292 
1293 bool ObjectSynchronizer::is_async_deflation_needed() {
1294   if (is_async_deflation_requested()) {
1295     // Async deflation request.
1296     log_info(monitorinflation)("Async deflation needed: explicit request");
1297     return true;
1298   }
1299 
1300   jlong time_since_last = time_since_last_async_deflation_ms();
1301 
1302   if (AsyncDeflationInterval > 0 &&
1303       time_since_last > AsyncDeflationInterval &&
1304       monitors_used_above_threshold(&_in_use_list)) {
1305     // It's been longer than our specified deflate interval and there
1306     // are too many monitors in use. We don't deflate more frequently
1307     // than AsyncDeflationInterval (unless is_async_deflation_requested)
1308     // in order to not swamp the MonitorDeflationThread.
1309     log_info(monitorinflation)("Async deflation needed: monitors used are above the threshold");
1310     return true;
1311   }
1312 
1313   if (GuaranteedAsyncDeflationInterval > 0 &&
1314       time_since_last > GuaranteedAsyncDeflationInterval) {
1315     // It's been longer than our specified guaranteed deflate interval.
1316     // We need to clean up the used monitors even if the threshold is
1317     // not reached, to keep the memory utilization at bay when many threads
1318     // touched many monitors.
1319     log_info(monitorinflation)("Async deflation needed: guaranteed interval (" INTX_FORMAT " ms) "
1320                                "is greater than time since last deflation (" JLONG_FORMAT " ms)",
1321                                GuaranteedAsyncDeflationInterval, time_since_last);
1322 
1323     // If this deflation has no progress, then it should not affect the no-progress
1324     // tracking, otherwise threshold heuristics would think it was triggered, experienced
1325     // no progress, and needs to backoff more aggressively. In this "no progress" case,
1326     // the generic code would bump the no-progress counter, and we compensate for that
1327     // by telling it to skip the update.
1328     //
1329     // If this deflation has progress, then it should let non-progress tracking
1330     // know about this, otherwise the threshold heuristics would kick in, potentially
1331     // experience no-progress due to aggressive cleanup by this deflation, and think
1332     // it is still in no-progress stride. In this "progress" case, the generic code would
1333     // zero the counter, and we allow it to happen.
1334     _no_progress_skip_increment = true;
1335 
1336     return true;
1337   }
1338 
1339   return false;
1340 }
1341 
// Flags an async deflation request and wakes every thread waiting on
// MonitorDeflation_lock. The lock is taken without a safepoint check.
void ObjectSynchronizer::request_deflate_idle_monitors() {
  MonitorLocker ml(MonitorDeflation_lock, Mutex::_no_safepoint_check_flag);
  set_is_async_deflation_requested(true);
  ml.notify_all();
}
1347 
1348 bool ObjectSynchronizer::request_deflate_idle_monitors_from_wb() {
1349   JavaThread* current = JavaThread::current();
1350   bool ret_code = false;
1351 
1352   jlong last_time = last_async_deflation_time_ns();
1353 
1354   request_deflate_idle_monitors();
1355 
1356   const int N_CHECKS = 5;
1357   for (int i = 0; i < N_CHECKS; i++) {  // sleep for at most 5 seconds
1358     if (last_async_deflation_time_ns() > last_time) {
1359       log_info(monitorinflation)("Async Deflation happened after %d check(s).", i);
1360       ret_code = true;
1361       break;
1362     }
1363     {
1364       // JavaThread has to honor the blocking protocol.
1365       ThreadBlockInVM tbivm(current);
1366       os::naked_short_sleep(999);  // sleep for almost 1 second
1367     }
1368   }
1369   if (!ret_code) {
1370     log_info(monitorinflation)("Async Deflation DID NOT happen after %d checks.", N_CHECKS);
1371   }
1372 
1373   return ret_code;
1374 }
1375 
// Returns the time elapsed since the last async deflation, in milliseconds.
// Both timestamps are in nanoseconds; the difference is divided by the
// number of nanoseconds per millisecond (NANOUNITS / MILLIUNITS).
jlong ObjectSynchronizer::time_since_last_async_deflation_ms() {
  return (os::javaTimeNanos() - last_async_deflation_time_ns()) / (NANOUNITS / MILLIUNITS);
}
1379 
1380 static void post_monitor_inflate_event(EventJavaMonitorInflate* event,
1381                                        const oop obj,
1382                                        ObjectSynchronizer::InflateCause cause) {
1383   assert(event != nullptr, "invariant");
1384   event->set_monitorClass(obj->klass());
1385   event->set_address((uintptr_t)(void*)obj);
1386   event->set_cause((u1)cause);
1387   event->commit();
1388 }
1389 
1390 // Fast path code shared by multiple functions
1391 void ObjectSynchronizer::inflate_helper(oop obj) {
1392   markWord mark = obj->mark_acquire();
1393   if (mark.has_monitor()) {
1394     ObjectMonitor* monitor = mark.monitor();
1395     markWord dmw = monitor->header();
1396     assert(dmw.is_neutral(), "sanity check: header=" INTPTR_FORMAT, dmw.value());
1397     return;
1398   }
1399   (void)inflate(Thread::current(), obj, inflate_cause_vm_internal);
1400 }
1401 
1402 ObjectMonitor* ObjectSynchronizer::inflate(Thread* current, oop obj, const InflateCause cause) {
1403   assert(current == Thread::current(), "must be");
1404   if (LockingMode == LM_LIGHTWEIGHT && current->is_Java_thread()) {
1405     return inflate_impl(JavaThread::cast(current), obj, cause);
1406   }
1407   return inflate_impl(nullptr, obj, cause);
1408 }
1409 
1410 ObjectMonitor* ObjectSynchronizer::inflate_for(JavaThread* thread, oop obj, const InflateCause cause) {
1411   assert(thread == Thread::current() || thread->is_obj_deopt_suspend(), "must be");
1412   return inflate_impl(thread, obj, cause);
1413 }
1414 
// Returns the ObjectMonitor that 'object''s mark word refers to, first
// creating and installing one if the mark word does not yet refer to a
// monitor.
//
// The function loops, re-reading the mark word each time, until it either
// observes an already-inflated mark or succeeds in installing a freshly
// allocated ObjectMonitor. A monitor that was allocated speculatively but
// could not be installed (the mark changed underneath us) is deleted before
// the next attempt.
//
// inflating_thread - thread on whose behalf inflation happens; may be nullptr
//                    (see the comment at the top of the body).
// object           - the object whose lock is being inflated.
// cause            - reported in the JavaMonitorInflate event that is posted
//                    when a new monitor is installed and the event should be
//                    committed.
ObjectMonitor* ObjectSynchronizer::inflate_impl(JavaThread* inflating_thread, oop object, const InflateCause cause) {
  // The JavaThread* inflating_thread parameter is only used by LM_LIGHTWEIGHT and requires
  // that the inflating_thread == Thread::current() or is suspended throughout the call by
  // some other mechanism.
  // Even with LM_LIGHTWEIGHT the thread might be nullptr when called from a non
  // JavaThread. (As may still be the case from FastHashCode). However it is only
  // important for the correctness of the LM_LIGHTWEIGHT algorithm that the thread
  // is set when called from ObjectSynchronizer::enter from the owning thread,
  // ObjectSynchronizer::enter_for from any thread, or ObjectSynchronizer::exit.
  EventJavaMonitorInflate event;

  for (;;) {
    const markWord mark = object->mark_acquire();

    // The mark can be in one of the following states:
    // *  inflated     - Just return if using stack-locking.
    //                   If using fast-locking and the ObjectMonitor owner
    //                   is anonymous and the inflating_thread owns the
    //                   object lock, then we make the inflating_thread
    //                   the ObjectMonitor owner and remove the lock from
    //                   the inflating_thread's lock stack.
    // *  fast-locked  - Coerce it to inflated from fast-locked.
    // *  stack-locked - Coerce it to inflated from stack-locked.
    // *  INFLATING    - Busy wait for conversion from stack-locked to
    //                   inflated.
    // *  unlocked     - Aggressively inflate the object.

    // CASE: inflated
    if (mark.has_monitor()) {
      ObjectMonitor* inf = mark.monitor();
      markWord dmw = inf->header();
      assert(dmw.is_neutral(), "invariant: header=" INTPTR_FORMAT, dmw.value());
      if (LockingMode == LM_LIGHTWEIGHT && inf->is_owner_anonymous() &&
          inflating_thread != nullptr && inflating_thread->lock_stack().contains(object)) {
        // The anonymous owner turns out to be inflating_thread: make the
        // ownership explicit and move the lock-stack entries into the
        // monitor's recursion count (one entry is the ownership itself).
        inf->set_owner_from_anonymous(inflating_thread);
        size_t removed = inflating_thread->lock_stack().remove(object);
        inf->set_recursions(removed - 1);
      }
      return inf;
    }

    if (LockingMode != LM_LIGHTWEIGHT) {
      // New lightweight locking does not use INFLATING.
      // CASE: inflation in progress - inflating over a stack-lock.
      // Some other thread is converting from stack-locked to inflated.
      // Only that thread can complete inflation -- other threads must wait.
      // The INFLATING value is transient.
      // Currently, we spin/yield/park and poll the markword, waiting for inflation to finish.
      // We could always eliminate polling by parking the thread on some auxiliary list.
      if (mark == markWord::INFLATING()) {
        read_stable_mark(object);
        continue;
      }
    }

    // CASE: fast-locked
    // Could be fast-locked either by the inflating_thread or by some other thread.
    //
    // Note that we allocate the ObjectMonitor speculatively, _before_
    // attempting to set the object's mark to the new ObjectMonitor. If
    // the inflating_thread owns the monitor, then we set the ObjectMonitor's
    // owner to the inflating_thread. Otherwise, we set the ObjectMonitor's owner
    // to anonymous. If we lose the race to set the object's mark to the
    // new ObjectMonitor, then we just delete it and loop around again.
    //
    LogStreamHandle(Trace, monitorinflation) lsh;
    if (LockingMode == LM_LIGHTWEIGHT && mark.is_fast_locked()) {
      ObjectMonitor* monitor = new ObjectMonitor(object);
      monitor->set_header(mark.set_unlocked());
      bool own = inflating_thread != nullptr && inflating_thread->lock_stack().contains(object);
      if (own) {
        // Owned by inflating_thread.
        monitor->set_owner_from(nullptr, inflating_thread);
      } else {
        // Owned by somebody else.
        monitor->set_owner_anonymous();
      }
      markWord monitor_mark = markWord::encode(monitor);
      markWord old_mark = object->cas_set_mark(monitor_mark, mark);
      if (old_mark == mark) {
        // Success! Return inflated monitor.
        if (own) {
          // Transfer the lock-stack entries into the monitor's recursion
          // count; one of the removed entries represents ownership itself.
          size_t removed = inflating_thread->lock_stack().remove(object);
          monitor->set_recursions(removed - 1);
        }
        // Once the ObjectMonitor is configured and object is associated
        // with the ObjectMonitor, it is safe to allow async deflation:
        _in_use_list.add(monitor);

        // Hopefully the performance counters are allocated on distinct
        // cache lines to avoid false sharing on MP systems ...
        OM_PERFDATA_OP(Inflations, inc());
        if (log_is_enabled(Trace, monitorinflation)) {
          ResourceMark rm;
          // NOTE(review): the message is labelled "has_locker" although this
          // is the fast-locked branch -- confirm whether that is intended.
          lsh.print_cr("inflate(has_locker): object=" INTPTR_FORMAT ", mark="
                       INTPTR_FORMAT ", type='%s'", p2i(object),
                       object->mark().value(), object->klass()->external_name());
        }
        if (event.should_commit()) {
          post_monitor_inflate_event(&event, object, cause);
        }
        return monitor;
      } else {
        delete monitor;
        continue;  // Interference -- just retry
      }
    }

    // CASE: stack-locked
    // Could be stack-locked either by current or by some other thread.
    //
    // Note that we allocate the ObjectMonitor speculatively, _before_ attempting
    // to install INFLATING into the mark word.  We originally installed INFLATING,
    // allocated the ObjectMonitor, and then finally STed the address of the
    // ObjectMonitor into the mark.  This was correct, but artificially lengthened
    // the interval in which INFLATING appeared in the mark, thus increasing
    // the odds of inflation contention. If we lose the race to set INFLATING,
    // then we just delete the ObjectMonitor and loop around again.
    //
    if (LockingMode == LM_LEGACY && mark.has_locker()) {
      assert(LockingMode != LM_LIGHTWEIGHT, "cannot happen with new lightweight locking");
      ObjectMonitor* m = new ObjectMonitor(object);
      // Optimistically prepare the ObjectMonitor - anticipate successful CAS
      // We do this before the CAS in order to minimize the length of time
      // in which INFLATING appears in the mark.

      markWord cmp = object->cas_set_mark(markWord::INFLATING(), mark);
      if (cmp != mark) {
        delete m;
        continue;       // Interference -- just retry
      }

      // We've successfully installed INFLATING (0) into the mark-word.
      // This is the only case where 0 will appear in a mark-word.
      // Only the singular thread that successfully swings the mark-word
      // to 0 can perform (or more precisely, complete) inflation.
      //
      // Why do we CAS a 0 into the mark-word instead of just CASing the
      // mark-word from the stack-locked value directly to the new inflated state?
      // Consider what happens when a thread unlocks a stack-locked object.
      // It attempts to use CAS to swing the displaced header value from the
      // on-stack BasicLock back into the object header.  Recall also that the
      // header value (hash code, etc) can reside in (a) the object header, or
      // (b) a displaced header associated with the stack-lock, or (c) a displaced
      // header in an ObjectMonitor.  The inflate() routine must copy the header
      // value from the BasicLock on the owner's stack to the ObjectMonitor, all
      // the while preserving the hashCode stability invariants.  If the owner
      // decides to release the lock while the value is 0, the unlock will fail
      // and control will eventually pass from slow_exit() to inflate.  The owner
      // will then spin, waiting for the 0 value to disappear.   Put another way,
      // the 0 causes the owner to stall if the owner happens to try to
      // drop the lock (restoring the header from the BasicLock to the object)
      // while inflation is in-progress.  This protocol avoids races that
      // would otherwise permit hashCode values to change or "flicker" for an object.
      // Critically, while object->mark is 0 mark.displaced_mark_helper() is stable.
      // 0 serves as a "BUSY" inflate-in-progress indicator.


      // fetch the displaced mark from the owner's stack.
      // The owner can't die or unwind past the lock while our INFLATING
      // object is in the mark.  Furthermore the owner can't complete
      // an unlock on the object, either.
      markWord dmw = mark.displaced_mark_helper();
      // Catch if the object's header is not neutral (not locked and
      // not marked is what we care about here).
      assert(dmw.is_neutral(), "invariant: header=" INTPTR_FORMAT, dmw.value());

      // Setup monitor fields to proper values -- prepare the monitor
      m->set_header(dmw);

      // Optimization: if the mark.locker stack address is associated
      // with this thread we could simply set m->_owner = current.
      // Note that a thread can inflate an object
      // that it has stack-locked -- as might happen in wait() -- directly
      // with CAS.  That is, we can avoid the xchg-nullptr .... ST idiom.
      m->set_owner_from(nullptr, mark.locker());
      // TODO-FIXME: assert BasicLock->dhw != 0.

      // Must preserve store ordering. The monitor state must
      // be stable at the time of publishing the monitor address.
      guarantee(object->mark() == markWord::INFLATING(), "invariant");
      // Release semantics so that the monitor fields set above are seen
      // before the monitor address is published in the mark word.
      object->release_set_mark(markWord::encode(m));

      // Once ObjectMonitor is configured and the object is associated
      // with the ObjectMonitor, it is safe to allow async deflation:
      _in_use_list.add(m);

      // Hopefully the performance counters are allocated on distinct cache lines
      // to avoid false sharing on MP systems ...
      OM_PERFDATA_OP(Inflations, inc());
      if (log_is_enabled(Trace, monitorinflation)) {
        ResourceMark rm;
        lsh.print_cr("inflate(has_locker): object=" INTPTR_FORMAT ", mark="
                     INTPTR_FORMAT ", type='%s'", p2i(object),
                     object->mark().value(), object->klass()->external_name());
      }
      if (event.should_commit()) {
        post_monitor_inflate_event(&event, object, cause);
      }
      return m;
    }

    // CASE: unlocked
    // TODO-FIXME: for entry we currently inflate and then try to CAS _owner.
    // If we know we're inflating for entry it's better to inflate by swinging a
    // pre-locked ObjectMonitor pointer into the object header.   A successful
    // CAS inflates the object *and* confers ownership to the inflating thread.
    // In the current implementation we use a 2-step mechanism where we CAS()
    // to inflate and then CAS() again to try to swing _owner from null to current.
    // An inflateTry() method that we could call from enter() would be useful.

    assert(mark.is_unlocked(), "invariant: header=" INTPTR_FORMAT, mark.value());
    ObjectMonitor* m = new ObjectMonitor(object);
    // prepare m for installation - set monitor to initial state
    m->set_header(mark);

    if (object->cas_set_mark(markWord::encode(m), mark) != mark) {
      delete m;
      m = nullptr;
      continue;
      // interference - the markword changed - just retry.
      // The state-transitions are one-way, so there's no chance of
      // live-lock -- "Inflated" is an absorbing state.
    }

    // Once the ObjectMonitor is configured and object is associated
    // with the ObjectMonitor, it is safe to allow async deflation:
    _in_use_list.add(m);

    // Hopefully the performance counters are allocated on distinct
    // cache lines to avoid false sharing on MP systems ...
    OM_PERFDATA_OP(Inflations, inc());
    if (log_is_enabled(Trace, monitorinflation)) {
      ResourceMark rm;
      lsh.print_cr("inflate(unlocked): object=" INTPTR_FORMAT ", mark="
                   INTPTR_FORMAT ", type='%s'", p2i(object),
                   object->mark().value(), object->klass()->external_name());
    }
    if (event.should_commit()) {
      post_monitor_inflate_event(&event, object, cause);
    }
    return m;
  }
}
1660 
1661 // Walk the in-use list and deflate (at most MonitorDeflationMax) idle
1662 // ObjectMonitors. Returns the number of deflated ObjectMonitors.
1663 //
1664 size_t ObjectSynchronizer::deflate_monitor_list(ObjectMonitorDeflationSafepointer* safepointer) {
1665   MonitorList::Iterator iter = _in_use_list.iterator();
1666   size_t deflated_count = 0;
1667 
1668   while (iter.has_next()) {
1669     if (deflated_count >= (size_t)MonitorDeflationMax) {
1670       break;
1671     }
1672     ObjectMonitor* mid = iter.next();
1673     if (mid->deflate_monitor()) {
1674       deflated_count++;
1675     }
1676 
1677     // Must check for a safepoint/handshake and honor it.
1678     safepointer->block_for_safepoint("deflation", "deflated_count", deflated_count);
1679   }
1680 
1681   return deflated_count;
1682 }
1683 
1684 class HandshakeForDeflation : public HandshakeClosure {
1685  public:
1686   HandshakeForDeflation() : HandshakeClosure("HandshakeForDeflation") {}
1687 
1688   void do_thread(Thread* thread) {
1689     log_trace(monitorinflation)("HandshakeForDeflation::do_thread: thread="
1690                                 INTPTR_FORMAT, p2i(thread));
1691   }
1692 };
1693 
1694 class VM_RendezvousGCThreads : public VM_Operation {
1695 public:
1696   bool evaluate_at_safepoint() const override { return false; }
1697   VMOp_Type type() const override { return VMOp_RendezvousGCThreads; }
1698   void doit() override {
1699     Universe::heap()->safepoint_synchronize_begin();
1700     Universe::heap()->safepoint_synchronize_end();
1701   };
1702 };
1703 
1704 static size_t delete_monitors(GrowableArray<ObjectMonitor*>* delete_list,
1705                               ObjectMonitorDeflationSafepointer* safepointer) {
1706   NativeHeapTrimmer::SuspendMark sm("monitor deletion");
1707   size_t deleted_count = 0;
1708   for (ObjectMonitor* monitor: *delete_list) {
1709     delete monitor;
1710     deleted_count++;
1711     // A JavaThread must check for a safepoint/handshake and honor it.
1712     safepointer->block_for_safepoint("deletion", "deleted_count", deleted_count);
1713   }
1714   return deleted_count;
1715 }
1716 
1717 class ObjectMonitorDeflationLogging: public StackObj {
1718   LogStreamHandle(Debug, monitorinflation) _debug;
1719   LogStreamHandle(Info, monitorinflation)  _info;
1720   LogStream*                               _stream;
1721   elapsedTimer                             _timer;
1722 
1723   size_t ceiling() const { return ObjectSynchronizer::in_use_list_ceiling(); }
1724   size_t count() const   { return ObjectSynchronizer::_in_use_list.count(); }
1725   size_t max() const     { return ObjectSynchronizer::_in_use_list.max(); }
1726 
1727 public:
1728   ObjectMonitorDeflationLogging()
1729     : _debug(), _info(), _stream(nullptr) {
1730     if (_debug.is_enabled()) {
1731       _stream = &_debug;
1732     } else if (_info.is_enabled()) {
1733       _stream = &_info;
1734     }
1735   }
1736 
1737   void begin() {
1738     if (_stream != nullptr) {
1739       _stream->print_cr("begin deflating: in_use_list stats: ceiling=" SIZE_FORMAT ", count=" SIZE_FORMAT ", max=" SIZE_FORMAT,
1740                         ceiling(), count(), max());
1741       _timer.start();
1742     }
1743   }
1744 
1745   void before_handshake(size_t unlinked_count) {
1746     if (_stream != nullptr) {
1747       _timer.stop();
1748       _stream->print_cr("before handshaking: unlinked_count=" SIZE_FORMAT
1749                         ", in_use_list stats: ceiling=" SIZE_FORMAT ", count="
1750                         SIZE_FORMAT ", max=" SIZE_FORMAT,
1751                         unlinked_count, ceiling(), count(), max());
1752     }
1753   }
1754 
1755   void after_handshake() {
1756     if (_stream != nullptr) {
1757       _stream->print_cr("after handshaking: in_use_list stats: ceiling="
1758                         SIZE_FORMAT ", count=" SIZE_FORMAT ", max=" SIZE_FORMAT,
1759                         ceiling(), count(), max());
1760       _timer.start();
1761     }
1762   }
1763 
1764   void end(size_t deflated_count, size_t unlinked_count) {
1765     if (_stream != nullptr) {
1766       _timer.stop();
1767       if (deflated_count != 0 || unlinked_count != 0 || _debug.is_enabled()) {
1768         _stream->print_cr("deflated_count=" SIZE_FORMAT ", {unlinked,deleted}_count=" SIZE_FORMAT " monitors in %3.7f secs",
1769                           deflated_count, unlinked_count, _timer.seconds());
1770       }
1771       _stream->print_cr("end deflating: in_use_list stats: ceiling=" SIZE_FORMAT ", count=" SIZE_FORMAT ", max=" SIZE_FORMAT,
1772                         ceiling(), count(), max());
1773     }
1774   }
1775 
1776   void before_block_for_safepoint(const char* op_name, const char* cnt_name, size_t cnt) {
1777     if (_stream != nullptr) {
1778       _timer.stop();
1779       _stream->print_cr("pausing %s: %s=" SIZE_FORMAT ", in_use_list stats: ceiling="
1780                         SIZE_FORMAT ", count=" SIZE_FORMAT ", max=" SIZE_FORMAT,
1781                         op_name, cnt_name, cnt, ceiling(), count(), max());
1782     }
1783   }
1784 
1785   void after_block_for_safepoint(const char* op_name) {
1786     if (_stream != nullptr) {
1787       _stream->print_cr("resuming %s: in_use_list stats: ceiling=" SIZE_FORMAT
1788                         ", count=" SIZE_FORMAT ", max=" SIZE_FORMAT, op_name,
1789                         ceiling(), count(), max());
1790       _timer.start();
1791     }
1792   }
1793 };
1794 
1795 void ObjectMonitorDeflationSafepointer::block_for_safepoint(const char* op_name, const char* count_name, size_t counter) {
1796   if (!SafepointMechanism::should_process(_current)) {
1797     return;
1798   }
1799 
1800   // A safepoint/handshake has started.
1801   _log->before_block_for_safepoint(op_name, count_name, counter);
1802 
1803   {
1804     // Honor block request.
1805     ThreadBlockInVM tbivm(_current);
1806   }
1807 
1808   _log->after_block_for_safepoint(op_name);
1809 }
1810 
1811 // This function is called by the MonitorDeflationThread to deflate
1812 // ObjectMonitors.
1813 size_t ObjectSynchronizer::deflate_idle_monitors() {
1814   JavaThread* current = JavaThread::current();
1815   assert(current->is_monitor_deflation_thread(), "The only monitor deflater");
1816 
1817   // The async deflation request has been processed.
1818   _last_async_deflation_time_ns = os::javaTimeNanos();
1819   set_is_async_deflation_requested(false);
1820 
1821   ObjectMonitorDeflationLogging log;
1822   ObjectMonitorDeflationSafepointer safepointer(current, &log);
1823 
1824   log.begin();
1825 
1826   // Deflate some idle ObjectMonitors.
1827   size_t deflated_count = deflate_monitor_list(&safepointer);
1828 
1829   // Unlink the deflated ObjectMonitors from the in-use list.
1830   size_t unlinked_count = 0;
1831   size_t deleted_count = 0;
1832   if (deflated_count > 0) {
1833     ResourceMark rm(current);
1834     GrowableArray<ObjectMonitor*> delete_list((int)deflated_count);
1835     unlinked_count = _in_use_list.unlink_deflated(deflated_count, &delete_list, &safepointer);
1836 
1837     log.before_handshake(unlinked_count);
1838 
1839     // A JavaThread needs to handshake in order to safely free the
1840     // ObjectMonitors that were deflated in this cycle.
1841     HandshakeForDeflation hfd_hc;
1842     Handshake::execute(&hfd_hc);
1843     // Also, we sync and desync GC threads around the handshake, so that they can
1844     // safely read the mark-word and look-through to the object-monitor, without
1845     // being afraid that the object-monitor is going away.
1846     VM_RendezvousGCThreads sync_gc;
1847     VMThread::execute(&sync_gc);
1848 
1849     log.after_handshake();
1850 
1851     // After the handshake, safely free the ObjectMonitors that were
1852     // deflated and unlinked in this cycle.
1853 
1854     // Delete the unlinked ObjectMonitors.
1855     deleted_count = delete_monitors(&delete_list, &safepointer);
1856     assert(unlinked_count == deleted_count, "must be");
1857   }
1858 
1859   log.end(deflated_count, unlinked_count);
1860 
1861   OM_PERFDATA_OP(MonExtant, set_value(_in_use_list.count()));
1862   OM_PERFDATA_OP(Deflations, inc(deflated_count));
1863 
1864   GVars.stw_random = os::random();
1865 
1866   if (deflated_count != 0) {
1867     _no_progress_cnt = 0;
1868   } else if (_no_progress_skip_increment) {
1869     _no_progress_skip_increment = false;
1870   } else {
1871     _no_progress_cnt++;
1872   }
1873 
1874   return deflated_count;
1875 }
1876 
1877 // Monitor cleanup on JavaThread::exit
1878 
1879 // Iterate through monitor cache and attempt to release thread's monitors
1880 class ReleaseJavaMonitorsClosure: public MonitorClosure {
1881  private:
1882   JavaThread* _thread;
1883 
1884  public:
1885   ReleaseJavaMonitorsClosure(JavaThread* thread) : _thread(thread) {}
1886   void do_monitor(ObjectMonitor* mid) {
1887     intx rec = mid->complete_exit(_thread);
1888     _thread->dec_held_monitor_count(rec + 1);
1889   }
1890 };
1891 
1892 // Release all inflated monitors owned by current thread.  Lightweight monitors are
1893 // ignored.  This is meant to be called during JNI thread detach which assumes
1894 // all remaining monitors are heavyweight.  All exceptions are swallowed.
1895 // Scanning the extant monitor list can be time consuming.
1896 // A simple optimization is to add a per-thread flag that indicates a thread
1897 // called jni_monitorenter() during its lifetime.
1898 //
1899 // Instead of NoSafepointVerifier it might be cheaper to
1900 // use an idiom of the form:
1901 //   auto int tmp = SafepointSynchronize::_safepoint_counter ;
1902 //   <code that must not run at safepoint>
1903 //   guarantee (((tmp ^ _safepoint_counter) | (tmp & 1)) == 0) ;
1904 // Since the tests are extremely cheap we could leave them enabled
1905 // for normal product builds.
1906 
1907 void ObjectSynchronizer::release_monitors_owned_by_thread(JavaThread* current) {
1908   assert(current == JavaThread::current(), "must be current Java thread");
1909   NoSafepointVerifier nsv;
1910   ReleaseJavaMonitorsClosure rjmc(current);
1911   ObjectSynchronizer::owned_monitors_iterate(&rjmc, current);
1912   assert(!current->has_pending_exception(), "Should not be possible");
1913   current->clear_pending_exception();
1914   assert(current->held_monitor_count() == 0, "Should not be possible");
1915   // All monitors (including entered via JNI) have been unlocked above, so we need to clear jni count.
1916   current->clear_jni_monitor_count();
1917 }
1918 
1919 const char* ObjectSynchronizer::inflate_cause_name(const InflateCause cause) {
1920   switch (cause) {
1921     case inflate_cause_vm_internal:    return "VM Internal";
1922     case inflate_cause_monitor_enter:  return "Monitor Enter";
1923     case inflate_cause_wait:           return "Monitor Wait";
1924     case inflate_cause_notify:         return "Monitor Notify";
1925     case inflate_cause_hash_code:      return "Monitor Hash Code";
1926     case inflate_cause_jni_enter:      return "JNI Monitor Enter";
1927     case inflate_cause_jni_exit:       return "JNI Monitor Exit";
1928     default:
1929       ShouldNotReachHere();
1930   }
1931   return "Unknown";
1932 }
1933 
1934 //------------------------------------------------------------------------------
1935 // Debugging code
1936 
// Returns the address of the GVars object as a byte pointer.
u_char* ObjectSynchronizer::get_gvars_addr() {
  return (u_char*)&GVars;
}
1940 
// Returns the address of the hc_sequence field of GVars as a byte pointer.
u_char* ObjectSynchronizer::get_gvars_hc_sequence_addr() {
  return (u_char*)&GVars.hc_sequence;
}
1944 
// Returns the size in bytes of the SharedGlobals type (presumably the type
// of GVars -- its declaration is outside this part of the file).
size_t ObjectSynchronizer::get_gvars_size() {
  return sizeof(SharedGlobals);
}
1948 
// Returns the address of the stw_random field of GVars as a byte pointer.
u_char* ObjectSynchronizer::get_gvars_stw_random_addr() {
  return (u_char*)&GVars.stw_random;
}
1952 
1953 // Do the final audit and print of ObjectMonitor stats; must be done
1954 // by the VMThread at VM exit time.
1955 void ObjectSynchronizer::do_final_audit_and_print_stats() {
1956   assert(Thread::current()->is_VM_thread(), "sanity check");
1957 
1958   if (is_final_audit()) {  // Only do the audit once.
1959     return;
1960   }
1961   set_is_final_audit();
1962   log_info(monitorinflation)("Starting the final audit.");
1963 
1964   if (log_is_enabled(Info, monitorinflation)) {
1965     LogStreamHandle(Info, monitorinflation) ls;
1966     audit_and_print_stats(&ls, true /* on_exit */);
1967   }
1968 }
1969 
1970 // This function can be called by the MonitorDeflationThread or it can be called when
1971 // we are trying to exit the VM. The list walker functions can run in parallel with
1972 // the other list operations.
1973 // Calls to this function can be added in various places as a debugging
1974 // aid.
1975 //
1976 void ObjectSynchronizer::audit_and_print_stats(outputStream* ls, bool on_exit) {
1977   int error_cnt = 0;
1978 
1979   ls->print_cr("Checking in_use_list:");
1980   chk_in_use_list(ls, &error_cnt);
1981 
1982   if (error_cnt == 0) {
1983     ls->print_cr("No errors found in in_use_list checks.");
1984   } else {
1985     log_error(monitorinflation)("found in_use_list errors: error_cnt=%d", error_cnt);
1986   }
1987 
1988   // When exiting, only log the interesting entries at the Info level.
1989   // When called at intervals by the MonitorDeflationThread, log output
1990   // at the Trace level since there can be a lot of it.
1991   if (!on_exit && log_is_enabled(Trace, monitorinflation)) {
1992     LogStreamHandle(Trace, monitorinflation) ls_tr;
1993     log_in_use_monitor_details(&ls_tr, true /* log_all */);
1994   } else if (on_exit) {
1995     log_in_use_monitor_details(ls, false /* log_all */);
1996   }
1997 
1998   ls->flush();
1999 
2000   guarantee(error_cnt == 0, "ERROR: found monitor list errors: error_cnt=%d", error_cnt);
2001 }
2002 
2003 // Check the in_use_list; log the results of the checks.
2004 void ObjectSynchronizer::chk_in_use_list(outputStream* out, int *error_cnt_p) {
2005   size_t l_in_use_count = _in_use_list.count();
2006   size_t l_in_use_max = _in_use_list.max();
2007   out->print_cr("count=" SIZE_FORMAT ", max=" SIZE_FORMAT, l_in_use_count,
2008                 l_in_use_max);
2009 
2010   size_t ck_in_use_count = 0;
2011   MonitorList::Iterator iter = _in_use_list.iterator();
2012   while (iter.has_next()) {
2013     ObjectMonitor* mid = iter.next();
2014     chk_in_use_entry(mid, out, error_cnt_p);
2015     ck_in_use_count++;
2016   }
2017 
2018   if (l_in_use_count == ck_in_use_count) {
2019     out->print_cr("in_use_count=" SIZE_FORMAT " equals ck_in_use_count="
2020                   SIZE_FORMAT, l_in_use_count, ck_in_use_count);
2021   } else {
2022     out->print_cr("WARNING: in_use_count=" SIZE_FORMAT " is not equal to "
2023                   "ck_in_use_count=" SIZE_FORMAT, l_in_use_count,
2024                   ck_in_use_count);
2025   }
2026 
2027   size_t ck_in_use_max = _in_use_list.max();
2028   if (l_in_use_max == ck_in_use_max) {
2029     out->print_cr("in_use_max=" SIZE_FORMAT " equals ck_in_use_max="
2030                   SIZE_FORMAT, l_in_use_max, ck_in_use_max);
2031   } else {
2032     out->print_cr("WARNING: in_use_max=" SIZE_FORMAT " is not equal to "
2033                   "ck_in_use_max=" SIZE_FORMAT, l_in_use_max, ck_in_use_max);
2034   }
2035 }
2036 
2037 // Check an in-use monitor entry; log any errors.
2038 void ObjectSynchronizer::chk_in_use_entry(ObjectMonitor* n, outputStream* out,
2039                                           int* error_cnt_p) {
2040   if (n->owner_is_DEFLATER_MARKER()) {
2041     // This could happen when monitor deflation blocks for a safepoint.
2042     return;
2043   }
2044 
2045   if (n->header().value() == 0) {
2046     out->print_cr("ERROR: monitor=" INTPTR_FORMAT ": in-use monitor must "
2047                   "have non-null _header field.", p2i(n));
2048     *error_cnt_p = *error_cnt_p + 1;
2049   }
2050   const oop obj = n->object_peek();
2051   if (obj != nullptr) {
2052     const markWord mark = obj->mark();
2053     if (!mark.has_monitor()) {
2054       out->print_cr("ERROR: monitor=" INTPTR_FORMAT ": in-use monitor's "
2055                     "object does not think it has a monitor: obj="
2056                     INTPTR_FORMAT ", mark=" INTPTR_FORMAT, p2i(n),
2057                     p2i(obj), mark.value());
2058       *error_cnt_p = *error_cnt_p + 1;
2059     }
2060     ObjectMonitor* const obj_mon = mark.monitor();
2061     if (n != obj_mon) {
2062       out->print_cr("ERROR: monitor=" INTPTR_FORMAT ": in-use monitor's "
2063                     "object does not refer to the same monitor: obj="
2064                     INTPTR_FORMAT ", mark=" INTPTR_FORMAT ", obj_mon="
2065                     INTPTR_FORMAT, p2i(n), p2i(obj), mark.value(), p2i(obj_mon));
2066       *error_cnt_p = *error_cnt_p + 1;
2067     }
2068   }
2069 }
2070 
2071 // Log details about ObjectMonitors on the in_use_list. The 'BHL'
2072 // flags indicate why the entry is in-use, 'object' and 'object type'
2073 // indicate the associated object and its type.
2074 void ObjectSynchronizer::log_in_use_monitor_details(outputStream* out, bool log_all) {
2075   if (_in_use_list.count() > 0) {
2076     stringStream ss;
2077     out->print_cr("In-use monitor info:");
2078     out->print_cr("(B -> is_busy, H -> has hash code, L -> lock status)");
2079     out->print_cr("%18s  %s  %18s  %18s",
2080                   "monitor", "BHL", "object", "object type");
2081     out->print_cr("==================  ===  ==================  ==================");
2082 
2083     auto is_interesting = [&](ObjectMonitor* monitor) {
2084       return log_all || monitor->has_owner() || monitor->is_busy();
2085     };
2086 
2087     monitors_iterate([&](ObjectMonitor* monitor) {
2088       if (is_interesting(monitor)) {
2089         const oop obj = monitor->object_peek();
2090         const markWord mark = monitor->header();
2091         ResourceMark rm;
2092         out->print(INTPTR_FORMAT "  %d%d%d  " INTPTR_FORMAT "  %s", p2i(monitor),
2093                    monitor->is_busy(), mark.hash() != 0, monitor->owner() != nullptr,
2094                    p2i(obj), obj == nullptr ? "" : obj->klass()->external_name());
2095         if (monitor->is_busy()) {
2096           out->print(" (%s)", monitor->is_busy_to_string(&ss));
2097           ss.reset();
2098         }
2099         out->cr();
2100       }
2101     });
2102   }
2103 
2104   out->flush();
2105 }