Skip to content

Commit d93b238

Browse files
committedNov 18, 2021
8277180: Intrinsify recursive ObjectMonitor locking for C2 x64 and A64
Reviewed-by: aph, ngasson
1 parent 00c388b commit d93b238

File tree

2 files changed

+38
-13
lines changed

2 files changed

+38
-13
lines changed
 

‎src/hotspot/cpu/aarch64/aarch64.ad

+22-4
Original file line numberDiff line numberDiff line change
@@ -3945,7 +3945,7 @@ encode %{
39453945
// Try to CAS m->owner from NULL to current thread.
39463946
__ add(tmp, disp_hdr, (ObjectMonitor::owner_offset_in_bytes()-markWord::monitor_value));
39473947
__ cmpxchg(tmp, zr, rthread, Assembler::xword, /*acquire*/ true,
3948-
/*release*/ true, /*weak*/ false, noreg); // Sets flags for result
3948+
/*release*/ true, /*weak*/ false, rscratch1); // Sets flags for result
39493949

39503950
// Store a non-null value into the box to avoid looking like a re-entrant
39513951
// lock. The fast-path monitor unlock code checks for
@@ -3954,6 +3954,15 @@ encode %{
39543954
__ mov(tmp, (address)markWord::unused_mark().value());
39553955
__ str(tmp, Address(box, BasicLock::displaced_header_offset_in_bytes()));
39563956

3957+
__ br(Assembler::EQ, cont); // CAS success means locking succeeded
3958+
3959+
__ cmp(rscratch1, rthread);
3960+
__ br(Assembler::NE, cont); // Check for recursive locking
3961+
3962+
// Recursive lock case
3963+
__ increment(Address(disp_hdr, ObjectMonitor::recursions_offset_in_bytes() - markWord::monitor_value), 1);
3964+
// flag == EQ still from the cmp above, checking if this is a reentrant lock
3965+
39573966
__ bind(cont);
39583967
// flag == EQ indicates success
39593968
// flag == NE indicates failure
@@ -3997,11 +4006,20 @@ encode %{
39974006
__ add(tmp, tmp, -(int)markWord::monitor_value); // monitor
39984007
__ ldr(rscratch1, Address(tmp, ObjectMonitor::owner_offset_in_bytes()));
39994008
__ ldr(disp_hdr, Address(tmp, ObjectMonitor::recursions_offset_in_bytes()));
4000-
__ eor(rscratch1, rscratch1, rthread); // Will be 0 if we are the owner.
4001-
__ orr(rscratch1, rscratch1, disp_hdr); // Will be 0 if there are 0 recursions
4002-
__ cmp(rscratch1, zr); // Sets flags for result
4009+
4010+
Label notRecursive;
4011+
__ cmp(rscratch1, rthread);
40034012
__ br(Assembler::NE, cont);
40044013

4014+
__ cbz(disp_hdr, notRecursive);
4015+
4016+
// Recursive lock
4017+
__ sub(disp_hdr, disp_hdr, 1u);
4018+
__ str(disp_hdr, Address(tmp, ObjectMonitor::recursions_offset_in_bytes()));
4019+
// flag == EQ was set in the ownership check above
4020+
__ b(cont);
4021+
4022+
__ bind(notRecursive);
40054023
__ ldr(rscratch1, Address(tmp, ObjectMonitor::EntryList_offset_in_bytes()));
40064024
__ ldr(disp_hdr, Address(tmp, ObjectMonitor::cxq_offset_in_bytes()));
40074025
__ orr(rscratch1, rscratch1, disp_hdr); // Will be 0 if both are 0.

‎src/hotspot/cpu/x86/c2_MacroAssembler_x86.cpp

+16-9
Original file line numberDiff line numberDiff line change
@@ -574,8 +574,13 @@ void C2_MacroAssembler::fast_lock(Register objReg, Register boxReg, Register tmp
574574
// Unconditionally set box->_displaced_header = markWord::unused_mark().
575575
// Without cast to int32_t this style of movptr will destroy r10 which is typically obj.
576576
movptr(Address(boxReg, 0), (int32_t)intptr_t(markWord::unused_mark().value()));
577-
// Intentional fall-through into DONE_LABEL ...
578577
// Propagate ICC.ZF from CAS above into DONE_LABEL.
578+
jcc(Assembler::equal, DONE_LABEL); // CAS above succeeded; propagate ZF = 1 (success)
579+
580+
cmpptr(r15_thread, rax); // Check if we are already the owner (recursive lock)
581+
jcc(Assembler::notEqual, DONE_LABEL); // If not recursive, ZF = 0 at this point (fail)
582+
incq(Address(scrReg, OM_OFFSET_NO_MONITOR_VALUE_TAG(recursions)));
583+
xorq(rax, rax); // Set ZF = 1 (success) for recursive lock, denoting locking success
579584
#endif // _LP64
580585
#if INCLUDE_RTM_OPT
581586
} // use_rtm()
@@ -670,10 +675,6 @@ void C2_MacroAssembler::fast_unlock(Register objReg, Register boxReg, Register t
670675
// Refer to the comments in synchronizer.cpp for how we might encode extra
671676
// state in _succ so we can avoid fetching EntryList|cxq.
672677
//
673-
// I'd like to add more cases in fast_lock() and fast_unlock() --
674-
// such as recursive enter and exit -- but we have to be wary of
675-
// I$ bloat, T$ effects and BP$ effects.
676-
//
677678
// If there's no contention try a 1-0 exit. That is, exit without
678679
// a costly MEMBAR or CAS. See synchronizer.cpp for details on how
679680
// we detect and recover from the race that the 1-0 exit admits.
@@ -721,9 +722,16 @@ void C2_MacroAssembler::fast_unlock(Register objReg, Register boxReg, Register t
721722
bind (CheckSucc);
722723
#else // _LP64
723724
// It's inflated
724-
xorptr(boxReg, boxReg);
725-
orptr(boxReg, Address(tmpReg, OM_OFFSET_NO_MONITOR_VALUE_TAG(recursions)));
726-
jccb (Assembler::notZero, DONE_LABEL);
725+
Label LNotRecursive, LSuccess, LGoSlowPath;
726+
727+
cmpptr(Address(tmpReg, OM_OFFSET_NO_MONITOR_VALUE_TAG(recursions)), 0);
728+
jccb(Assembler::equal, LNotRecursive);
729+
730+
// Recursive inflated unlock
731+
decq(Address(tmpReg, OM_OFFSET_NO_MONITOR_VALUE_TAG(recursions)));
732+
jmpb(LSuccess);
733+
734+
bind(LNotRecursive);
727735
movptr(boxReg, Address(tmpReg, OM_OFFSET_NO_MONITOR_VALUE_TAG(cxq)));
728736
orptr(boxReg, Address(tmpReg, OM_OFFSET_NO_MONITOR_VALUE_TAG(EntryList)));
729737
jccb (Assembler::notZero, CheckSucc);
@@ -732,7 +740,6 @@ void C2_MacroAssembler::fast_unlock(Register objReg, Register boxReg, Register t
732740
jmpb (DONE_LABEL);
733741

734742
// Try to avoid passing control into the slow_path ...
735-
Label LSuccess, LGoSlowPath ;
736743
bind (CheckSucc);
737744

738745
// The following optional optimization can be elided if necessary

0 commit comments

Comments
 (0)
Please sign in to comment.