Skip to content

Commit b629782

Browse files
author
Igor Veresov
committedMar 4, 2022
8279886: C1: Turn off SelectivePhiFunctions in presence of irreducible loops
Reviewed-by: kvn, dlong
1 parent 7e1c67d commit b629782

File tree

5 files changed

+56
-36
lines changed

5 files changed

+56
-36
lines changed
 

‎src/hotspot/share/c1/c1_Compilation.cpp

+1
Original file line numberDiff line numberDiff line change
@@ -560,6 +560,7 @@ Compilation::Compilation(AbstractCompiler* compiler, ciEnv* env, ciMethod* metho
560560
, _has_exception_handlers(false)
561561
, _has_fpu_code(true) // pessimistic assumption
562562
, _has_unsafe_access(false)
563+
, _has_irreducible_loops(false)
563564
, _would_profile(false)
564565
, _has_method_handle_invokes(false)
565566
, _has_reserved_stack_access(method->has_reserved_stack_access())

‎src/hotspot/share/c1/c1_Compilation.hpp

+3
Original file line numberDiff line numberDiff line change
@@ -77,6 +77,7 @@ class Compilation: public StackObj {
7777
bool _has_exception_handlers;
7878
bool _has_fpu_code;
7979
bool _has_unsafe_access;
80+
bool _has_irreducible_loops;
8081
bool _would_profile;
8182
bool _has_method_handle_invokes; // True if this method has MethodHandle invokes.
8283
bool _has_reserved_stack_access;
@@ -135,6 +136,7 @@ class Compilation: public StackObj {
135136
bool has_exception_handlers() const { return _has_exception_handlers; }
136137
bool has_fpu_code() const { return _has_fpu_code; }
137138
bool has_unsafe_access() const { return _has_unsafe_access; }
139+
bool has_irreducible_loops() const { return _has_irreducible_loops; }
138140
int max_vector_size() const { return 0; }
139141
ciMethod* method() const { return _method; }
140142
int osr_bci() const { return _osr_bci; }
@@ -162,6 +164,7 @@ class Compilation: public StackObj {
162164
void set_has_exception_handlers(bool f) { _has_exception_handlers = f; }
163165
void set_has_fpu_code(bool f) { _has_fpu_code = f; }
164166
void set_has_unsafe_access(bool f) { _has_unsafe_access = f; }
167+
void set_has_irreducible_loops(bool f) { _has_irreducible_loops = f; }
165168
void set_would_profile(bool f) { _would_profile = f; }
166169
void set_has_access_indexed(bool f) { _has_access_indexed = f; }
167170
// Add a set of exception handlers covering the given PC offset

‎src/hotspot/share/c1/c1_GraphBuilder.cpp

+45-31
Original file line numberDiff line numberDiff line change
@@ -59,7 +59,7 @@ class BlockListBuilder {
5959
// fields used by mark_loops
6060
ResourceBitMap _active; // for iteration of control flow graph
6161
ResourceBitMap _visited; // for iteration of control flow graph
62-
intArray _loop_map; // caches the information if a block is contained in a loop
62+
GrowableArray<ResourceBitMap> _loop_map; // caches the information if a block is contained in a loop
6363
int _next_loop_index; // next free loop number
6464
int _next_block_number; // for reverse postorder numbering of blocks
6565

@@ -84,7 +84,7 @@ class BlockListBuilder {
8484

8585
void make_loop_header(BlockBegin* block);
8686
void mark_loops();
87-
int mark_loops(BlockBegin* b, bool in_subroutine);
87+
BitMap& mark_loops(BlockBegin* b, bool in_subroutine);
8888

8989
// debugging
9090
#ifndef PRODUCT
@@ -376,17 +376,36 @@ void BlockListBuilder::mark_loops() {
376376

377377
_active.initialize(BlockBegin::number_of_blocks());
378378
_visited.initialize(BlockBegin::number_of_blocks());
379-
_loop_map = intArray(BlockBegin::number_of_blocks(), BlockBegin::number_of_blocks(), 0);
379+
_loop_map = GrowableArray<ResourceBitMap>(BlockBegin::number_of_blocks(), BlockBegin::number_of_blocks(), ResourceBitMap());
380+
for (int i = 0; i < BlockBegin::number_of_blocks(); i++) {
381+
_loop_map.at(i).initialize(BlockBegin::number_of_blocks());
382+
}
380383
_next_loop_index = 0;
381384
_next_block_number = _blocks.length();
382385

383-
// recursively iterate the control flow graph
384-
mark_loops(_bci2block->at(0), false);
386+
// The loop detection algorithm works as follows:
387+
// - We maintain the _loop_map, where for each block we have a bitmap indicating which loops contain this block.
388+
// - The CFG is recursively traversed (depth-first) and if we detect a loop, we assign the loop a unique number that is stored
389+
// in the bitmap associated with the loop header block. Until we return back through that loop header the bitmap contains
390+
// only a single bit corresponding to the loop number.
391+
// - The bit is then propagated for all the blocks in the loop after we exit them (post-order). There could be multiple bits
392+
// of course in case of nested loops.
393+
// - When we exit the loop header we remove that single bit and assign the real loop state for it.
394+
// - Now, the tricky part here is how we detect irriducible loops. In the algorithm above the loop state bits
395+
// are propagated to the predecessors. If we encounter an irreducible loop (a loop with multiple heads) we would see
396+
// a node with some loop bit set that would then propagate back and be never cleared because we would
397+
// never go back through the original loop header. Therefore if there are any irreducible loops the bits in the states
398+
// for these loops are going to propagate back to the root.
399+
BitMap& loop_state = mark_loops(_bci2block->at(0), false);
400+
if (!loop_state.is_empty()) {
401+
compilation()->set_has_irreducible_loops(true);
402+
}
385403
assert(_next_block_number >= 0, "invalid block numbers");
386404

387405
// Remove dangling Resource pointers before the ResourceMark goes out-of-scope.
388406
_active.resize(0);
389407
_visited.resize(0);
408+
_loop_map.clear();
390409
}
391410

392411
void BlockListBuilder::make_loop_header(BlockBegin* block) {
@@ -398,19 +417,17 @@ void BlockListBuilder::make_loop_header(BlockBegin* block) {
398417
if (!block->is_set(BlockBegin::parser_loop_header_flag)) {
399418
block->set(BlockBegin::parser_loop_header_flag);
400419

401-
assert(_loop_map.at(block->block_id()) == 0, "must not be set yet");
402-
assert(0 <= _next_loop_index && _next_loop_index < BitsPerInt, "_next_loop_index is used as a bit-index in integer");
403-
_loop_map.at_put(block->block_id(), 1 << _next_loop_index);
404-
if (_next_loop_index < 31) _next_loop_index++;
420+
assert(_loop_map.at(block->block_id()).is_empty(), "must not be set yet");
421+
assert(0 <= _next_loop_index && _next_loop_index < BlockBegin::number_of_blocks(), "_next_loop_index is too large");
422+
_loop_map.at(block->block_id()).set_bit(_next_loop_index++);
405423
} else {
406424
// block already marked as loop header
407-
assert(is_power_of_2((unsigned int)_loop_map.at(block->block_id())), "exactly one bit must be set");
425+
assert(_loop_map.at(block->block_id()).count_one_bits() == 1, "exactly one bit must be set");
408426
}
409427
}
410428

411-
int BlockListBuilder::mark_loops(BlockBegin* block, bool in_subroutine) {
429+
BitMap& BlockListBuilder::mark_loops(BlockBegin* block, bool in_subroutine) {
412430
int block_id = block->block_id();
413-
414431
if (_visited.at(block_id)) {
415432
if (_active.at(block_id)) {
416433
// reached block via backward branch
@@ -428,10 +445,11 @@ int BlockListBuilder::mark_loops(BlockBegin* block, bool in_subroutine) {
428445
_visited.set_bit(block_id);
429446
_active.set_bit(block_id);
430447

431-
intptr_t loop_state = 0;
448+
ResourceMark rm;
449+
ResourceBitMap loop_state(BlockBegin::number_of_blocks());
432450
for (int i = number_of_successors(block) - 1; i >= 0; i--) {
433451
// recursively process all successors
434-
loop_state |= mark_loops(successor_at(block, i), in_subroutine);
452+
loop_state.set_union(mark_loops(successor_at(block, i), in_subroutine));
435453
}
436454

437455
// clear active-bit after all successors are processed
@@ -441,26 +459,22 @@ int BlockListBuilder::mark_loops(BlockBegin* block, bool in_subroutine) {
441459
block->set_depth_first_number(_next_block_number);
442460
_next_block_number--;
443461

444-
if (loop_state != 0 || in_subroutine ) {
462+
if (!loop_state.is_empty() || in_subroutine ) {
445463
// block is contained at least in one loop, so phi functions are necessary
446464
// phi functions are also necessary for all locals stored in a subroutine
447465
scope()->requires_phi_function().set_union(block->stores_to_locals());
448466
}
449467

450468
if (block->is_set(BlockBegin::parser_loop_header_flag)) {
451-
int header_loop_state = _loop_map.at(block_id);
452-
assert(is_power_of_2((unsigned)header_loop_state), "exactly one bit must be set");
453-
454-
// If the highest bit is set (i.e. when integer value is negative), the method
455-
// has 32 or more loops. This bit is never cleared because it is used for multiple loops
456-
if (header_loop_state >= 0) {
457-
clear_bits(loop_state, header_loop_state);
458-
}
469+
BitMap& header_loop_state = _loop_map.at(block_id);
470+
assert(header_loop_state.count_one_bits() == 1, "exactly one bit must be set");
471+
// remove the bit with the loop number for the state (header is outside of the loop)
472+
loop_state.set_difference(header_loop_state);
459473
}
460474

461475
// cache and return loop information for this block
462-
_loop_map.at_put(block_id, loop_state);
463-
return loop_state;
476+
_loop_map.at(block_id).set_from(loop_state);
477+
return _loop_map.at(block_id);
464478
}
465479

466480
inline int BlockListBuilder::number_of_successors(BlockBegin* block)
@@ -2496,7 +2510,7 @@ XHandlers* GraphBuilder::handle_exception(Instruction* instruction) {
24962510
// The only test case we've seen so far which exhibits this
24972511
// problem is caught by the infinite recursion test in
24982512
// GraphBuilder::jsr() if the join doesn't work.
2499-
if (!entry->try_merge(cur_state)) {
2513+
if (!entry->try_merge(cur_state, compilation()->has_irreducible_loops())) {
25002514
BAILOUT_("error while joining with exception handler, prob. due to complicated jsr/rets", exception_handlers);
25012515
}
25022516

@@ -2982,7 +2996,7 @@ BlockEnd* GraphBuilder::iterate_bytecodes_for_block(int bci) {
29822996
BlockBegin* sux = end->sux_at(i);
29832997
assert(sux->is_predecessor(block()), "predecessor missing");
29842998
// be careful, bailout if bytecodes are strange
2985-
if (!sux->try_merge(end->state())) BAILOUT_("block join failed", NULL);
2999+
if (!sux->try_merge(end->state(), compilation()->has_irreducible_loops())) BAILOUT_("block join failed", NULL);
29863000
scope_data()->add_to_work_list(end->sux_at(i));
29873001
}
29883002

@@ -3136,7 +3150,7 @@ BlockBegin* GraphBuilder::setup_start_block(int osr_bci, BlockBegin* std_entry,
31363150

31373151
if (base->std_entry()->state() == NULL) {
31383152
// setup states for header blocks
3139-
base->std_entry()->merge(state);
3153+
base->std_entry()->merge(state, compilation()->has_irreducible_loops());
31403154
}
31413155

31423156
assert(base->std_entry()->state() != NULL, "");
@@ -3219,7 +3233,7 @@ void GraphBuilder::setup_osr_entry_block() {
32193233
Goto* g = new Goto(target, false);
32203234
append(g);
32213235
_osr_entry->set_end(g);
3222-
target->merge(_osr_entry->end()->state());
3236+
target->merge(_osr_entry->end()->state(), compilation()->has_irreducible_loops());
32233237

32243238
scope_data()->set_stream(NULL);
32253239
}
@@ -3278,7 +3292,7 @@ GraphBuilder::GraphBuilder(Compilation* compilation, IRScope* scope)
32783292

32793293
// setup state for std entry
32803294
_initial_state = state_at_entry();
3281-
start_block->merge(_initial_state);
3295+
start_block->merge(_initial_state, compilation->has_irreducible_loops());
32823296

32833297
// End nulls still exist here
32843298

@@ -4029,7 +4043,7 @@ bool GraphBuilder::try_inline_full(ciMethod* callee, bool holder_known, bool ign
40294043
// the entry bci for the callee instead of the call site bci.
40304044
append_with_bci(goto_callee, 0);
40314045
_block->set_end(goto_callee);
4032-
callee_start_block->merge(callee_state);
4046+
callee_start_block->merge(callee_state, compilation()->has_irreducible_loops());
40334047

40344048
_last = _block = callee_start_block;
40354049

‎src/hotspot/share/c1/c1_Instruction.cpp

+2-3
Original file line numberDiff line numberDiff line change
@@ -719,7 +719,7 @@ void BlockBegin::block_values_do(ValueVisitor* f) {
719719
#endif
720720

721721

722-
bool BlockBegin::try_merge(ValueStack* new_state) {
722+
bool BlockBegin::try_merge(ValueStack* new_state, bool has_irreducible_loops) {
723723
TRACE_PHI(tty->print_cr("********** try_merge for block B%d", block_id()));
724724

725725
// local variables used for state iteration
@@ -760,10 +760,9 @@ bool BlockBegin::try_merge(ValueStack* new_state) {
760760
}
761761

762762
BitMap& requires_phi_function = new_state->scope()->requires_phi_function();
763-
764763
for_each_local_value(new_state, index, new_value) {
765764
bool requires_phi = requires_phi_function.at(index) || (new_value->type()->is_double_word() && requires_phi_function.at(index + 1));
766-
if (requires_phi || !SelectivePhiFunctions) {
765+
if (requires_phi || !SelectivePhiFunctions || has_irreducible_loops) {
767766
new_state->setup_phi_for_local(this, index);
768767
TRACE_PHI(tty->print_cr("creating phi-function %c%d for local %d", new_state->local_at(index)->type()->tchar(), new_state->local_at(index)->id(), index));
769768
}

‎src/hotspot/share/c1/c1_Instruction.hpp

+5-2
Original file line numberDiff line numberDiff line change
@@ -1779,8 +1779,11 @@ LEAF(BlockBegin, StateSplit)
17791779
int loop_index() const { return _loop_index; }
17801780

17811781
// merging
1782-
bool try_merge(ValueStack* state); // try to merge states at block begin
1783-
void merge(ValueStack* state) { bool b = try_merge(state); assert(b, "merge failed"); }
1782+
bool try_merge(ValueStack* state, bool has_irreducible_loops); // try to merge states at block begin
1783+
void merge(ValueStack* state, bool has_irreducible_loops) {
1784+
bool b = try_merge(state, has_irreducible_loops);
1785+
assert(b, "merge failed");
1786+
}
17841787

17851788
// debugging
17861789
void print_block() PRODUCT_RETURN;

0 commit comments

Comments
 (0)
Please sign in to comment.