Skip to content

Commit b3faecf

Browse files
committedDec 8, 2021
8276116: C2: optimize long range checks in int counted loops
Reviewed-by: kvn
1 parent fe2ae8e commit b3faecf

File tree

8 files changed

+610
-100
lines changed

8 files changed

+610
-100
lines changed
 

‎src/hotspot/cpu/x86/x86_32.ad

+18
Original file line numberDiff line numberDiff line change
@@ -13130,6 +13130,24 @@ instruct cmovLL_mem_LTGE(cmpOp cmp, flagsReg_long_LTGE flags, eRegL dst, load_lo
1313013130
ins_pipe( pipe_cmov_reg_long );
1313113131
%}
1313213132

13133+
instruct cmovLL_reg_LTGE_U(cmpOpU cmp, flagsReg_ulong_LTGE flags, eRegL dst, eRegL src) %{
13134+
match(Set dst (CMoveL (Binary cmp flags) (Binary dst src)));
13135+
predicate(VM_Version::supports_cmov() && ( _kids[0]->_kids[0]->_leaf->as_Bool()->_test._test == BoolTest::lt || _kids[0]->_kids[0]->_leaf->as_Bool()->_test._test == BoolTest::ge ));
13136+
ins_cost(400);
13137+
expand %{
13138+
cmovLL_reg_LTGE(cmp, flags, dst, src);
13139+
%}
13140+
%}
13141+
13142+
instruct cmovLL_mem_LTGE_U(cmpOpU cmp, flagsReg_ulong_LTGE flags, eRegL dst, load_long_memory src) %{
13143+
match(Set dst (CMoveL (Binary cmp flags) (Binary dst (LoadL src))));
13144+
predicate(VM_Version::supports_cmov() && ( _kids[0]->_kids[0]->_leaf->as_Bool()->_test._test == BoolTest::lt || _kids[0]->_kids[0]->_leaf->as_Bool()->_test._test == BoolTest::ge ));
13145+
ins_cost(500);
13146+
expand %{
13147+
cmovLL_mem_LTGE(cmp, flags, dst, src);
13148+
%}
13149+
%}
13150+
1313313151
// Compare 2 longs and CMOVE ints.
1313413152
instruct cmovII_reg_LTGE(cmpOp cmp, flagsReg_long_LTGE flags, rRegI dst, rRegI src) %{
1313513153
predicate(VM_Version::supports_cmov() && ( _kids[0]->_kids[0]->_leaf->as_Bool()->_test._test == BoolTest::lt || _kids[0]->_kids[0]->_leaf->as_Bool()->_test._test == BoolTest::ge ));

‎src/hotspot/share/opto/compile.cpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -3463,7 +3463,7 @@ void Compile::final_graph_reshaping_main_switch(Node* n, Final_Reshape_Counts& f
34633463
}
34643464
break;
34653465
case Op_Loop:
3466-
assert(!n->as_Loop()->is_transformed_long_inner_loop() || _loop_opts_cnt == 0, "should have been turned into a counted loop");
3466+
assert(!n->as_Loop()->is_loop_nest_inner_loop() || _loop_opts_cnt == 0, "should have been turned into a counted loop");
34673467
case Op_CountedLoop:
34683468
case Op_LongCountedLoop:
34693469
case Op_OuterStripMinedLoop:

‎src/hotspot/share/opto/loopTransform.cpp

+46-17
Original file line numberDiff line numberDiff line change
@@ -1065,7 +1065,7 @@ void IdealLoopTree::policy_unroll_slp_analysis(CountedLoopNode *cl, PhaseIdealLo
10651065
// When TRUE, the estimated node budget is also requested.
10661066
//
10671067
// We will actually perform iteration-splitting, a more powerful form of RCE.
1068-
bool IdealLoopTree::policy_range_check(PhaseIdealLoop* phase, bool provisional) const {
1068+
bool IdealLoopTree::policy_range_check(PhaseIdealLoop* phase, bool provisional, BasicType bt) const {
10691069
if (!provisional && !RangeCheckElimination) return false;
10701070

10711071
// If nodes are depleted, some transform has miscalculated its needs.
@@ -1087,7 +1087,7 @@ bool IdealLoopTree::policy_range_check(PhaseIdealLoop* phase, bool provisional)
10871087

10881088
BaseCountedLoopNode* cl = _head->as_BaseCountedLoop();
10891089
Node *trip_counter = cl->phi();
1090-
BasicType bt = cl->bt();
1090+
assert(!cl->is_LongCountedLoop() || bt == T_LONG, "only long range checks in long counted loops");
10911091

10921092
// Check loop body for tests of trip-counter plus loop-invariant vs
10931093
// loop-invariant.
@@ -1135,7 +1135,7 @@ bool IdealLoopTree::policy_range_check(PhaseIdealLoop* phase, bool provisional)
11351135
}
11361136
}
11371137

1138-
if (!phase->is_scaled_iv_plus_offset(rc_exp, trip_counter, NULL, NULL)) {
1138+
if (!phase->is_scaled_iv_plus_offset(rc_exp, trip_counter, NULL, NULL, bt)) {
11391139
continue;
11401140
}
11411141
}
@@ -1145,7 +1145,9 @@ bool IdealLoopTree::policy_range_check(PhaseIdealLoop* phase, bool provisional)
11451145
if (is_loop_exit(iff)) {
11461146
// Found valid reason to split iterations (if there is room).
11471147
// NOTE: Usually a gross overestimate.
1148-
return provisional || phase->may_require_nodes(est_loop_clone_sz(2));
1148+
// Long range checks cause the loop to be transformed in a loop nest which only causes a fixed number of nodes
1149+
// to be added
1150+
return provisional || bt == T_LONG || phase->may_require_nodes(est_loop_clone_sz(2));
11491151
}
11501152
} // End of is IF
11511153
}
@@ -2508,34 +2510,52 @@ void PhaseIdealLoop::add_constraint(jlong stride_con, jlong scale_con, Node* off
25082510
}
25092511
}
25102512

2513+
bool PhaseIdealLoop::is_iv(Node* exp, Node* iv, BasicType bt) {
2514+
if (exp == iv) {
2515+
return true;
2516+
}
2517+
2518+
if (bt == T_LONG && iv->bottom_type()->isa_int() && exp->Opcode() == Op_ConvI2L && exp->in(1) == iv) {
2519+
return true;
2520+
}
2521+
return false;
2522+
}
2523+
25112524
//------------------------------is_scaled_iv---------------------------------
25122525
// Return true if exp is a constant times an induction var
2513-
bool PhaseIdealLoop::is_scaled_iv(Node* exp, Node* iv, jlong* p_scale, BasicType bt) {
2526+
bool PhaseIdealLoop::is_scaled_iv(Node* exp, Node* iv, jlong* p_scale, BasicType bt, bool* converted) {
25142527
exp = exp->uncast();
25152528
assert(bt == T_INT || bt == T_LONG, "unexpected int type");
2516-
if (exp == iv) {
2529+
if (is_iv(exp, iv, bt)) {
25172530
if (p_scale != NULL) {
25182531
*p_scale = 1;
25192532
}
25202533
return true;
25212534
}
2535+
if (bt == T_LONG && iv->bottom_type()->isa_int() && exp->Opcode() == Op_ConvI2L) {
2536+
exp = exp->in(1);
2537+
bt = T_INT;
2538+
if (converted != NULL) {
2539+
*converted = true;
2540+
}
2541+
}
25222542
int opc = exp->Opcode();
25232543
// Can't use is_Mul() here as it's true for AndI and AndL
25242544
if (opc == Op_Mul(bt)) {
2525-
if (exp->in(1)->uncast() == iv && exp->in(2)->is_Con()) {
2545+
if (is_iv(exp->in(1)->uncast(), iv, bt) && exp->in(2)->is_Con()) {
25262546
if (p_scale != NULL) {
25272547
*p_scale = exp->in(2)->get_integer_as_long(bt);
25282548
}
25292549
return true;
25302550
}
2531-
if (exp->in(2)->uncast() == iv && exp->in(1)->is_Con()) {
2551+
if (is_iv(exp->in(2)->uncast(), iv, bt) && exp->in(1)->is_Con()) {
25322552
if (p_scale != NULL) {
25332553
*p_scale = exp->in(1)->get_integer_as_long(bt);
25342554
}
25352555
return true;
25362556
}
25372557
} else if (opc == Op_LShift(bt)) {
2538-
if (exp->in(1)->uncast() == iv && exp->in(2)->is_Con()) {
2558+
if (is_iv(exp->in(1)->uncast(), iv, bt) && exp->in(2)->is_Con()) {
25392559
if (p_scale != NULL) {
25402560
jint shift_amount = exp->in(2)->get_int();
25412561
if (bt == T_INT) {
@@ -2552,9 +2572,9 @@ bool PhaseIdealLoop::is_scaled_iv(Node* exp, Node* iv, jlong* p_scale, BasicType
25522572

25532573
//-----------------------------is_scaled_iv_plus_offset------------------------------
25542574
// Return true if exp is a simple induction variable expression: k1*iv + (invar + k2)
2555-
bool PhaseIdealLoop::is_scaled_iv_plus_offset(Node* exp, Node* iv, jlong* p_scale, Node** p_offset, BasicType bt, int depth) {
2575+
bool PhaseIdealLoop::is_scaled_iv_plus_offset(Node* exp, Node* iv, jlong* p_scale, Node** p_offset, BasicType bt, bool* converted, int depth) {
25562576
assert(bt == T_INT || bt == T_LONG, "unexpected int type");
2557-
if (is_scaled_iv(exp, iv, p_scale, bt)) {
2577+
if (is_scaled_iv(exp, iv, p_scale, bt, converted)) {
25582578
if (p_offset != NULL) {
25592579
Node *zero = _igvn.integercon(0, bt);
25602580
set_ctrl(zero, C->root());
@@ -2565,13 +2585,13 @@ bool PhaseIdealLoop::is_scaled_iv_plus_offset(Node* exp, Node* iv, jlong* p_scal
25652585
exp = exp->uncast();
25662586
int opc = exp->Opcode();
25672587
if (opc == Op_Add(bt)) {
2568-
if (is_scaled_iv(exp->in(1), iv, p_scale, bt)) {
2588+
if (is_scaled_iv(exp->in(1), iv, p_scale, bt, converted)) {
25692589
if (p_offset != NULL) {
25702590
*p_offset = exp->in(2);
25712591
}
25722592
return true;
25732593
}
2574-
if (is_scaled_iv(exp->in(2), iv, p_scale, bt)) {
2594+
if (is_scaled_iv(exp->in(2), iv, p_scale, bt, converted)) {
25752595
if (p_offset != NULL) {
25762596
*p_offset = exp->in(1);
25772597
}
@@ -2581,7 +2601,7 @@ bool PhaseIdealLoop::is_scaled_iv_plus_offset(Node* exp, Node* iv, jlong* p_scal
25812601
Node* offset2 = NULL;
25822602
if (depth < 2 &&
25832603
is_scaled_iv_plus_offset(exp->in(1), iv, p_scale,
2584-
p_offset != NULL ? &offset2 : NULL, bt, depth+1)) {
2604+
p_offset != NULL ? &offset2 : NULL, bt, converted, depth+1)) {
25852605
if (p_offset != NULL) {
25862606
Node *ctrl_off2 = get_ctrl(offset2);
25872607
Node* offset = AddNode::make(offset2, exp->in(2), bt);
@@ -2592,7 +2612,7 @@ bool PhaseIdealLoop::is_scaled_iv_plus_offset(Node* exp, Node* iv, jlong* p_scal
25922612
}
25932613
}
25942614
} else if (opc == Op_Sub(bt)) {
2595-
if (is_scaled_iv(exp->in(1), iv, p_scale, bt)) {
2615+
if (is_scaled_iv(exp->in(1), iv, p_scale, bt, converted)) {
25962616
if (p_offset != NULL) {
25972617
Node *zero = _igvn.integercon(0, bt);
25982618
set_ctrl(zero, C->root());
@@ -2603,7 +2623,7 @@ bool PhaseIdealLoop::is_scaled_iv_plus_offset(Node* exp, Node* iv, jlong* p_scal
26032623
}
26042624
return true;
26052625
}
2606-
if (is_scaled_iv(exp->in(2), iv, p_scale, bt)) {
2626+
if (is_scaled_iv(exp->in(2), iv, p_scale, bt, converted)) {
26072627
if (p_offset != NULL) {
26082628
// We can't handle a scale of min_jint (or min_jlong) here as -1 * min_jint = min_jint
26092629
if (*p_scale == min_signed_integer(bt)) {
@@ -3432,6 +3452,8 @@ bool IdealLoopTree::iteration_split_impl(PhaseIdealLoop *phase, Node_List &old_n
34323452
} else if (policy_unswitching(phase)) {
34333453
phase->do_unswitching(this, old_new);
34343454
return false; // need to recalculate idom data
3455+
} else if (_head->is_LongCountedLoop()) {
3456+
phase->create_loop_nest(this, old_new);
34353457
}
34363458
return true;
34373459
}
@@ -3475,7 +3497,8 @@ bool IdealLoopTree::iteration_split_impl(PhaseIdealLoop *phase, Node_List &old_n
34753497
// unrolling), plus any needed for RCE purposes.
34763498

34773499
bool should_unroll = policy_unroll(phase);
3478-
bool should_rce = policy_range_check(phase, false);
3500+
bool should_rce = policy_range_check(phase, false, T_INT);
3501+
bool should_rce_long = policy_range_check(phase, false, T_LONG);
34793502

34803503
// If not RCE'ing (iteration splitting), then we do not need a pre-loop.
34813504
// We may still need to peel an initial iteration but we will not
@@ -3490,6 +3513,9 @@ bool IdealLoopTree::iteration_split_impl(PhaseIdealLoop *phase, Node_List &old_n
34903513
// peeling.
34913514
if (should_rce || should_unroll) {
34923515
if (cl->is_normal_loop()) { // Convert to 'pre/main/post' loops
3516+
if (should_rce_long && phase->create_loop_nest(this, old_new)) {
3517+
return true;
3518+
}
34933519
uint estimate = est_loop_clone_sz(3);
34943520
if (!phase->may_require_nodes(estimate)) {
34953521
return false;
@@ -3531,6 +3557,9 @@ bool IdealLoopTree::iteration_split_impl(PhaseIdealLoop *phase, Node_List &old_n
35313557
phase->do_peeling(this, old_new);
35323558
}
35333559
}
3560+
if (should_rce_long) {
3561+
phase->create_loop_nest(this, old_new);
3562+
}
35343563
}
35353564
return true;
35363565
}

‎src/hotspot/share/opto/loopnode.cpp

+195-62
Large diffs are not rendered by default.

‎src/hotspot/share/opto/loopnode.hpp

+26-14
Original file line numberDiff line numberDiff line change
@@ -77,8 +77,8 @@ class LoopNode : public RegionNode {
7777
StripMined = 1<<15,
7878
SubwordLoop = 1<<16,
7979
ProfileTripFailed = 1<<17,
80-
TransformedLongInnerLoop = 1<<18,
81-
TransformedLongOuterLoop = 1<<19};
80+
LoopNestInnerLoop = 1 << 18,
81+
LoopNestLongOuterLoop = 1 << 19};
8282
char _unswitch_count;
8383
enum { _unswitch_max=3 };
8484
char _postloop_flags;
@@ -103,8 +103,8 @@ class LoopNode : public RegionNode {
103103
bool is_strip_mined() const { return _loop_flags & StripMined; }
104104
bool is_profile_trip_failed() const { return _loop_flags & ProfileTripFailed; }
105105
bool is_subword_loop() const { return _loop_flags & SubwordLoop; }
106-
bool is_transformed_long_inner_loop() const { return _loop_flags & TransformedLongInnerLoop; }
107-
bool is_transformed_long_outer_loop() const { return _loop_flags & TransformedLongOuterLoop; }
106+
bool is_loop_nest_inner_loop() const { return _loop_flags & LoopNestInnerLoop; }
107+
bool is_loop_nest_outer_loop() const { return _loop_flags & LoopNestLongOuterLoop; }
108108

109109
void mark_partial_peel_failed() { _loop_flags |= PartialPeelFailed; }
110110
void mark_has_reductions() { _loop_flags |= HasReductions; }
@@ -119,8 +119,8 @@ class LoopNode : public RegionNode {
119119
void clear_strip_mined() { _loop_flags &= ~StripMined; }
120120
void mark_profile_trip_failed() { _loop_flags |= ProfileTripFailed; }
121121
void mark_subword_loop() { _loop_flags |= SubwordLoop; }
122-
void mark_transformed_long_inner_loop() { _loop_flags |= TransformedLongInnerLoop; }
123-
void mark_transformed_long_outer_loop() { _loop_flags |= TransformedLongOuterLoop; }
122+
void mark_loop_nest_inner_loop() { _loop_flags |= LoopNestInnerLoop; }
123+
void mark_loop_nest_outer_loop() { _loop_flags |= LoopNestLongOuterLoop; }
124124

125125
int unswitch_max() { return _unswitch_max; }
126126
int unswitch_count() { return _unswitch_count; }
@@ -216,6 +216,8 @@ class BaseCountedLoopNode : public LoopNode {
216216

217217
virtual BasicType bt() const = 0;
218218

219+
jlong stride_con() const;
220+
219221
static BaseCountedLoopNode* make(Node* entry, Node* backedge, BasicType bt);
220222
};
221223

@@ -364,7 +366,6 @@ class LongCountedLoopNode : public BaseCountedLoopNode {
364366

365367
LongCountedLoopEndNode* loopexit_or_null() const { return (LongCountedLoopEndNode*) BaseCountedLoopNode::loopexit_or_null(); }
366368
LongCountedLoopEndNode* loopexit() const { return (LongCountedLoopEndNode*) BaseCountedLoopNode::loopexit(); }
367-
jlong stride_con() const;
368369
};
369370

370371

@@ -512,6 +513,12 @@ inline Node* BaseCountedLoopNode::phi() const {
512513
return cle != NULL ? cle->phi() : NULL;
513514
}
514515

516+
inline jlong BaseCountedLoopNode::stride_con() const {
517+
BaseCountedLoopEndNode* cle = loopexit_or_null();
518+
return cle != NULL ? cle->stride_con() : 0;
519+
}
520+
521+
515522
//------------------------------LoopLimitNode-----------------------------
516523
// Counted Loop limit node which represents exact final iterator value:
517524
// trip_count = (limit - init_trip + stride - 1)/stride
@@ -710,7 +717,7 @@ class IdealLoopTree : public ResourceObj {
710717
// Return TRUE or FALSE if the loop should be range-check-eliminated.
711718
// Gather a list of IF tests that are dominated by iteration splitting;
712719
// also gather the end of the first split and the start of the 2nd split.
713-
bool policy_range_check(PhaseIdealLoop* phase, bool provisional) const;
720+
bool policy_range_check(PhaseIdealLoop* phase, bool provisional, BasicType bt) const;
714721

715722
// Return TRUE if "iff" is a range check.
716723
bool is_range_check_if(IfNode *iff, PhaseIdealLoop *phase, Invariance& invar DEBUG_ONLY(COMMA ProjNode *predicate_proj)) const;
@@ -1146,8 +1153,8 @@ class PhaseIdealLoop : public PhaseTransform {
11461153

11471154
bool is_counted_loop(Node* x, IdealLoopTree*&loop, BasicType iv_bt);
11481155

1149-
Node* long_loop_replace_long_iv(Node* iv_to_replace, Node* inner_iv, Node* outer_phi, Node* inner_head);
1150-
bool transform_long_counted_loop(IdealLoopTree* loop, Node_List &old_new);
1156+
Node* loop_nest_replace_iv(Node* iv_to_replace, Node* inner_iv, Node* outer_phi, Node* inner_head, BasicType bt);
1157+
bool create_loop_nest(IdealLoopTree* loop, Node_List &old_new);
11511158
#ifdef ASSERT
11521159
bool convert_to_long_loop(Node* cmp, Node* phi, IdealLoopTree* loop);
11531160
#endif
@@ -1248,10 +1255,12 @@ class PhaseIdealLoop : public PhaseTransform {
12481255
void mark_reductions( IdealLoopTree *loop );
12491256

12501257
// Return true if exp is a constant times an induction var
1251-
bool is_scaled_iv(Node* exp, Node* iv, jlong* p_scale, BasicType bt);
1258+
bool is_scaled_iv(Node* exp, Node* iv, jlong* p_scale, BasicType bt, bool* converted);
1259+
1260+
bool is_iv(Node* exp, Node* iv, BasicType bt);
12521261

12531262
// Return true if exp is a scaled induction var plus (or minus) constant
1254-
bool is_scaled_iv_plus_offset(Node* exp, Node* iv, jlong* p_scale, Node** p_offset, BasicType bt, int depth = 0);
1263+
bool is_scaled_iv_plus_offset(Node* exp, Node* iv, jlong* p_scale, Node** p_offset, BasicType bt, bool* converted = NULL, int depth = 0);
12551264
bool is_scaled_iv_plus_offset(Node* exp, Node* iv, int* p_scale, Node** p_offset) {
12561265
jlong long_scale;
12571266
if (is_scaled_iv_plus_offset(exp, iv, &long_scale, p_offset, T_INT)) {
@@ -1610,9 +1619,9 @@ class PhaseIdealLoop : public PhaseTransform {
16101619

16111620
void rpo(Node* start, Node_Stack &stk, VectorSet &visited, Node_List &rpo_list) const;
16121621

1613-
void check_long_counted_loop(IdealLoopTree* loop, Node* x) NOT_DEBUG_RETURN;
1622+
void check_counted_loop_shape(IdealLoopTree* loop, Node* x, BasicType bt) NOT_DEBUG_RETURN;
16141623

1615-
LoopNode* create_inner_head(IdealLoopTree* loop, LongCountedLoopNode* head, LongCountedLoopEndNode* exit_test);
1624+
LoopNode* create_inner_head(IdealLoopTree* loop, BaseCountedLoopNode* head, IfNode* exit_test);
16161625

16171626

16181627
int extract_long_range_checks(const IdealLoopTree* loop, jlong stride_con, int iters_limit, PhiNode* phi,
@@ -1635,6 +1644,9 @@ class PhaseIdealLoop : public PhaseTransform {
16351644
Node* clamp(Node* R, Node* L, Node* H);
16361645

16371646
bool safe_for_if_replacement(const Node* dom) const;
1647+
1648+
void strip_mined_nest_back_to_counted_loop(IdealLoopTree* loop, const BaseCountedLoopNode* head, Node* back_control,
1649+
IfNode*&exit_test, SafePointNode*&safepoint);
16381650
};
16391651

16401652

‎src/hotspot/share/opto/loopopts.cpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -1053,7 +1053,7 @@ Node *PhaseIdealLoop::split_if_with_blocks_pre( Node *n ) {
10531053

10541054
// Do not clone the trip counter through on a CountedLoop
10551055
// (messes up the canonical shape).
1056-
if (((n_blk->is_CountedLoop() || (n_blk->is_Loop() && n_blk->as_Loop()->is_transformed_long_inner_loop())) && n->Opcode() == Op_AddI) ||
1056+
if (((n_blk->is_CountedLoop() || (n_blk->is_Loop() && n_blk->as_Loop()->is_loop_nest_inner_loop())) && n->Opcode() == Op_AddI) ||
10571057
(n_blk->is_LongCountedLoop() && n->Opcode() == Op_AddL)) {
10581058
return n;
10591059
}

‎test/hotspot/jtreg/compiler/c2/irTests/TestLongRangeChecks.java

+39-3
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@
2828

2929
/*
3030
* @test
31-
* @bug 8259609
31+
* @bug 8259609 8276116
3232
* @summary C2: optimize long range checks in long counted loops
3333
* @library /test/lib /
3434
* @run driver compiler.c2.irTests.TestLongRangeChecks
@@ -41,8 +41,8 @@ public static void main(String[] args) {
4141

4242

4343
@Test
44-
@IR(counts = { IRNode.LOOP, "1"})
45-
@IR(failOn = { IRNode.COUNTEDLOOP})
44+
@IR(counts = { IRNode.LOOP, "1" })
45+
@IR(failOn = { IRNode.COUNTEDLOOP })
4646
public static void testStridePosScalePos(long start, long stop, long length, long offset) {
4747
final long scale = 1;
4848
final long stride = 1;
@@ -60,4 +60,40 @@ public static void testStridePosScalePos(long start, long stop, long length, lon
6060
private void testStridePosScalePos_runner() {
6161
testStridePosScalePos(0, 100, 100, 0);
6262
}
63+
64+
@Test
65+
@IR(counts = { IRNode.LOOP, "1" })
66+
@IR(failOn = { IRNode.COUNTEDLOOP })
67+
public static void testStridePosScalePosInIntLoop1(int start, int stop, long length, long offset) {
68+
final long scale = 2;
69+
final int stride = 1;
70+
71+
// Same but with int loop
72+
for (int i = start; i < stop; i += stride) {
73+
Objects.checkIndex(scale * i + offset, length);
74+
}
75+
}
76+
77+
@Run(test = "testStridePosScalePosInIntLoop1")
78+
private void testStridePosScalePosInIntLoop1_runner() {
79+
testStridePosScalePosInIntLoop1(0, 100, 200, 0);
80+
}
81+
82+
@Test
83+
@IR(counts = { IRNode.LOOP, "1" })
84+
@IR(failOn = { IRNode.COUNTEDLOOP })
85+
public static void testStridePosScalePosInIntLoop2(int start, int stop, long length, long offset) {
86+
final int scale = 2;
87+
final int stride = 1;
88+
89+
// Same but with int loop
90+
for (int i = start; i < stop; i += stride) {
91+
Objects.checkIndex(scale * i + offset, length);
92+
}
93+
}
94+
95+
@Run(test = "testStridePosScalePosInIntLoop2")
96+
private void testStridePosScalePosInIntLoop2_runner() {
97+
testStridePosScalePosInIntLoop2(0, 100, 200, 0);
98+
}
6399
}

‎test/hotspot/jtreg/compiler/rangechecks/TestLongRangeCheck.java

+284-2
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@
2323

2424
/**
2525
* @test
26-
* @bug 8259609
26+
* @bug 8259609 8276116
2727
* @summary C2: optimize long range checks in long counted loops
2828
* @requires vm.compiler2.enabled
2929
* @requires vm.compMode != "Xcomp"
@@ -32,7 +32,7 @@
3232
* @build sun.hotspot.WhiteBox
3333
* @run driver jdk.test.lib.helpers.ClassFileInstaller sun.hotspot.WhiteBox
3434
*
35-
* @run main/othervm -ea -Xbootclasspath/a:. -XX:+UnlockDiagnosticVMOptions -XX:+WhiteBoxAPI -XX:-BackgroundCompilation TestLongRangeCheck
35+
* @run main/othervm -ea -Xbootclasspath/a:. -XX:+UnlockDiagnosticVMOptions -XX:+WhiteBoxAPI -XX:-BackgroundCompilation -XX:-UseOnStackReplacement TestLongRangeCheck
3636
*
3737
*/
3838

@@ -193,6 +193,115 @@ public static void main(String[] args) throws Exception {
193193
m.invoke(null, 0, 100, Long.MAX_VALUE, Long.MAX_VALUE - 50, 0, 50);
194194
assertIsCompiled(m);
195195
}
196+
197+
test("testStridePosScalePosInIntLoop", 0, 100, 100, 0);
198+
199+
test("testStrideNegScaleNegInIntLoop", 0, 100, 100, 100);
200+
201+
test("testStrideNegScalePosInIntLoop", 0, 100, 100, 0);
202+
203+
test("testStridePosScaleNegInIntLoop", 0, 100, 100, 99);
204+
205+
test("testStridePosScalePosNotOneInIntLoop", 0, 100, 1090, 0);
206+
207+
test("testStrideNegScaleNegNotOneInIntLoop", 0, 100, 1090, 1100);
208+
209+
test("testStrideNegScalePosNotOneInIntLoop", 0, 100, 1090, 0);
210+
211+
test("testStridePosScaleNegNotOneInIntLoop", 0, 100, 1090, 1089);
212+
213+
v = ((long)Integer.MAX_VALUE / 10000) * 9999;
214+
215+
test("testStridePosNotOneScalePosInIntLoop", -v, v, v * 4, 2 * v);
216+
217+
test("testStrideNegNotOneScaleNegInIntLoop", -v, v, v * 4, 2 * v);
218+
219+
test("testStrideNegNotOneScalePosInIntLoop", -v, v, v * 4, 2 * v);
220+
221+
test("testStridePosNotOneScaleNegInIntLoop", -v, v, v * 4, 2 * v - 1);
222+
223+
// offset causes overflow
224+
{
225+
Method m = newClassLoader().loadClass("TestLongRangeCheck").getDeclaredMethod("testStridePosScalePosInIntLoop", long.class, long.class, long.class, long.class);
226+
m.invoke(null, 0, 100, 100, 0);
227+
compile(m);
228+
229+
m.invoke(null, 0, 100, 100, 0);
230+
assertIsCompiled(m);
231+
try {
232+
m.invoke(null, 0, 100, 100, Long.MAX_VALUE - 50);
233+
throw new RuntimeException("should have thrown");
234+
} catch(InvocationTargetException e) {
235+
if (!(e.getCause() instanceof IndexOutOfBoundsException)) {
236+
throw new RuntimeException("unexpected exception");
237+
}
238+
}
239+
assertIsNotCompiled(m);
240+
}
241+
// no spurious deopt if the range check doesn't fail because not executed
242+
{
243+
Method m = newClassLoader().loadClass("TestLongRangeCheck").getDeclaredMethod("testStridePosScalePosConditional", long.class, long.class, long.class, long.class, long.class, long.class);
244+
m.invoke(null, 0, 100, 100, 0, 0, 100);
245+
compile(m);
246+
247+
m.invoke(null, 0, 100, 100, -50, 50, 100);
248+
assertIsCompiled(m);
249+
}
250+
{
251+
Method m = newClassLoader().loadClass("TestLongRangeCheck").getDeclaredMethod("testStridePosScalePosConditional", long.class, long.class, long.class, long.class, long.class, long.class);
252+
m.invoke(null, 0, 100, 100, 0, 0, 100);
253+
compile(m);
254+
255+
m.invoke(null, 0, 100, Long.MAX_VALUE, Long.MAX_VALUE - 50, 0, 50);
256+
assertIsCompiled(m);
257+
}
258+
259+
test("testStridePosScalePosNotOneInIntLoop2", 0, 100, 1090, 0);
260+
261+
test("testStrideNegScaleNegNotOneInIntLoop2", 0, 100, 1090, 1100);
262+
263+
test("testStrideNegScalePosNotOneInIntLoop2", 0, 100, 1090, 0);
264+
265+
test("testStridePosScaleNegNotOneInIntLoop2", 0, 100, 1090, 1089);
266+
267+
{
268+
Method m = newClassLoader().loadClass("TestLongRangeCheck").getDeclaredMethod("testStridePosScalePosInIntLoopOverflow", long.class, long.class, long.class, long.class);
269+
long stride = 1 << 14;
270+
long scale = 1 << 15;
271+
long offset = stride * scale * 4;
272+
long length = offset + stride * scale * 3 + 1;
273+
long stop = stride * 5;
274+
275+
m.invoke(null, 0, stop, length, offset);
276+
compile(m);
277+
278+
m.invoke(null, 0, stop, length, offset);
279+
// deoptimizes even though no range check fails
280+
}
281+
{
282+
Method m = newClassLoader().loadClass("TestLongRangeCheck").getDeclaredMethod("testStridePosScalePosInIntLoopOverflow", long.class, long.class, long.class, long.class);
283+
long stride = 1 << 14;
284+
long scale = 1 << 15;
285+
long offset = stride * scale * 4;
286+
long length = offset + stride * scale * 3 + 1;
287+
long stop = stride * 5;
288+
289+
m.invoke(null, 0, stop, length, offset);
290+
compile(m);
291+
292+
offset = 0;
293+
stop = stride * 5;
294+
295+
try {
296+
m.invoke(null, 0, stop, length, offset);
297+
throw new RuntimeException("should have thrown");
298+
} catch(InvocationTargetException e) {
299+
if (!(e.getCause() instanceof IndexOutOfBoundsException)) {
300+
throw new RuntimeException("unexpected exception");
301+
}
302+
}
303+
assertIsNotCompiled(m);
304+
}
196305
}
197306

198307
public static void testStridePosScalePos(long start, long stop, long length, long offset) {
@@ -301,4 +410,177 @@ public static void testStridePosScalePosConditional(long start, long stop, long
301410
}
302411
}
303412
}
413+
414+
private static void checkInputs(long... inputs) {
415+
for (int i = 0; i < inputs.length; i++) {
416+
if ((long)((int)inputs[i]) != inputs[i]) {
417+
throw new RuntimeException("bad arguments");
418+
}
419+
}
420+
}
421+
422+
public static void testStridePosScalePosInIntLoop(long start, long stop, long length, long offset) {
423+
checkInputs(start, stop);
424+
final long scale = 1;
425+
final int stride = 1;
426+
for (int i = (int)start; i < (int)stop; i += stride) {
427+
Preconditions.checkIndex(scale * i + offset, length, null);
428+
}
429+
}
430+
431+
public static void testStrideNegScaleNegInIntLoop(long start, long stop, long length, long offset) {
432+
checkInputs(start, stop);
433+
final long scale = -1;
434+
final int stride = 1;
435+
for (int i = (int)stop; i > (int)start; i -= stride) {
436+
Preconditions.checkIndex(scale * i + offset, length, null);
437+
}
438+
}
439+
440+
public static void testStrideNegScalePosInIntLoop(long start, long stop, long length, long offset) {
441+
checkInputs(start, stop);
442+
final long scale = 1;
443+
final int stride = 1;
444+
for (int i = (int)(stop-1); i >= (int)start; i -= stride) {
445+
Preconditions.checkIndex(scale * i + offset, length, null);
446+
}
447+
}
448+
449+
public static void testStridePosScaleNegInIntLoop(long start, long stop, long length, long offset) {
450+
checkInputs(start, stop);
451+
final long scale = -1;
452+
final int stride = 1;
453+
for (int i = (int)start; i < (int)stop; i += stride) {
454+
Preconditions.checkIndex(scale * i + offset, length, null);
455+
}
456+
}
457+
458+
public static void testStridePosScalePosNotOneInIntLoop(long start, long stop, long length, long offset) {
459+
checkInputs(start, stop);
460+
final long scale = 11;
461+
final int stride = 1;
462+
for (int i = (int)start; i < (int)stop; i += stride) {
463+
Preconditions.checkIndex(scale * i + offset, length, null);
464+
}
465+
}
466+
467+
public static void testStrideNegScaleNegNotOneInIntLoop(long start, long stop, long length, long offset) {
468+
checkInputs(start, stop);
469+
final long scale = -11;
470+
final int stride = 1;
471+
for (int i = (int)stop; i > (int)start; i -= stride) {
472+
Preconditions.checkIndex(scale * i + offset, length, null);
473+
}
474+
}
475+
476+
public static void testStrideNegScalePosNotOneInIntLoop(long start, long stop, long length, long offset) {
477+
checkInputs(start, stop);
478+
final long scale = 11;
479+
final int stride = 1;
480+
for (int i = (int)(stop-1); i >= (int)start; i -= stride) {
481+
Preconditions.checkIndex(scale * i + offset, length, null);
482+
}
483+
}
484+
485+
public static void testStridePosScaleNegNotOneInIntLoop(long start, long stop, long length, long offset) {
486+
checkInputs(start, stop);
487+
final long scale = -11;
488+
final int stride = 1;
489+
for (int i = (int)start; i < (int)stop; i += stride) {
490+
Preconditions.checkIndex(scale * i + offset, length, null);
491+
}
492+
}
493+
494+
public static void testStridePosNotOneScalePosInIntLoop(long start, long stop, long length, long offset) {
495+
checkInputs(start, stop);
496+
final long scale = 2;
497+
final int stride = Integer.MAX_VALUE / 10000;
498+
for (int i = (int)start; i < (int)stop; i += stride) {
499+
Preconditions.checkIndex(scale * i + offset, length, null);
500+
}
501+
}
502+
503+
public static void testStrideNegNotOneScaleNegInIntLoop(long start, long stop, long length, long offset) {
504+
checkInputs(start, stop);
505+
final long scale = -2;
506+
final int stride = Integer.MAX_VALUE / 10000;
507+
for (int i = (int)stop; i > (int)start; i -= stride) {
508+
Preconditions.checkIndex(scale * i + offset, length, null);
509+
}
510+
}
511+
512+
public static void testStrideNegNotOneScalePosInIntLoop(long start, long stop, long length, long offset) {
513+
checkInputs(start, stop);
514+
final long scale = 2;
515+
final int stride = Integer.MAX_VALUE / 10000;
516+
for (int i = (int)(stop-1); i >= (int)start; i -= stride) {
517+
Preconditions.checkIndex(scale * i + offset, length, null);
518+
}
519+
}
520+
521+
public static void testStridePosNotOneScaleNegInIntLoop(long start, long stop, long length, long offset) {
522+
checkInputs(start, stop);
523+
final long scale = -2;
524+
final int stride = Integer.MAX_VALUE / 10000;
525+
for (int i = (int)start; i < (int)stop; i += stride) {
526+
Preconditions.checkIndex(scale * i + offset, length, null);
527+
}
528+
}
529+
530+
public static void testStridePosScalePosConditionalInIntLoop(long start, long stop, long length, long offset, long start2, long stop2) {
531+
checkInputs(start, stop, start2, stop2);
532+
Preconditions.checkIndex(0, length, null);
533+
final long scale = 1;
534+
final int stride = 1;
535+
for (int i = (int)start; i < (int)stop; i += stride) {
536+
if (i >= (int)start2 && i < (int)stop2) {
537+
Preconditions.checkIndex(scale * i + offset, length, null);
538+
}
539+
}
540+
}
541+
542+
public static void testStridePosScalePosNotOneInIntLoop2(long start, long stop, long length, long offset) {
543+
checkInputs(start, stop);
544+
final int scale = 11;
545+
final int stride = 1;
546+
for (int i = (int)start; i < (int)stop; i += stride) {
547+
Preconditions.checkIndex(scale * i + offset, length, null);
548+
}
549+
}
550+
551+
public static void testStrideNegScaleNegNotOneInIntLoop2(long start, long stop, long length, long offset) {
552+
checkInputs(start, stop);
553+
final int scale = -11;
554+
final int stride = 1;
555+
for (int i = (int)stop; i > (int)start; i -= stride) {
556+
Preconditions.checkIndex(scale * i + offset, length, null);
557+
}
558+
}
559+
560+
public static void testStrideNegScalePosNotOneInIntLoop2(long start, long stop, long length, long offset) {
561+
checkInputs(start, stop);
562+
final int scale = 11;
563+
final int stride = 1;
564+
for (int i = (int)(stop-1); i >= (int)start; i -= stride) {
565+
Preconditions.checkIndex(scale * i + offset, length, null);
566+
}
567+
}
568+
569+
public static void testStridePosScaleNegNotOneInIntLoop2(long start, long stop, long length, long offset) {
570+
checkInputs(start, stop);
571+
final int scale = -11;
572+
final int stride = 1;
573+
for (int i = (int)start; i < (int)stop; i += stride) {
574+
Preconditions.checkIndex(scale * i + offset, length, null);
575+
}
576+
}
577+
578+
public static void testStridePosScalePosInIntLoopOverflow(long start, long stop, long length, long offset) {
579+
checkInputs(start, stop);
580+
final int scale = 1 << 15;
581+
final int stride = 1 << 14;
582+
for (int i = (int)start; i < (int)stop; i += stride) {
583+
Preconditions.checkIndex(scale * i + offset, length, null);
584+
}
585+
}
304586
}

0 commit comments

Comments
 (0)
Please sign in to comment.