@@ -118,9 +118,20 @@ IfNode* PhaseIdealLoop::find_unswitching_candidate(const IdealLoopTree *loop) co
118
118
// execute.
119
119
void PhaseIdealLoop::do_unswitching (IdealLoopTree *loop, Node_List &old_new) {
120
120
121
- // Find first invariant test that doesn't exit the loop
122
121
LoopNode *head = loop->_head ->as_Loop ();
123
-
122
+ Node* entry = head->skip_strip_mined ()->in (LoopNode::EntryControl);
123
+ if (find_predicate_insertion_point (entry, Deoptimization::Reason_loop_limit_check) != NULL
124
+ || (UseProfiledLoopPredicate && find_predicate_insertion_point (entry, Deoptimization::Reason_profile_predicate) != NULL )
125
+ || (UseLoopPredicate && find_predicate_insertion_point (entry, Deoptimization::Reason_predicate) != NULL )) {
126
+ assert (entry->is_IfProj (), " sanity - must be ifProj since there is at least one predicate" );
127
+ if (entry->outcnt () > 1 ) {
128
+ // Bailout if there are loop predicates from which there are additional control dependencies (i.e. from
129
+ // loop entry 'entry') to previously partially peeled statements since this case is not handled and can lead
130
+ // to wrong execution. Remove this bailout, once this is fixed.
131
+ return ;
132
+ }
133
+ }
134
+ // Find first invariant test that doesn't exit the loop
124
135
IfNode* unswitch_iff = find_unswitching_candidate ((const IdealLoopTree *)loop);
125
136
assert (unswitch_iff != NULL , " should be at least one" );
126
137
@@ -140,7 +151,7 @@ void PhaseIdealLoop::do_unswitching(IdealLoopTree *loop, Node_List &old_new) {
140
151
141
152
#ifdef ASSERT
142
153
Node* uniqc = proj_true->unique_ctrl_out ();
143
- Node* entry = head->skip_strip_mined ()->in (LoopNode::EntryControl);
154
+ entry = head->skip_strip_mined ()->in (LoopNode::EntryControl);
144
155
Node* predicate = find_predicate (entry);
145
156
if (predicate != NULL ) {
146
157
entry = skip_loop_predicates (entry);
@@ -281,123 +292,6 @@ ProjNode* PhaseIdealLoop::create_slow_version_of_loop(IdealLoopTree *loop,
281
292
_igvn.replace_input_of (slow_l, LoopNode::EntryControl, ifslow_pred);
282
293
set_idom (slow_l, ifslow_pred, dom_depth (l));
283
294
284
- if (iffast != iffast_pred && entry->outcnt () > 1 ) {
285
- // This situation occurs when only non-CFG nodes (i.e. no control dependencies between them) with a control
286
- // input from the loop header were partially peeled before (now control dependent on loop entry control).
287
- // If additional CFG nodes were peeled, then the insertion point of the loop predicates from the parsing stage
288
- // would not be found anymore and the predicates not cloned at all (i.e. iffast == iffast_pred) as it happens
289
- // for normal peeling. Those partially peeled statements have a control input from the old loop entry control
290
- // and need to be executed after the predicates. These control dependencies need to be removed from the old
291
- // entry control and added to the new entry control nodes 'iffast_pred' and 'ifslow_pred'. Since each node can
292
- // only have one control input, we need to create clones for all statements (2) that can be reached over a path
293
- // from the old entry control 'entry' (1) to a loop phi (8, 9). The old nodes (2) will be moved to the fast loop and the
294
- // new cloned nodes (10) to the slow loop.
295
- //
296
- // The result of the following algorithm is visualized below. The cloned loop predicates for the fast loop
297
- // are between the loop selection node (3) and the entry control for the fast loop (4) and for the slow loop
298
- // between the loop selection node (3) and the entry control for the slow loop (5), respectively.
299
- //
300
- // 1 entry 1 entry
301
- // / \ |
302
- // 2 stmt 3 iff 3 iff
303
- // | / \ / \
304
- // | .. .. .. ..
305
- // | / \ / \
306
- // | 4 iffast_p 5 ifslow_p 4 iffast_p 5 ifslow_p
307
- // | | | / \ / \
308
- // | 6 head 7 slow_head ==> 6 head 2 stmt 7 slow_head 10 cloned_stmt
309
- // | | | \ / \ /
310
- // +--\ | +--\ | 8 phi 9 phi
311
- // | 8 phi | 9 phi
312
- // | |
313
- // +----------+
314
- //
315
- assert (ifslow != ifslow_pred, " sanity - must also be different" );
316
-
317
- ResourceMark rm;
318
- Unique_Node_List worklist;
319
- Unique_Node_List phis;
320
- Node_List old_clone;
321
- LoopNode* slow_head = old_new[head->_idx ]->as_Loop ();
322
-
323
- // 1) Do a BFS starting from the outputs of the original entry control node 'entry' to all (loop) phis
324
- // and add the non-phi nodes to the worklist.
325
- // First get all outputs of 'entry' which are not the new "loop selection check" 'iff'.
326
- for (DUIterator_Fast imax, i = entry->fast_outs (imax); i < imax; i++) {
327
- Node* stmt = entry->fast_out (i);
328
- if (stmt != iff) {
329
- assert (!stmt->is_CFG (), " cannot be a CFG node" );
330
- worklist.push (stmt);
331
- }
332
- }
333
-
334
- // Then do a BFS from all collected nodes so far and stop if a phi node is hit.
335
- // Keep track of them on a separate 'phis' list to adjust their inputs later.
336
- for (uint i = 0 ; i < worklist.size (); i++) {
337
- Node* stmt = worklist.at (i);
338
- for (DUIterator_Fast jmax, j = stmt->fast_outs (jmax); j < jmax; j++) {
339
- Node* out = stmt->fast_out (j);
340
- assert (!out->is_CFG (), " cannot be a CFG node" );
341
- if (out->is_Phi ()) {
342
- assert (out->in (PhiNode::Region) == head || out->in (PhiNode::Region) == slow_head,
343
- " phi must be either part of the slow or the fast loop" );
344
- phis.push (out);
345
- } else {
346
- worklist.push (out);
347
- }
348
- }
349
- }
350
-
351
- // 2) All nodes of interest are in 'worklist' and are now cloned. This could not be done simultaneously
352
- // in step 1 in an easy way because we could have cloned a node which has an input that is added to the
353
- // worklist later. As a result, the BFS would hit a clone which does not need to be cloned again.
354
- // While cloning a node, the control inputs to 'entry' are updated such that the old node points to
355
- // 'iffast_pred' and the clone to 'ifslow_pred', respectively.
356
- for (uint i = 0 ; i < worklist.size (); i++) {
357
- Node* stmt = worklist.at (i);
358
- assert (!stmt->is_CFG (), " cannot be a CFG node" );
359
- Node* cloned_stmt = stmt->clone ();
360
- old_clone.map (stmt->_idx , cloned_stmt);
361
- _igvn.register_new_node_with_optimizer (cloned_stmt);
362
-
363
- if (stmt->in (0 ) == entry) {
364
- _igvn.replace_input_of (stmt, 0 , iffast_pred);
365
- set_ctrl (stmt, iffast_pred);
366
- _igvn.replace_input_of (cloned_stmt, 0 , ifslow_pred);
367
- set_ctrl (cloned_stmt, ifslow_pred);
368
- }
369
- }
370
-
371
- // 3) Update the entry control of all collected phi nodes of the slow loop to use the cloned nodes
372
- // instead of the old ones from the worklist
373
- for (uint i = 0 ; i < phis.size (); i++) {
374
- assert (phis.at (i)->is_Phi (), " must be a phi" );
375
- PhiNode* phi = phis.at (i)->as_Phi ();
376
- if (phi->in (PhiNode::Region) == slow_head) {
377
- // Slow loop: Update phi entry control to use the cloned version instead of the old one from the worklist
378
- Node* entry_control = phi->in (LoopNode::EntryControl);
379
- _igvn.replace_input_of (phi, LoopNode::EntryControl, old_clone[phi->in (LoopNode::EntryControl)->_idx ]);
380
- }
381
-
382
- }
383
-
384
- // 4) Replace all input edges of cloned nodes from old nodes on the worklist by an input edge from their
385
- // corresponding cloned version.
386
- for (uint i = 0 ; i < worklist.size (); i++) {
387
- Node* stmt = worklist.at (i);
388
- for (uint j = 0 ; j < stmt->req (); j++) {
389
- Node* in = stmt->in (j);
390
- if (in == NULL ) {
391
- continue ;
392
- }
393
-
394
- if (worklist.contains (in)) {
395
- // Replace the edge old1->clone_of_old_2 with an edge clone_of_old1->clone_of_old2
396
- old_clone[stmt->_idx ]->set_req (j, old_clone[in->_idx ]);
397
- }
398
- }
399
- }
400
- }
401
295
recompute_dom_depth ();
402
296
403
297
return iffast;
0 commit comments