Skip to content

Commit a0a09d5

Browse files
committedDec 22, 2022
8298176: remove OpaqueZeroTripGuardPostLoop once main-loop disappears
Reviewed-by: thartmann, chagedorn, kvn
1 parent fef70d7 commit a0a09d5

File tree

7 files changed

+191
-3
lines changed

7 files changed

+191
-3
lines changed
 

‎src/hotspot/share/opto/loopTransform.cpp

+2-2
Original file line numberDiff line numberDiff line change
@@ -1705,7 +1705,7 @@ void PhaseIdealLoop::insert_pre_post_loops(IdealLoopTree *loop, Node_List &old_n
17051705
// pre-loop, the main-loop may not execute at all. Later in life this
17061706
// zero-trip guard will become the minimum-trip guard when we unroll
17071707
// the main-loop.
1708-
Node *min_opaq = new OpaqueZeroTripGuardNode(C, limit);
1708+
Node *min_opaq = new OpaqueZeroTripGuardNode(C, limit, b_test);
17091709
Node *min_cmp = new CmpINode(pre_incr, min_opaq);
17101710
Node *min_bol = new BoolNode(min_cmp, b_test);
17111711
register_new_node(min_opaq, new_pre_exit);
@@ -1994,7 +1994,7 @@ Node *PhaseIdealLoop::insert_post_loop(IdealLoopTree* loop, Node_List& old_new,
19941994
// (the previous loop trip-counter exit value) because we will be changing
19951995
// the exit value (via additional unrolling) so we cannot constant-fold away the zero
19961996
// trip guard until all unrolling is done.
1997-
Node *zer_opaq = new OpaqueZeroTripGuardNode(C, incr);
1997+
Node *zer_opaq = new OpaqueZeroTripGuardNode(C, incr, main_end->test_trip());
19981998
Node *zer_cmp = new CmpINode(zer_opaq, limit);
19991999
Node *zer_bol = new BoolNode(zer_cmp, main_end->test_trip());
20002000
register_new_node(zer_opaq, new_main_exit);

‎src/hotspot/share/opto/opaquenode.hpp

+9-1
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,7 @@
2727

2828
#include "opto/node.hpp"
2929
#include "opto/opcodes.hpp"
30+
#include "subnode.hpp"
3031

3132
//------------------------------Opaque1Node------------------------------------
3233
// A node to prevent unwanted optimizations. Allows constant folding.
@@ -72,9 +73,16 @@ class OpaqueLoopStrideNode : public Opaque1Node {
7273

7374
class OpaqueZeroTripGuardNode : public Opaque1Node {
7475
public:
75-
OpaqueZeroTripGuardNode(Compile* C, Node *n) : Opaque1Node(C, n) {
76+
// This captures the test that returns true when the loop is entered. It depends on whether the loop goes up or down.
77+
// This is used by CmpINode::Value.
78+
BoolTest::mask _loop_entered_mask;
79+
OpaqueZeroTripGuardNode(Compile* C, Node* n, BoolTest::mask loop_entered_test) :
80+
Opaque1Node(C, n), _loop_entered_mask(loop_entered_test) {
7681
}
7782
virtual int Opcode() const;
83+
virtual uint size_of() const {
84+
return sizeof(*this);
85+
}
7886
};
7987

8088
//------------------------------Opaque3Node------------------------------------

‎src/hotspot/share/opto/phaseX.cpp

+14
Original file line numberDiff line numberDiff line change
@@ -1678,6 +1678,13 @@ void PhaseIterGVN::add_users_to_worklist( Node *n ) {
16781678
}
16791679
}
16801680
}
1681+
if (use->Opcode() == Op_OpaqueZeroTripGuard) {
1682+
assert(use->outcnt() <= 1, "OpaqueZeroTripGuard can't be shared");
1683+
if (use->outcnt() == 1) {
1684+
Node* cmp = use->unique_out();
1685+
_worklist.push(cmp);
1686+
}
1687+
}
16811688
}
16821689
}
16831690

@@ -1848,6 +1855,7 @@ void PhaseCCP::push_more_uses(Unique_Node_List& worklist, Node* parent, const No
18481855
push_loadp(worklist, use);
18491856
push_and(worklist, parent, use);
18501857
push_cast_ii(worklist, parent, use);
1858+
push_opaque_zero_trip_guard(worklist, use);
18511859
}
18521860

18531861

@@ -1968,6 +1976,12 @@ void PhaseCCP::push_cast_ii(Unique_Node_List& worklist, const Node* parent, cons
19681976
}
19691977
}
19701978

1979+
void PhaseCCP::push_opaque_zero_trip_guard(Unique_Node_List& worklist, const Node* use) const {
1980+
if (use->Opcode() == Op_OpaqueZeroTripGuard) {
1981+
push_if_not_bottom_type(worklist, use->unique_out());
1982+
}
1983+
}
1984+
19711985
//------------------------------do_transform-----------------------------------
19721986
// Top level driver for the recursive transformer
19731987
void PhaseCCP::do_transform() {

‎src/hotspot/share/opto/phaseX.hpp

+1
Original file line numberDiff line numberDiff line change
@@ -596,6 +596,7 @@ class PhaseCCP : public PhaseIterGVN {
596596
static void push_load_barrier(Unique_Node_List& worklist, const BarrierSetC2* barrier_set, const Node* use);
597597
void push_and(Unique_Node_List& worklist, const Node* parent, const Node* use) const;
598598
void push_cast_ii(Unique_Node_List& worklist, const Node* parent, const Node* use) const;
599+
void push_opaque_zero_trip_guard(Unique_Node_List& worklist, const Node* use) const;
599600

600601
public:
601602
PhaseCCP( PhaseIterGVN *igvn ); // Compute conditional constants

‎src/hotspot/share/opto/subnode.cpp

+42
Original file line numberDiff line numberDiff line change
@@ -34,6 +34,7 @@
3434
#include "opto/matcher.hpp"
3535
#include "opto/movenode.hpp"
3636
#include "opto/mulnode.hpp"
37+
#include "opto/opaquenode.hpp"
3738
#include "opto/opcodes.hpp"
3839
#include "opto/phaseX.hpp"
3940
#include "opto/subnode.hpp"
@@ -661,6 +662,47 @@ const Type *CmpINode::sub( const Type *t1, const Type *t2 ) const {
661662
return TypeInt::CC; // else use worst case results
662663
}
663664

665+
const Type* CmpINode::Value(PhaseGVN* phase) const {
666+
Node* in1 = in(1);
667+
Node* in2 = in(2);
668+
// If this test is the zero trip guard for a main or post loop, check whether, with the opaque node removed, the test
669+
// would constant fold so the loop is never entered. If so return the type of the test without the opaque node removed:
670+
// make the loop unreachable.
671+
// The reason for this is that the iv phi captures the bounds of the loop and if the loop becomes unreachable, it can
672+
// become top. In that case, the loop must be removed.
673+
// This is safe because:
674+
// - as optimizations proceed, the range of iterations executed by the main loop narrows. If no iterations remain, then
675+
// we're done with optimizations for that loop.
676+
// - the post loop is initially not reachable but as long as there's a main loop, the zero trip guard for the post
677+
// loop takes a phi that merges the pre and main loop's iv and can't constant fold the zero trip guard. Once, the main
678+
// loop is removed, there's no need to preserve the zero trip guard for the post loop anymore.
679+
if (in1 != NULL && in2 != NULL) {
680+
uint input = 0;
681+
Node* cmp = NULL;
682+
BoolTest::mask test;
683+
if (in1->Opcode() == Op_OpaqueZeroTripGuard && phase->type(in1) != Type::TOP) {
684+
cmp = new CmpINode(in1->in(1), in2);
685+
test = ((OpaqueZeroTripGuardNode*)in1)->_loop_entered_mask;
686+
}
687+
if (in2->Opcode() == Op_OpaqueZeroTripGuard && phase->type(in2) != Type::TOP) {
688+
assert(cmp == NULL, "A cmp with 2 OpaqueZeroTripGuard inputs");
689+
cmp = new CmpINode(in1, in2->in(1));
690+
test = ((OpaqueZeroTripGuardNode*)in2)->_loop_entered_mask;
691+
}
692+
if (cmp != NULL) {
693+
const Type* cmp_t = cmp->Value(phase);
694+
const Type* t = BoolTest(test).cc2logical(cmp_t);
695+
cmp->destruct(phase);
696+
if (t == TypeInt::ZERO) {
697+
return cmp_t;
698+
}
699+
}
700+
}
701+
702+
return SubNode::Value(phase);
703+
}
704+
705+
664706
// Simplify a CmpU (compare 2 integers) node, based on local information.
665707
// If both inputs are constants, compare them.
666708
const Type *CmpUNode::sub( const Type *t1, const Type *t2 ) const {

‎src/hotspot/share/opto/subnode.hpp

+1
Original file line numberDiff line numberDiff line change
@@ -153,6 +153,7 @@ class CmpINode : public CmpNode {
153153
virtual int Opcode() const;
154154
virtual Node *Ideal(PhaseGVN *phase, bool can_reshape);
155155
virtual const Type *sub( const Type *, const Type * ) const;
156+
virtual const Type* Value(PhaseGVN* phase) const;
156157
};
157158

158159
//------------------------------CmpUNode---------------------------------------
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,122 @@
1+
/*
2+
* Copyright (c) 2022, Oracle and/or its affiliates. All rights reserved.
3+
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4+
*
5+
* This code is free software; you can redistribute it and/or modify it
6+
* under the terms of the GNU General Public License version 2 only, as
7+
* published by the Free Software Foundation.
8+
*
9+
* This code is distributed in the hope that it will be useful, but WITHOUT
10+
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11+
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
12+
* version 2 for more details (a copy is included in the LICENSE file that
13+
* accompanied this code).
14+
*
15+
* You should have received a copy of the GNU General Public License version
16+
* 2 along with this work; if not, write to the Free Software Foundation,
17+
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18+
*
19+
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20+
* or visit www.oracle.com if you need additional information or have any
21+
* questions.
22+
*/
23+
24+
/*
25+
* @test
26+
* @bug 8298176
27+
* @summary Must remove OpaqueZeroTripGuardPostLoop after main loop disappears else
28+
* the zero-trip-guard of the post loop cannot die and leaves an inconsistent
29+
* graph behind.
30+
* @run main/othervm -Xcomp -XX:-TieredCompilation
31+
* -XX:CompileCommand=compileonly,TestOpaqueZeroTripGuardPostLoopRemoval::test*
32+
* -XX:CompileCommand=dontinline,TestOpaqueZeroTripGuardPostLoopRemoval::*
33+
* TestOpaqueZeroTripGuardPostLoopRemoval
34+
*/
35+
36+
public class TestOpaqueZeroTripGuardPostLoopRemoval {
37+
static long x;
38+
39+
public static void main(String[] strArr) {
40+
test_001();
41+
test_002();
42+
try {
43+
test_003();
44+
} catch (Exception e) {
45+
// Expected
46+
}
47+
test_004();
48+
test_005();
49+
}
50+
51+
static void test_001() {
52+
int b = 6;
53+
for (long l = 1; l < 9; l++) {
54+
b++;
55+
}
56+
for (int i = 1; i < 1000; i*=2) {
57+
for (int j = 1; j < 2; j++) {
58+
x = b + 1;
59+
}
60+
}
61+
}
62+
63+
static void test_002() {
64+
int b = 6;
65+
for (long l = 60; l < 3000; l+=3) {
66+
// bounds of loop: no work for post loop
67+
b += 33; // any multiple of iv step
68+
}
69+
for (int i = 1; i < 1000; i*=2) {
70+
for (int j = 1; j < 2; j++) {
71+
x = b + 1;
72+
}
73+
}
74+
}
75+
76+
static void dontInline() {
77+
throw new RuntimeException();
78+
}
79+
80+
static int test_003() {
81+
int y = 3;
82+
for (int i = 0; i < 9; ) {
83+
for (long l = 1; l < 5; l++) {
84+
y *= 2;
85+
}
86+
while (true) {
87+
dontInline();
88+
}
89+
}
90+
return y;
91+
}
92+
93+
static void test_004() {
94+
for (int i2 = 4; i2 < 13; i2++) {
95+
double d = 56;
96+
for (long l = 1; l < 5; l++) {
97+
d = d + 3;
98+
}
99+
for (int i = 0; i < 10; i++) {
100+
for (int d2 = i2; d2 < 2; d2 = 3) {
101+
}
102+
}
103+
}
104+
}
105+
106+
public static int test_005() {
107+
long arr[]=new long[400];
108+
for (int i = 3; i < 177; i++) {
109+
for (int j = 0; j < 10; j++){}
110+
}
111+
int y = 0;
112+
for (int i = 15; i < 356; i++) {
113+
// Inner loop prevents strip-mining of outer loop
114+
// later, inner loop is removed, so outer does pre-main-post without strip-mining
115+
for (int j = 0; j < 10; j++){
116+
y |= 1;
117+
}
118+
}
119+
return y;
120+
}
121+
}
122+

0 commit comments

Comments
 (0)
Please sign in to comment.