Skip to content

Commit cd8709e

Browse files
committedApr 29, 2022
8284883: JVM crash: guarantee(sect->end() <= sect->limit()) failed: sanity on AVX512
Reviewed-by: kvn, jbhateja
1 parent 3d07b3c commit cd8709e

File tree

4 files changed

+90
-9
lines changed

4 files changed

+90
-9
lines changed
 

‎src/hotspot/cpu/x86/macroAssembler_x86.cpp

+33-8
Original file line numberDiff line numberDiff line change
@@ -5277,10 +5277,28 @@ void MacroAssembler::clear_mem(Register base, int cnt, Register rtmp, XMMRegiste
52775277

52785278
int vector64_count = (cnt & (~0x7)) >> 3;
52795279
cnt = cnt & 0x7;
5280+
const int fill64_per_loop = 4;
5281+
const int max_unrolled_fill64 = 8;
52805282

52815283
// 64 byte initialization loop.
52825284
vpxor(xtmp, xtmp, xtmp, use64byteVector ? AVX_512bit : AVX_256bit);
5283-
for (int i = 0; i < vector64_count; i++) {
5285+
int start64 = 0;
5286+
if (vector64_count > max_unrolled_fill64) {
5287+
Label LOOP;
5288+
Register index = rtmp;
5289+
5290+
start64 = vector64_count - (vector64_count % fill64_per_loop);
5291+
5292+
movl(index, 0);
5293+
BIND(LOOP);
5294+
for (int i = 0; i < fill64_per_loop; i++) {
5295+
fill64(Address(base, index, Address::times_1, i * 64), xtmp, use64byteVector);
5296+
}
5297+
addl(index, fill64_per_loop * 64);
5298+
cmpl(index, start64 * 64);
5299+
jccb(Assembler::less, LOOP);
5300+
}
5301+
for (int i = start64; i < vector64_count; i++) {
52845302
fill64(base, i * 64, xtmp, use64byteVector);
52855303
}
52865304

@@ -8874,22 +8892,29 @@ void MacroAssembler::fill32_masked(uint shift, Register dst, int disp,
88748892
}
88758893

88768894

8877-
void MacroAssembler::fill32(Register dst, int disp, XMMRegister xmm) {
8895+
void MacroAssembler::fill32(Address dst, XMMRegister xmm) {
88788896
assert(MaxVectorSize >= 32, "vector length should be >= 32");
8879-
vmovdqu(Address(dst, disp), xmm);
8897+
vmovdqu(dst, xmm);
88808898
}
88818899

8882-
void MacroAssembler::fill64(Register dst, int disp, XMMRegister xmm, bool use64byteVector) {
8900+
void MacroAssembler::fill32(Register dst, int disp, XMMRegister xmm) {
8901+
fill32(Address(dst, disp), xmm);
8902+
}
8903+
8904+
void MacroAssembler::fill64(Address dst, XMMRegister xmm, bool use64byteVector) {
88838905
assert(MaxVectorSize >= 32, "vector length should be >= 32");
8884-
BasicType type[] = {T_BYTE, T_SHORT, T_INT, T_LONG};
88858906
if (!use64byteVector) {
8886-
fill32(dst, disp, xmm);
8887-
fill32(dst, disp + 32, xmm);
8907+
fill32(dst, xmm);
8908+
fill32(dst.plus_disp(32), xmm);
88888909
} else {
8889-
evmovdquq(Address(dst, disp), xmm, Assembler::AVX_512bit);
8910+
evmovdquq(dst, xmm, Assembler::AVX_512bit);
88908911
}
88918912
}
88928913

8914+
void MacroAssembler::fill64(Register dst, int disp, XMMRegister xmm, bool use64byteVector) {
8915+
fill64(Address(dst, disp), xmm, use64byteVector);
8916+
}
8917+
88938918
#ifdef _LP64
88948919
void MacroAssembler::generate_fill_avx3(BasicType type, Register to, Register value,
88958920
Register count, Register rtmp, XMMRegister xtmp) {

‎src/hotspot/cpu/x86/macroAssembler_x86.hpp

+4
Original file line numberDiff line numberDiff line change
@@ -1985,8 +1985,12 @@ class MacroAssembler: public Assembler {
19851985
XMMRegister xmm, KRegister mask, Register length,
19861986
Register temp);
19871987

1988+
void fill32(Address dst, XMMRegister xmm);
1989+
19881990
void fill32(Register dst, int disp, XMMRegister xmm);
19891991

1992+
void fill64(Address dst, XMMRegister xmm, bool use64byteVector = false);
1993+
19901994
void fill64(Register dst, int dis, XMMRegister xmm, bool use64byteVector = false);
19911995

19921996
#ifdef _LP64

‎src/hotspot/share/opto/memnode.cpp

+2-1
Original file line numberDiff line numberDiff line change
@@ -3072,7 +3072,7 @@ Node* ClearArrayNode::Identity(PhaseGVN* phase) {
30723072
// Clearing a short array is faster with stores
30733073
Node *ClearArrayNode::Ideal(PhaseGVN *phase, bool can_reshape) {
30743074
// Already know this is a large node, do not try to ideal it
3075-
if (!IdealizeClearArrayNode || _is_large) return NULL;
3075+
if (_is_large) return NULL;
30763076

30773077
const int unit = BytesPerLong;
30783078
const TypeX* t = phase->type(in(2))->isa_intptr_t();
@@ -3093,6 +3093,7 @@ Node *ClearArrayNode::Ideal(PhaseGVN *phase, bool can_reshape) {
30933093
} else if (size > 2 && Matcher::match_rule_supported_vector(Op_ClearArray, 4, T_LONG)) {
30943094
return NULL;
30953095
}
3096+
if (!IdealizeClearArrayNode) return NULL;
30963097
Node *mem = in(1);
30973098
if( phase->type(mem)==Type::TOP ) return NULL;
30983099
Node *adr = in(3);
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,51 @@
1+
/*
2+
* Copyright (c) 2022, Oracle and/or its affiliates. All rights reserved.
3+
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4+
*
5+
* This code is free software; you can redistribute it and/or modify it
6+
* under the terms of the GNU General Public License version 2 only, as
7+
* published by the Free Software Foundation.
8+
*
9+
* This code is distributed in the hope that it will be useful, but WITHOUT
10+
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11+
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
12+
* version 2 for more details (a copy is included in the LICENSE file that
13+
* accompanied this code).
14+
*
15+
* You should have received a copy of the GNU General Public License version
16+
* 2 along with this work; if not, write to the Free Software Foundation,
17+
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18+
*
19+
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20+
* or visit www.oracle.com if you need additional information or have any
21+
* questions.
22+
*
23+
*/
24+
25+
/*
26+
* @test ClearArray.java
27+
* @bug 8284883
28+
* @compile ClearArray.java
29+
* @summary ClearArray instruction overflows scratch buffer
30+
* @run main/othervm -XX:+UnlockDiagnosticVMOptions -XX:-TieredCompilation -Xbatch
31+
* -XX:InitArrayShortSize=32768 -XX:-IdealizeClearArrayNode compiler.c2.ClearArray
32+
* @run main/othervm -XX:+UnlockDiagnosticVMOptions -XX:+IgnoreUnrecognizedVMOptions -XX:-TieredCompilation -Xbatch
33+
* -XX:InitArrayShortSize=32768 -XX:-IdealizeClearArrayNode -XX:UseAVX=3 compiler.c2.ClearArray
34+
*/
35+
36+
package compiler.c2;
37+
38+
public class ClearArray {
39+
40+
static long[] STATIC;
41+
42+
static void foo() {
43+
STATIC = new long[2048 - 1];
44+
}
45+
46+
public static void main(String[] args) {
47+
for (int i = 0; i < 20_000; ++i) {
48+
foo();
49+
}
50+
}
51+
}

0 commit comments

Comments
 (0)
Please sign in to comment.