Skip to content

Commit e0151a6

Browse files
Xiaohong GongNingsheng Jian
Xiaohong Gong
authored and
Ningsheng Jian
committedApr 16, 2021
8264104: Eliminate unnecessary vector mask conversion during VectorUnbox for floating point VectorMask
Reviewed-by: kvn, vlivanov
1 parent 64e2130 commit e0151a6

File tree

9 files changed

+103
-1
lines changed

9 files changed

+103
-1
lines changed
 

‎src/hotspot/cpu/aarch64/aarch64_neon.ad

+30
Original file line numberDiff line numberDiff line change
@@ -3334,6 +3334,36 @@ instruct storemask2L(vecD dst, vecX src, immI_8 size)
33343334
ins_pipe(pipe_slow);
33353335
%}
33363336

3337+
// vector mask cast
3338+
3339+
instruct vmaskcastD(vecD dst)
3340+
%{
3341+
predicate(n->bottom_type()->is_vect()->length_in_bytes() == 8 &&
3342+
n->in(1)->bottom_type()->is_vect()->length_in_bytes() == 8 &&
3343+
n->bottom_type()->is_vect()->length() == n->in(1)->bottom_type()->is_vect()->length());
3344+
match(Set dst (VectorMaskCast dst));
3345+
ins_cost(0);
3346+
format %{ "vmaskcast $dst\t# empty" %}
3347+
ins_encode %{
3348+
// empty
3349+
%}
3350+
ins_pipe(pipe_class_empty);
3351+
%}
3352+
3353+
instruct vmaskcastX(vecX dst)
3354+
%{
3355+
predicate(n->bottom_type()->is_vect()->length_in_bytes() == 16 &&
3356+
n->in(1)->bottom_type()->is_vect()->length_in_bytes() == 16 &&
3357+
n->bottom_type()->is_vect()->length() == n->in(1)->bottom_type()->is_vect()->length());
3358+
match(Set dst (VectorMaskCast dst));
3359+
ins_cost(0);
3360+
format %{ "vmaskcast $dst\t# empty" %}
3361+
ins_encode %{
3362+
// empty
3363+
%}
3364+
ins_pipe(pipe_class_empty);
3365+
%}
3366+
33373367
//-------------------------------- LOAD_IOTA_INDICES----------------------------------
33383368

33393369
instruct loadcon8B(vecD dst, immI0 src)

‎src/hotspot/cpu/aarch64/aarch64_neon_ad.m4

+21
Original file line numberDiff line numberDiff line change
@@ -1258,6 +1258,27 @@ instruct storemask2L(vecD dst, vecX src, immI_8 size)
12581258
ins_pipe(pipe_slow);
12591259
%}
12601260

1261+
// vector mask cast
1262+
dnl
1263+
define(`VECTOR_MASK_CAST', `
1264+
instruct vmaskcast$1`'(vec$1 dst)
1265+
%{
1266+
predicate(n->bottom_type()->is_vect()->length_in_bytes() == $2 &&
1267+
n->in(1)->bottom_type()->is_vect()->length_in_bytes() == $2 &&
1268+
n->bottom_type()->is_vect()->length() == n->in(1)->bottom_type()->is_vect()->length());
1269+
match(Set dst (VectorMaskCast dst));
1270+
ins_cost(0);
1271+
format %{ "vmaskcast $dst\t# empty" %}
1272+
ins_encode %{
1273+
// empty
1274+
%}
1275+
ins_pipe(pipe_class_empty);
1276+
%}')dnl
1277+
dnl $1 $2
1278+
VECTOR_MASK_CAST(D, 8)
1279+
VECTOR_MASK_CAST(X, 16)
1280+
dnl
1281+
12611282
//-------------------------------- LOAD_IOTA_INDICES----------------------------------
12621283
dnl
12631284
define(`PREDICATE', `ifelse($1, 8,

‎src/hotspot/cpu/aarch64/aarch64_sve.ad

+15
Original file line numberDiff line numberDiff line change
@@ -1760,3 +1760,18 @@ instruct vsubD(vReg dst, vReg src1, vReg src2) %{
17601760
%}
17611761
ins_pipe(pipe_slow);
17621762
%}
1763+
1764+
// vector mask cast
1765+
1766+
instruct vmaskcast(vReg dst) %{
1767+
predicate(UseSVE > 0 && n->bottom_type()->is_vect()->length() == n->in(1)->bottom_type()->is_vect()->length() &&
1768+
n->bottom_type()->is_vect()->length_in_bytes() == n->in(1)->bottom_type()->is_vect()->length_in_bytes());
1769+
match(Set dst (VectorMaskCast dst));
1770+
ins_cost(0);
1771+
format %{ "vmaskcast $dst\t# empty (sve)" %}
1772+
ins_encode %{
1773+
// empty
1774+
%}
1775+
ins_pipe(pipe_class_empty);
1776+
%}
1777+

‎src/hotspot/cpu/aarch64/aarch64_sve_ad.m4

+15
Original file line numberDiff line numberDiff line change
@@ -904,3 +904,18 @@ BINARY_OP_UNPREDICATED(vsubI, SubVI, S, 4, sve_sub)
904904
BINARY_OP_UNPREDICATED(vsubL, SubVL, D, 2, sve_sub)
905905
BINARY_OP_UNPREDICATED(vsubF, SubVF, S, 4, sve_fsub)
906906
BINARY_OP_UNPREDICATED(vsubD, SubVD, D, 2, sve_fsub)
907+
908+
// vector mask cast
909+
910+
instruct vmaskcast(vReg dst) %{
911+
predicate(UseSVE > 0 && n->bottom_type()->is_vect()->length() == n->in(1)->bottom_type()->is_vect()->length() &&
912+
n->bottom_type()->is_vect()->length_in_bytes() == n->in(1)->bottom_type()->is_vect()->length_in_bytes());
913+
match(Set dst (VectorMaskCast dst));
914+
ins_cost(0);
915+
format %{ "vmaskcast $dst\t# empty (sve)" %}
916+
ins_encode %{
917+
// empty
918+
%}
919+
ins_pipe(pipe_class_empty);
920+
%}
921+

‎src/hotspot/share/adlc/formssel.cpp

+2-1
Original file line numberDiff line numberDiff line change
@@ -4200,7 +4200,8 @@ bool MatchRule::is_vector() const {
42004200
"FmaVD", "FmaVF","PopCountVI",
42014201
// Next are not supported currently.
42024202
"PackB","PackS","PackI","PackL","PackF","PackD","Pack2L","Pack2D",
4203-
"ExtractB","ExtractUB","ExtractC","ExtractS","ExtractI","ExtractL","ExtractF","ExtractD"
4203+
"ExtractB","ExtractUB","ExtractC","ExtractS","ExtractI","ExtractL","ExtractF","ExtractD",
4204+
"VectorMaskCast"
42044205
};
42054206
int cnt = sizeof(vector_list)/sizeof(char*);
42064207
if (_rChild) {

‎src/hotspot/share/opto/classes.hpp

+1
Original file line numberDiff line numberDiff line change
@@ -446,6 +446,7 @@ macro(VectorBoxAllocate)
446446
macro(VectorUnbox)
447447
macro(VectorMaskWrapper)
448448
macro(VectorMaskCmp)
449+
macro(VectorMaskCast)
449450
macro(VectorTest)
450451
macro(VectorBlend)
451452
macro(VectorRearrange)

‎src/hotspot/share/opto/vectornode.cpp

+7
Original file line numberDiff line numberDiff line change
@@ -1232,6 +1232,13 @@ Node* VectorUnboxNode::Ideal(PhaseGVN* phase, bool can_reshape) {
12321232
bool is_vector_mask = vbox_klass->is_subclass_of(ciEnv::current()->vector_VectorMask_klass());
12331233
bool is_vector_shuffle = vbox_klass->is_subclass_of(ciEnv::current()->vector_VectorShuffle_klass());
12341234
if (is_vector_mask) {
1235+
if (in_vt->length_in_bytes() == out_vt->length_in_bytes() &&
1236+
Matcher::match_rule_supported_vector(Op_VectorMaskCast, out_vt->length(), out_vt->element_basic_type())) {
1237+
// Apply "VectorUnbox (VectorBox vmask) ==> VectorMaskCast (vmask)"
1238+
// directly. This could avoid the transformation ordering issue from
1239+
// "VectorStoreMask (VectorLoadMask vmask) => vmask".
1240+
return new VectorMaskCastNode(value, out_vt);
1241+
}
12351242
// VectorUnbox (VectorBox vmask) ==> VectorLoadMask (VectorStoreMask vmask)
12361243
value = phase->transform(VectorStoreMaskNode::make(*phase, value, in_vt->element_basic_type(), in_vt->length()));
12371244
return new VectorLoadMaskNode(value, out_vt);

‎src/hotspot/share/opto/vectornode.hpp

+11
Original file line numberDiff line numberDiff line change
@@ -1240,6 +1240,17 @@ class VectorStoreMaskNode : public VectorNode {
12401240
static VectorStoreMaskNode* make(PhaseGVN& gvn, Node* in, BasicType in_type, uint num_elem);
12411241
};
12421242

1243+
class VectorMaskCastNode : public VectorNode {
1244+
public:
1245+
VectorMaskCastNode(Node* in, const TypeVect* vt) : VectorNode(in, vt) {
1246+
const TypeVect* in_vt = in->bottom_type()->is_vect();
1247+
assert(in_vt->length() == vt->length(), "vector length must match");
1248+
assert(type2aelembytes(in_vt->element_basic_type()) == type2aelembytes(vt->element_basic_type()), "element size must match");
1249+
}
1250+
1251+
virtual int Opcode() const;
1252+
};
1253+
12431254
// This is intended for use as a simple reinterpret node that has no cast.
12441255
class VectorReinterpretNode : public VectorNode {
12451256
private:

‎src/hotspot/share/runtime/vmStructs.cpp

+1
Original file line numberDiff line numberDiff line change
@@ -1878,6 +1878,7 @@ typedef HashtableEntry<InstanceKlass*, mtClass> KlassHashtableEntry;
18781878
declare_c2_type(VectorInsertNode, VectorNode) \
18791879
declare_c2_type(VectorUnboxNode, VectorNode) \
18801880
declare_c2_type(VectorReinterpretNode, VectorNode) \
1881+
declare_c2_type(VectorMaskCastNode, VectorNode) \
18811882
declare_c2_type(VectorBoxNode, Node) \
18821883
declare_c2_type(VectorBoxAllocateNode, CallStaticJavaNode) \
18831884
declare_c2_type(VectorTestNode, Node) \

0 commit comments

Comments
 (0)
Please sign in to comment.