Skip to content

Commit 941a7ac

Browse files
author
Fei Gao
committedMar 24, 2023
8304301: Remove the global option SuperWordMaxVectorSize
Reviewed-by: sviswanathan, kvn
1 parent ac6af6a commit 941a7ac

14 files changed

+66
-54
lines changed
 

‎src/hotspot/cpu/aarch64/aarch64.ad

+4
Original file line numberDiff line numberDiff line change
@@ -2375,6 +2375,10 @@ const int Matcher::min_vector_size(const BasicType bt) {
23752375
return MIN2(size, max_size);
23762376
}
23772377

2378+
const int Matcher::superword_max_vector_size(const BasicType bt) {
2379+
return Matcher::max_vector_size(bt);
2380+
}
2381+
23782382
// Actual max scalable vector register length.
23792383
const int Matcher::scalable_vector_reg_size(const BasicType bt) {
23802384
return Matcher::max_vector_size(bt);

‎src/hotspot/cpu/arm/arm.ad

+5-1
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
//
2-
// Copyright (c) 2008, 2022, Oracle and/or its affiliates. All rights reserved.
2+
// Copyright (c) 2008, 2023, Oracle and/or its affiliates. All rights reserved.
33
// DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
44
//
55
// This code is free software; you can redistribute it and/or modify it
@@ -1074,6 +1074,10 @@ const int Matcher::min_vector_size(const BasicType bt) {
10741074
return 8/type2aelembytes(bt);
10751075
}
10761076

1077+
const int Matcher::superword_max_vector_size(const BasicType bt) {
1078+
return Matcher::max_vector_size(bt);
1079+
}
1080+
10771081
// Is this branch offset short enough that a short branch can be used?
10781082
//
10791083
// NOTE: If the platform does not provide any short branch variants, then

‎src/hotspot/cpu/ppc/ppc.ad

+4
Original file line numberDiff line numberDiff line change
@@ -2239,6 +2239,10 @@ const int Matcher::min_vector_size(const BasicType bt) {
22392239
return max_vector_size(bt); // Same as max.
22402240
}
22412241

2242+
const int Matcher::superword_max_vector_size(const BasicType bt) {
2243+
return Matcher::max_vector_size(bt);
2244+
}
2245+
22422246
const int Matcher::scalable_vector_reg_size(const BasicType bt) {
22432247
return -1;
22442248
}

‎src/hotspot/cpu/riscv/riscv.ad

+4
Original file line numberDiff line numberDiff line change
@@ -1945,6 +1945,10 @@ const int Matcher::min_vector_size(const BasicType bt) {
19451945
return MIN2(size, max_size);
19461946
}
19471947

1948+
const int Matcher::superword_max_vector_size(const BasicType bt) {
1949+
return Matcher::max_vector_size(bt);
1950+
}
1951+
19481952
// Vector ideal reg.
19491953
const uint Matcher::vector_ideal_reg(int len) {
19501954
assert(MaxVectorSize >= len, "");

‎src/hotspot/cpu/s390/s390.ad

+4
Original file line numberDiff line numberDiff line change
@@ -1571,6 +1571,10 @@ const int Matcher::min_vector_size(const BasicType bt) {
15711571
return max_vector_size(bt); // Same as max.
15721572
}
15731573

1574+
const int Matcher::superword_max_vector_size(const BasicType bt) {
1575+
return Matcher::max_vector_size(bt);
1576+
}
1577+
15741578
const int Matcher::scalable_vector_reg_size(const BasicType bt) {
15751579
return -1;
15761580
}

‎src/hotspot/cpu/x86/vm_version_x86.cpp

+11-21
Original file line numberDiff line numberDiff line change
@@ -1312,27 +1312,6 @@ void VM_Version::get_processor_features() {
13121312
FLAG_SET_DEFAULT(MaxVectorSize, max_vector_size);
13131313
}
13141314

1315-
#if defined(COMPILER2)
1316-
if (FLAG_IS_DEFAULT(SuperWordMaxVectorSize)) {
1317-
if (FLAG_IS_DEFAULT(UseAVX) && UseAVX > 2 &&
1318-
is_intel_skylake() && _stepping >= 5) {
1319-
// Limit auto vectorization to 256 bit (32 byte) by default on Cascade Lake
1320-
FLAG_SET_DEFAULT(SuperWordMaxVectorSize, MIN2(MaxVectorSize, (intx)32));
1321-
} else {
1322-
FLAG_SET_DEFAULT(SuperWordMaxVectorSize, MaxVectorSize);
1323-
}
1324-
} else {
1325-
if (SuperWordMaxVectorSize > MaxVectorSize) {
1326-
warning("SuperWordMaxVectorSize cannot be greater than MaxVectorSize %i", (int) MaxVectorSize);
1327-
FLAG_SET_DEFAULT(SuperWordMaxVectorSize, MaxVectorSize);
1328-
}
1329-
if (!is_power_of_2(SuperWordMaxVectorSize)) {
1330-
warning("SuperWordMaxVectorSize must be a power of 2, setting to MaxVectorSize: %i", (int) MaxVectorSize);
1331-
FLAG_SET_DEFAULT(SuperWordMaxVectorSize, MaxVectorSize);
1332-
}
1333-
}
1334-
#endif
1335-
13361315
#if defined(COMPILER2) && defined(ASSERT)
13371316
if (MaxVectorSize > 0) {
13381317
if (supports_avx() && PrintMiscellaneous && Verbose && TraceNewVectors) {
@@ -2094,6 +2073,17 @@ void VM_Version::check_virtualizations() {
20942073
}
20952074
}
20962075

2076+
#ifdef COMPILER2
2077+
// Determine if it's running on Cascade Lake using default options.
2078+
bool VM_Version::is_default_intel_cascade_lake() {
2079+
return FLAG_IS_DEFAULT(UseAVX) &&
2080+
FLAG_IS_DEFAULT(MaxVectorSize) &&
2081+
UseAVX > 2 &&
2082+
is_intel_skylake() &&
2083+
_stepping >= 5;
2084+
}
2085+
#endif
2086+
20972087
// avx3_threshold() sets the threshold at which 64-byte instructions are used
20982088
// for implementing the array copy and clear operations.
20992089
// The Intel platforms that supports the serialize instruction

‎src/hotspot/cpu/x86/vm_version_x86.hpp

+5
Original file line numberDiff line numberDiff line change
@@ -711,6 +711,11 @@ class VM_Version : public Abstract_VM_Version {
711711
static bool is_intel_skylake() { return is_intel_family_core() &&
712712
extended_cpu_model() == CPU_MODEL_SKYLAKE; }
713713

714+
#ifdef COMPILER2
715+
// Determine if it's running on Cascade Lake using default options.
716+
static bool is_default_intel_cascade_lake();
717+
#endif
718+
714719
static int avx3_threshold();
715720

716721
static bool is_intel_tsc_synched_at_init();

‎src/hotspot/cpu/x86/x86.ad

+9
Original file line numberDiff line numberDiff line change
@@ -2296,6 +2296,15 @@ const int Matcher::min_vector_size(const BasicType bt) {
22962296
return MIN2(size,max_size);
22972297
}
22982298

2299+
const int Matcher::superword_max_vector_size(const BasicType bt) {
2300+
// Limit the max vector size for auto vectorization to 256 bits (32 bytes)
2301+
// by default on Cascade Lake
2302+
if (VM_Version::is_default_intel_cascade_lake()) {
2303+
return MIN2(Matcher::max_vector_size(bt), 32 / type2aelembytes(bt));
2304+
}
2305+
return Matcher::max_vector_size(bt);
2306+
}
2307+
22992308
const int Matcher::scalable_vector_reg_size(const BasicType bt) {
23002309
return -1;
23012310
}

‎src/hotspot/share/opto/c2_globals.hpp

-5
Original file line numberDiff line numberDiff line change
@@ -82,11 +82,6 @@
8282
"actual size could be less depending on elements type") \
8383
range(0, max_jint) \
8484
\
85-
product(intx, SuperWordMaxVectorSize, 64, DIAGNOSTIC, \
86-
"Vector size limit in bytes for superword, " \
87-
"superword vector size limit in bytes") \
88-
range(0, max_jint) \
89-
\
9085
product(intx, ArrayOperationPartialInlineSize, 0, DIAGNOSTIC, \
9186
"Partial inline size used for small array operations" \
9287
"(e.g. copy,cmp) acceleration.") \

‎src/hotspot/share/opto/matcher.hpp

+2
Original file line numberDiff line numberDiff line change
@@ -351,6 +351,8 @@ class Matcher : public PhaseTransform {
351351
return (Matcher::max_vector_size(bt) >= size &&
352352
Matcher::min_vector_size(bt) <= size);
353353
}
354+
// Limits on max vector size (number of elements) for auto-vectorization.
355+
static const int superword_max_vector_size(const BasicType bt);
354356

355357
// Actual max scalable vector register length.
356358
static const int scalable_vector_reg_size(const BasicType bt);

‎src/hotspot/share/opto/superword.cpp

+8-18
Original file line numberDiff line numberDiff line change
@@ -198,16 +198,6 @@ bool SuperWord::transform_loop(IdealLoopTree* lpt, bool do_optimization) {
198198
return success;
199199
}
200200

201-
//------------------------------max vector size------------------------------
202-
int SuperWord::max_vector_size(BasicType bt) {
203-
int max_vector = Matcher::max_vector_size(bt);
204-
int sw_max_vector_limit = SuperWordMaxVectorSize / type2aelembytes(bt);
205-
if (max_vector > sw_max_vector_limit) {
206-
max_vector = sw_max_vector_limit;
207-
}
208-
return max_vector;
209-
}
210-
211201
//------------------------------early unrolling analysis------------------------------
212202
void SuperWord::unrolling_analysis(int &local_loop_unroll_factor) {
213203
bool is_slp = true;
@@ -226,7 +216,7 @@ void SuperWord::unrolling_analysis(int &local_loop_unroll_factor) {
226216
ignored_loop_nodes[i] = -1;
227217
}
228218

229-
int max_vector = max_vector_size(T_BYTE);
219+
int max_vector = Matcher::superword_max_vector_size(T_BYTE);
230220

231221
// Process the loop, some/all of the stack entries will not be in order, ergo
232222
// need to preprocess the ignored initial state before we process the loop
@@ -361,7 +351,7 @@ void SuperWord::unrolling_analysis(int &local_loop_unroll_factor) {
361351

362352
if (is_java_primitive(bt) == false) continue;
363353

364-
int cur_max_vector = max_vector_size(bt);
354+
int cur_max_vector = Matcher::superword_max_vector_size(bt);
365355

366356
// If a max vector exists which is not larger than _local_loop_unroll_factor
367357
// stop looking, we already have the max vector to map to.
@@ -1054,13 +1044,13 @@ int SuperWord::get_vw_bytes_special(MemNode* s) {
10541044
}
10551045
}
10561046
if (should_combine_adjacent) {
1057-
vw = MIN2(max_vector_size(btype)*type2aelembytes(btype), vw * 2);
1047+
vw = MIN2(Matcher::superword_max_vector_size(btype)*type2aelembytes(btype), vw * 2);
10581048
}
10591049
}
10601050

10611051
// Check for special case where there is a type conversion between different data size.
10621052
int vectsize = max_vector_size_in_def_use_chain(s);
1063-
if (vectsize < max_vector_size(btype)) {
1053+
if (vectsize < Matcher::superword_max_vector_size(btype)) {
10641054
vw = MIN2(vectsize * type2aelembytes(btype), vw);
10651055
}
10661056

@@ -1254,8 +1244,8 @@ bool SuperWord::stmts_can_pack(Node* s1, Node* s2, int align) {
12541244
if(!is_java_primitive(bt1) || !is_java_primitive(bt2))
12551245
return false;
12561246
BasicType longer_bt = longer_type_for_conversion(s1);
1257-
if (max_vector_size(bt1) < 2 ||
1258-
(longer_bt != T_ILLEGAL && max_vector_size(longer_bt) < 2)) {
1247+
if (Matcher::superword_max_vector_size(bt1) < 2 ||
1248+
(longer_bt != T_ILLEGAL && Matcher::superword_max_vector_size(longer_bt) < 2)) {
12591249
return false; // No vectors for this type
12601250
}
12611251

@@ -3669,10 +3659,10 @@ int SuperWord::max_vector_size_in_def_use_chain(Node* n) {
36693659
vt = (newt == T_ILLEGAL) ? vt : newt;
36703660
}
36713661

3672-
int max = max_vector_size(vt);
3662+
int max = Matcher::superword_max_vector_size(vt);
36733663
// If now there is no vectors for the longest type, the nodes with the longest
36743664
// type in the def-use chain are not packed in SuperWord::stmts_can_pack.
3675-
return max < 2 ? max_vector_size(bt) : max;
3665+
return max < 2 ? Matcher::superword_max_vector_size(bt) : max;
36763666
}
36773667

36783668
//-------------------------compute_vector_element_type-----------------------

‎src/hotspot/share/opto/superword.hpp

-2
Original file line numberDiff line numberDiff line change
@@ -329,8 +329,6 @@ class SuperWord : public ResourceObj {
329329

330330
bool transform_loop(IdealLoopTree* lpt, bool do_optimization);
331331

332-
int max_vector_size(BasicType bt);
333-
334332
void unrolling_analysis(int &local_loop_unroll_factor);
335333

336334
// Accessors for SWPointer

‎src/hotspot/share/opto/vectornode.cpp

+7-6
Original file line numberDiff line numberDiff line change
@@ -298,17 +298,18 @@ int VectorNode::replicate_opcode(BasicType bt) {
298298
}
299299
}
300300

301-
bool VectorNode::vector_size_supported(BasicType bt, uint vlen) {
302-
return (Matcher::vector_size_supported(bt, vlen) &&
303-
(vlen * type2aelembytes(bt) <= (uint)SuperWordMaxVectorSize));
301+
// Limits on vector size (number of elements) for auto-vectorization.
302+
bool VectorNode::vector_size_supported_superword(const BasicType bt, int size) {
303+
return Matcher::superword_max_vector_size(bt) >= size &&
304+
Matcher::min_vector_size(bt) <= size;
304305
}
305306

306307
// Also used to check if the code generator
307308
// supports the vector operation.
308309
bool VectorNode::implemented(int opc, uint vlen, BasicType bt) {
309310
if (is_java_primitive(bt) &&
310311
(vlen > 1) && is_power_of_2(vlen) &&
311-
vector_size_supported(bt, vlen)) {
312+
vector_size_supported_superword(bt, vlen)) {
312313
int vopc = VectorNode::opcode(opc, bt);
313314
// For rotate operation we will do a lazy de-generation into
314315
// OrV/LShiftV/URShiftV pattern if the target does not support
@@ -1379,7 +1380,7 @@ bool VectorCastNode::implemented(int opc, uint vlen, BasicType src_type, BasicTy
13791380
if (is_java_primitive(dst_type) &&
13801381
is_java_primitive(src_type) &&
13811382
(vlen > 1) && is_power_of_2(vlen) &&
1382-
VectorNode::vector_size_supported(dst_type, vlen)) {
1383+
VectorNode::vector_size_supported_superword(dst_type, vlen)) {
13831384
int vopc = VectorCastNode::opcode(opc, src_type);
13841385
return vopc > 0 && Matcher::match_rule_supported_superword(vopc, vlen, dst_type);
13851386
}
@@ -1473,7 +1474,7 @@ Node* ReductionNode::make_reduction_input(PhaseGVN& gvn, int opc, BasicType bt)
14731474
bool ReductionNode::implemented(int opc, uint vlen, BasicType bt) {
14741475
if (is_java_primitive(bt) &&
14751476
(vlen > 1) && is_power_of_2(vlen) &&
1476-
VectorNode::vector_size_supported(bt, vlen)) {
1477+
VectorNode::vector_size_supported_superword(bt, vlen)) {
14771478
int vopc = ReductionNode::opcode(opc, bt);
14781479
return vopc != opc && Matcher::match_rule_supported_superword(vopc, vlen, bt);
14791480
}

‎src/hotspot/share/opto/vectornode.hpp

+3-1
Original file line numberDiff line numberDiff line change
@@ -92,7 +92,9 @@ class VectorNode : public TypeNode {
9292

9393
static int opcode(int opc, BasicType bt);
9494
static int replicate_opcode(BasicType bt);
95-
static bool vector_size_supported(BasicType bt, uint vlen);
95+
96+
// Limits on vector size (number of elements) for auto-vectorization.
97+
static bool vector_size_supported_superword(const BasicType bt, int size);
9698
static bool implemented(int opc, uint vlen, BasicType bt);
9799
static bool is_shift(Node* n);
98100
static bool is_vshift_cnt(Node* n);

0 commit comments

Comments
 (0)
Please sign in to comment.