8339063: [aarch64] Skip verify_sve_vector_length after native calls if SVE supports 128 bits VL only

Reviewed-by: adinn, fgao
This commit is contained in:
Joshua Zhu 2024-09-02 15:37:58 +00:00 committed by Andrew Dinn
parent b1163bcc88
commit 0e6bb514c8
7 changed files with 46 additions and 27 deletions

View File

@ -2334,7 +2334,7 @@ bool Matcher::is_short_branch_offset(int rule, int br_size, int offset) {
// Vector width in bytes. // Vector width in bytes.
int Matcher::vector_width_in_bytes(BasicType bt) { int Matcher::vector_width_in_bytes(BasicType bt) {
// The MaxVectorSize should have been set by detecting SVE max vector register size. // The MaxVectorSize should have been set by detecting SVE max vector register size.
int size = MIN2((UseSVE > 0) ? 256 : 16, (int)MaxVectorSize); int size = MIN2((UseSVE > 0) ? (int)FloatRegister::sve_vl_max : (int)FloatRegister::neon_vl, (int)MaxVectorSize);
// Minimum 2 values in vector // Minimum 2 values in vector
if (size < 2*type2aelembytes(bt)) size = 0; if (size < 2*type2aelembytes(bt)) size = 0;
// But never < 4 // But never < 4
@ -2373,7 +2373,7 @@ int Matcher::scalable_vector_reg_size(const BasicType bt) {
// Vector ideal reg. // Vector ideal reg.
uint Matcher::vector_ideal_reg(int len) { uint Matcher::vector_ideal_reg(int len) {
if (UseSVE > 0 && 16 < len && len <= 256) { if (UseSVE > 0 && FloatRegister::neon_vl < len && len <= FloatRegister::sve_vl_max) {
return Op_VecA; return Op_VecA;
} }
switch(len) { switch(len) {

View File

@ -155,7 +155,7 @@ source %{
} }
int length_in_bytes = vlen * type2aelembytes(bt); int length_in_bytes = vlen * type2aelembytes(bt);
if (UseSVE == 0 && length_in_bytes > 16) { if (UseSVE == 0 && length_in_bytes > FloatRegister::neon_vl) {
return false; return false;
} }

View File

@ -145,7 +145,7 @@ source %{
} }
int length_in_bytes = vlen * type2aelembytes(bt); int length_in_bytes = vlen * type2aelembytes(bt);
if (UseSVE == 0 && length_in_bytes > 16) { if (UseSVE == 0 && length_in_bytes > FloatRegister::neon_vl) {
return false; return false;
} }

View File

@ -6413,8 +6413,10 @@ void MacroAssembler::cache_wbsync(bool is_pre) {
} }
void MacroAssembler::verify_sve_vector_length(Register tmp) { void MacroAssembler::verify_sve_vector_length(Register tmp) {
if (!UseSVE || VM_Version::get_max_supported_sve_vector_length() == FloatRegister::sve_vl_min) {
return;
}
// Make sure that native code does not change SVE vector length. // Make sure that native code does not change SVE vector length.
if (!UseSVE) return;
Label verify_ok; Label verify_ok;
movw(tmp, zr); movw(tmp, zr);
sve_inc(tmp, B); sve_inc(tmp, B);

View File

@ -1,5 +1,5 @@
/* /*
* Copyright (c) 2000, 2023, Oracle and/or its affiliates. All rights reserved. * Copyright (c) 2000, 2024, Oracle and/or its affiliates. All rights reserved.
* Copyright (c) 2014, 2021, Red Hat Inc. All rights reserved. * Copyright (c) 2014, 2021, Red Hat Inc. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
* *
@ -166,7 +166,13 @@ class FloatRegister {
max_slots_per_register = 4, max_slots_per_register = 4,
save_slots_per_register = 2, save_slots_per_register = 2,
slots_per_neon_register = 4, slots_per_neon_register = 4,
extra_save_slots_per_neon_register = slots_per_neon_register - save_slots_per_register extra_save_slots_per_neon_register = slots_per_neon_register - save_slots_per_register,
neon_vl = 16,
// VLmax: the maximum SVE vector length (in bytes), which is determined by the
// hardware and satisfies sve_vl_min <= VLmax <= sve_vl_max.
sve_vl_min = 16,
// Maximum supported SVE vector length (in bytes) across all CPUs
sve_vl_max = 256
}; };
class FloatRegisterImpl: public AbstractRegisterImpl { class FloatRegisterImpl: public AbstractRegisterImpl {

View File

@ -25,6 +25,7 @@
#include "precompiled.hpp" #include "precompiled.hpp"
#include "pauth_aarch64.hpp" #include "pauth_aarch64.hpp"
#include "register_aarch64.hpp"
#include "runtime/arguments.hpp" #include "runtime/arguments.hpp"
#include "runtime/globals_extension.hpp" #include "runtime/globals_extension.hpp"
#include "runtime/java.hpp" #include "runtime/java.hpp"
@ -44,6 +45,7 @@ int VM_Version::_zva_length;
int VM_Version::_dcache_line_size; int VM_Version::_dcache_line_size;
int VM_Version::_icache_line_size; int VM_Version::_icache_line_size;
int VM_Version::_initial_sve_vector_length; int VM_Version::_initial_sve_vector_length;
int VM_Version::_max_supported_sve_vector_length;
bool VM_Version::_rop_protection; bool VM_Version::_rop_protection;
uintptr_t VM_Version::_pac_mask; uintptr_t VM_Version::_pac_mask;
@ -507,13 +509,20 @@ void VM_Version::initialize() {
if (UseSVE > 0) { if (UseSVE > 0) {
if (FLAG_IS_DEFAULT(MaxVectorSize)) { if (FLAG_IS_DEFAULT(MaxVectorSize)) {
MaxVectorSize = _initial_sve_vector_length; MaxVectorSize = _initial_sve_vector_length;
} else if (MaxVectorSize < 16) { } else if (MaxVectorSize < FloatRegister::sve_vl_min) {
warning("SVE does not support vector length less than 16 bytes. Disabling SVE."); warning("SVE does not support vector length less than %d bytes. Disabling SVE.",
FloatRegister::sve_vl_min);
UseSVE = 0; UseSVE = 0;
} else if ((MaxVectorSize % 16) == 0 && is_power_of_2(MaxVectorSize)) { } else if (!((MaxVectorSize % FloatRegister::sve_vl_min) == 0 && is_power_of_2(MaxVectorSize))) {
vm_exit_during_initialization(err_msg("Unsupported MaxVectorSize: %d", (int)MaxVectorSize));
}
if (UseSVE > 0) {
// Acquire the largest supported vector length of this machine
_max_supported_sve_vector_length = set_and_get_current_sve_vector_length(FloatRegister::sve_vl_max);
if (MaxVectorSize != _max_supported_sve_vector_length) {
int new_vl = set_and_get_current_sve_vector_length(MaxVectorSize); int new_vl = set_and_get_current_sve_vector_length(MaxVectorSize);
_initial_sve_vector_length = new_vl;
// Update MaxVectorSize to the largest supported value.
if (new_vl < 0) { if (new_vl < 0) {
vm_exit_during_initialization( vm_exit_during_initialization(
err_msg("Current system does not support SVE vector length for MaxVectorSize: %d", err_msg("Current system does not support SVE vector length for MaxVectorSize: %d",
@ -523,14 +532,14 @@ void VM_Version::initialize() {
new_vl, new_vl); new_vl, new_vl);
} }
MaxVectorSize = new_vl; MaxVectorSize = new_vl;
} else { }
vm_exit_during_initialization(err_msg("Unsupported MaxVectorSize: %d", (int)MaxVectorSize)); _initial_sve_vector_length = MaxVectorSize;
} }
} }
if (UseSVE == 0) { // NEON if (UseSVE == 0) { // NEON
int min_vector_size = 8; int min_vector_size = 8;
int max_vector_size = 16; int max_vector_size = FloatRegister::neon_vl;
if (!FLAG_IS_DEFAULT(MaxVectorSize)) { if (!FLAG_IS_DEFAULT(MaxVectorSize)) {
if (!is_power_of_2(MaxVectorSize)) { if (!is_power_of_2(MaxVectorSize)) {
vm_exit_during_initialization(err_msg("Unsupported MaxVectorSize: %d", (int)MaxVectorSize)); vm_exit_during_initialization(err_msg("Unsupported MaxVectorSize: %d", (int)MaxVectorSize));
@ -542,11 +551,11 @@ void VM_Version::initialize() {
FLAG_SET_DEFAULT(MaxVectorSize, max_vector_size); FLAG_SET_DEFAULT(MaxVectorSize, max_vector_size);
} }
} else { } else {
FLAG_SET_DEFAULT(MaxVectorSize, 16); FLAG_SET_DEFAULT(MaxVectorSize, FloatRegister::neon_vl);
} }
} }
int inline_size = (UseSVE > 0 && MaxVectorSize >= 16) ? MaxVectorSize : 0; int inline_size = (UseSVE > 0 && MaxVectorSize >= FloatRegister::sve_vl_min) ? MaxVectorSize : 0;
if (FLAG_IS_DEFAULT(ArrayOperationPartialInlineSize)) { if (FLAG_IS_DEFAULT(ArrayOperationPartialInlineSize)) {
FLAG_SET_DEFAULT(ArrayOperationPartialInlineSize, inline_size); FLAG_SET_DEFAULT(ArrayOperationPartialInlineSize, inline_size);
} else if (ArrayOperationPartialInlineSize != 0 && ArrayOperationPartialInlineSize != inline_size) { } else if (ArrayOperationPartialInlineSize != 0 && ArrayOperationPartialInlineSize != inline_size) {

View File

@ -46,6 +46,7 @@ protected:
static int _dcache_line_size; static int _dcache_line_size;
static int _icache_line_size; static int _icache_line_size;
static int _initial_sve_vector_length; static int _initial_sve_vector_length;
static int _max_supported_sve_vector_length;
static bool _rop_protection; static bool _rop_protection;
static uintptr_t _pac_mask; static uintptr_t _pac_mask;
@ -165,6 +166,7 @@ enum Ampere_CPU_Model {
static int icache_line_size() { return _icache_line_size; } static int icache_line_size() { return _icache_line_size; }
static int dcache_line_size() { return _dcache_line_size; } static int dcache_line_size() { return _dcache_line_size; }
static int get_initial_sve_vector_length() { return _initial_sve_vector_length; }; static int get_initial_sve_vector_length() { return _initial_sve_vector_length; };
static int get_max_supported_sve_vector_length() { return _max_supported_sve_vector_length; };
// Aarch64 supports fast class initialization checks // Aarch64 supports fast class initialization checks
static bool supports_fast_class_init_checks() { return true; } static bool supports_fast_class_init_checks() { return true; }