diff --git a/gcc/config/riscv/riscv-vsetvl.cc b/gcc/config/riscv/riscv-vsetvl.cc index b3e07d4c3aace01e7f6549d319ce885322212572..1da95daeeb0313939c5fe0da5572f86163547e3d 100644 --- a/gcc/config/riscv/riscv-vsetvl.cc +++ b/gcc/config/riscv/riscv-vsetvl.cc @@ -1497,9 +1497,6 @@ private: { gcc_assert (prev.valid_p () && next.valid_p ()); - if (prev.get_ratio () != next.get_ratio ()) - return false; - if (next.has_vl () && next.vl_used_by_non_rvv_insn_p ()) return false; @@ -2188,7 +2185,7 @@ private: return true; } - bool preds_has_same_avl_p (const vsetvl_info &curr_info) + bool preds_all_same_avl_and_ratio_p (const vsetvl_info &curr_info) { gcc_assert ( !bitmap_empty_p (m_vsetvl_def_in[curr_info.get_bb ()->index ()])); @@ -2200,7 +2197,8 @@ private: { const vsetvl_info &prev_info = *m_vsetvl_def_exprs[expr_index]; if (!prev_info.valid_p () - || !m_dem.avl_available_p (prev_info, curr_info)) + || !m_dem.avl_available_p (prev_info, curr_info) + || prev_info.get_ratio () != curr_info.get_ratio ()) return false; } @@ -3171,7 +3169,7 @@ pre_vsetvl::pre_global_vsetvl_info () curr_info = block_info.local_infos[0]; } if (curr_info.valid_p () && !curr_info.vl_used_by_non_rvv_insn_p () - && preds_has_same_avl_p (curr_info)) + && preds_all_same_avl_and_ratio_p (curr_info)) curr_info.set_change_vtype_only (); vsetvl_info prev_info = vsetvl_info (); @@ -3179,7 +3177,8 @@ pre_vsetvl::pre_global_vsetvl_info () for (auto &curr_info : block_info.local_infos) { if (prev_info.valid_p () && curr_info.valid_p () - && m_dem.avl_available_p (prev_info, curr_info)) + && m_dem.avl_available_p (prev_info, curr_info) + && prev_info.get_ratio () == curr_info.get_ratio ()) curr_info.set_change_vtype_only (); prev_info = curr_info; } diff --git a/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/avl_single-84.c b/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/avl_single-84.c index a584dd97dc033865275add2ba1650b9565e87440..5cd0f285029035b8a39d3112c8544bdd3566eb1d 100644 --- a/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/avl_single-84.c +++ b/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/avl_single-84.c @@ -17,6 +17,6 @@ double f0 (int8_t * restrict in, int8_t * restrict out, int n, int m, unsigned c } /* { dg-final { scan-assembler-times {vsetvli\s+[a-x0-9]+,\s*zero,\s*e8,\s*m2,\s*t[au],\s*m[au]} 1 { target { no-opts "-O0" no-opts "-Os" no-opts "-Oz" no-opts "-O1" no-opts "-g" no-opts "-funroll-loops" } } } } */ -/* { dg-final { scan-assembler-times {vsetvli\s+zero,\s*zero,\s*e64,\s*m1,\s*t[au],\s*m[au]} 2 { target { no-opts "-O0" no-opts "-Os" no-opts "-Oz" no-opts "-O1" no-opts "-g" no-opts "-funroll-loops" } } } } */ -/* { dg-final { scan-assembler-times {vsetvli} 3 { target { no-opts "-O0" no-opts "-O1" no-opts "-Os" no-opts "-Oz" no-opts "-g" no-opts "-funroll-loops" } } } } */ - +/* { dg-final { scan-assembler-not {vsetvli\s+zero,\s*zero} { target { no-opts "-O0" no-opts "-Os" no-opts "-Oz" no-opts "-O1" no-opts "-g" no-opts "-funroll-loops" } } } } */ +/* { dg-final { scan-assembler-times {vsetvli} 1 { target { no-opts "-O0" no-opts "-O1" no-opts "-Os" no-opts "-Oz" no-opts "-g" no-opts "-funroll-loops" } } } } */ +/* { dg-final { scan-assembler-times {vsetivli} 2 { target { no-opts "-O0" no-opts "-O1" no-opts "-Os" no-opts "-Oz" no-opts "-g" no-opts "-funroll-loops" } } } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/pr111037-3.c b/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/pr111037-3.c index 0f40642c8b6174d1eb66ff3142ffaf8c0ff8c30b..13344ecdd3ba8349023047d8b7915637477073a9 100644 --- a/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/pr111037-3.c +++ b/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/pr111037-3.c @@ -13,4 +13,4 @@ void foo(_Float16 y, int16_t z, int64_t *i64p) } /* { dg-final { scan-assembler-times {vsetivli\s+zero,\s*1,\s*e64,\s*m1,\s*t[au],\s*m[au]} 1 } } */ -/* { dg-final { scan-assembler-times {vsetvli\s+zero,\s*zero,\s*e16,\s*m1,\s*t[au],\s*m[au]} 1 } } */ +/* { dg-final { scan-assembler-times {vsetivli\s+zero,\s*1,\s*e16,\s*m1,\s*t[au],\s*m[au]} 1 } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/pr112776.c b/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/pr112776.c new file mode 100644 index 0000000000000000000000000000000000000000..853690178ace4b93d2e800b03c37d2c249eea44c --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/vsetvl/pr112776.c @@ -0,0 +1,36 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3" } */ + +#include "riscv_vector.h" + +void +foo (float *r, const float *x) +{ + int i, k; + + vfloat32m4_t x_vec; + vfloat32m4_t x_forward_vec; + vfloat32m4_t temp_vec; + vfloat32m1_t dst_vec; + vfloat32m1_t src_vec; + + float result = 0.0f; + float shift_prev = 0.0f; + + size_t n = 64; + for (size_t vl; n > 0; n -= vl) + { + vl = __riscv_vsetvl_e32m4 (n); + x_vec = __riscv_vle32_v_f32m4 (&x[0], vl); + x_forward_vec = __riscv_vle32_v_f32m4 (&x[0], vl); + temp_vec = __riscv_vfmul_vv_f32m4 (x_vec, x_forward_vec, vl); + src_vec = __riscv_vfmv_s_tu (src_vec, 0.0f, vl); + dst_vec = __riscv_vfmv_s_tu (dst_vec, 0.0f, vl); + dst_vec = __riscv_vfredosum_tu (dst_vec, temp_vec, src_vec, vl); + r[0] = __riscv_vfmv_f_s_f32m1_f32 (dst_vec); + } +} + +/* { dg-final { scan-assembler-times {vsetvli} 1 } } */ +/* { dg-final { scan-assembler-not {vsetivli} } } */ +/* { dg-final { scan-assembler-times {vsetvli\t[a-x0-9]+,\s*[a-x0-9]+,\s*e32,\s*m4,\s*tu,\s*m[au]} 1 } } */