;; -------------------------------------------------------------------------
(define_insn_and_split "<optab><mode>3"
- [(set (match_operand:VI 0 "register_operand" "=vr")
- (any_shift:VI
- (match_operand:VI 1 "register_operand" " vr")
+ [(set (match_operand:V_VLSI 0 "register_operand" "=vr")
+ (any_shift:V_VLSI
+ (match_operand:V_VLSI 1 "register_operand" " vr")
(match_operand:<VEL> 2 "csr_operand" " rK")))]
"TARGET_VECTOR && can_create_pseudo_p ()"
"#"
;; -------------------------------------------------------------------------
(define_insn_and_split "v<optab><mode>3"
- [(set (match_operand:VI 0 "register_operand" "=vr,vr")
- (any_shift:VI
- (match_operand:VI 1 "register_operand" " vr,vr")
- (match_operand:VI 2 "vector_shift_operand" " vr,vk")))]
+ [(set (match_operand:V_VLSI 0 "register_operand" "=vr,vr")
+ (any_shift:V_VLSI
+ (match_operand:V_VLSI 1 "register_operand" " vr,vr")
+ (match_operand:V_VLSI 2 "vector_shift_operand" " vr,vk")))]
"TARGET_VECTOR && can_create_pseudo_p ()"
"#"
"&& 1"
for (int i = 0; i < NUM; ++i) \
a[i] = b[i] OP c[i] ? b[i] : c[i]; \
}
+
+#define DEF_OP_VI_7(PREFIX, NUM, TYPE, OP) \
+ void __attribute__ ((noinline, noclone)) \
+ PREFIX##_##TYPE##NUM (TYPE *restrict a, TYPE *restrict b, TYPE *restrict c) \
+ { \
+ for (int i = 0; i < NUM; ++i) \
+ a[i] = b[i] OP 7; \
+ }
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 -fno-schedule-insns -fno-schedule-insns2 --param=riscv-autovec-lmul=m8" } */
+
+#include "def.h"
+
+DEF_OP_VV (shift, 1, int8_t, >>)
+DEF_OP_VV (shift, 2, int8_t, >>)
+DEF_OP_VV (shift, 4, int8_t, >>)
+DEF_OP_VV (shift, 8, int8_t, >>)
+DEF_OP_VV (shift, 16, int8_t, >>)
+DEF_OP_VV (shift, 32, int8_t, >>)
+DEF_OP_VV (shift, 64, int8_t, >>)
+DEF_OP_VV (shift, 128, int8_t, >>)
+DEF_OP_VV (shift, 256, int8_t, >>)
+DEF_OP_VV (shift, 512, int8_t, >>)
+DEF_OP_VV (shift, 1024, int8_t, >>)
+DEF_OP_VV (shift, 2048, int8_t, >>)
+DEF_OP_VV (shift, 4096, int8_t, >>)
+
+DEF_OP_VV (shift, 1, int16_t, >>)
+DEF_OP_VV (shift, 2, int16_t, >>)
+DEF_OP_VV (shift, 4, int16_t, >>)
+DEF_OP_VV (shift, 8, int16_t, >>)
+DEF_OP_VV (shift, 16, int16_t, >>)
+DEF_OP_VV (shift, 32, int16_t, >>)
+DEF_OP_VV (shift, 64, int16_t, >>)
+DEF_OP_VV (shift, 128, int16_t, >>)
+DEF_OP_VV (shift, 256, int16_t, >>)
+DEF_OP_VV (shift, 512, int16_t, >>)
+DEF_OP_VV (shift, 1024, int16_t, >>)
+DEF_OP_VV (shift, 2048, int16_t, >>)
+
+DEF_OP_VV (shift, 1, int32_t, >>)
+DEF_OP_VV (shift, 2, int32_t, >>)
+DEF_OP_VV (shift, 4, int32_t, >>)
+DEF_OP_VV (shift, 8, int32_t, >>)
+DEF_OP_VV (shift, 16, int32_t, >>)
+DEF_OP_VV (shift, 32, int32_t, >>)
+DEF_OP_VV (shift, 64, int32_t, >>)
+DEF_OP_VV (shift, 128, int32_t, >>)
+DEF_OP_VV (shift, 256, int32_t, >>)
+DEF_OP_VV (shift, 512, int32_t, >>)
+DEF_OP_VV (shift, 1024, int32_t, >>)
+
+DEF_OP_VV (shift, 1, int64_t, >>)
+DEF_OP_VV (shift, 2, int64_t, >>)
+DEF_OP_VV (shift, 4, int64_t, >>)
+DEF_OP_VV (shift, 8, int64_t, >>)
+DEF_OP_VV (shift, 16, int64_t, >>)
+DEF_OP_VV (shift, 32, int64_t, >>)
+DEF_OP_VV (shift, 64, int64_t, >>)
+DEF_OP_VV (shift, 128, int64_t, >>)
+DEF_OP_VV (shift, 256, int64_t, >>)
+DEF_OP_VV (shift, 512, int64_t, >>)
+
+/* { dg-final { scan-assembler-times {vsra\.vv\s+v[0-9]+,\s*v[0-9]+,\s*v[0-9]+} 39 } } */
+/* { dg-final { scan-assembler-not {csrr} } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 -fno-schedule-insns -fno-schedule-insns2 --param=riscv-autovec-lmul=m8" } */
+
+#include "def.h"
+
+DEF_OP_VV (shift, 1, uint8_t, >>)
+DEF_OP_VV (shift, 2, uint8_t, >>)
+DEF_OP_VV (shift, 4, uint8_t, >>)
+DEF_OP_VV (shift, 8, uint8_t, >>)
+DEF_OP_VV (shift, 16, uint8_t, >>)
+DEF_OP_VV (shift, 32, uint8_t, >>)
+DEF_OP_VV (shift, 64, uint8_t, >>)
+DEF_OP_VV (shift, 128, uint8_t, >>)
+DEF_OP_VV (shift, 256, uint8_t, >>)
+DEF_OP_VV (shift, 512, uint8_t, >>)
+DEF_OP_VV (shift, 1024, uint8_t, >>)
+DEF_OP_VV (shift, 2048, uint8_t, >>)
+DEF_OP_VV (shift, 4096, uint8_t, >>)
+
+DEF_OP_VV (shift, 1, uint16_t, >>)
+DEF_OP_VV (shift, 2, uint16_t, >>)
+DEF_OP_VV (shift, 4, uint16_t, >>)
+DEF_OP_VV (shift, 8, uint16_t, >>)
+DEF_OP_VV (shift, 16, uint16_t, >>)
+DEF_OP_VV (shift, 32, uint16_t, >>)
+DEF_OP_VV (shift, 64, uint16_t, >>)
+DEF_OP_VV (shift, 128, uint16_t, >>)
+DEF_OP_VV (shift, 256, uint16_t, >>)
+DEF_OP_VV (shift, 512, uint16_t, >>)
+DEF_OP_VV (shift, 1024, uint16_t, >>)
+DEF_OP_VV (shift, 2048, uint16_t, >>)
+
+DEF_OP_VV (shift, 1, uint32_t, >>)
+DEF_OP_VV (shift, 2, uint32_t, >>)
+DEF_OP_VV (shift, 4, uint32_t, >>)
+DEF_OP_VV (shift, 8, uint32_t, >>)
+DEF_OP_VV (shift, 16, uint32_t, >>)
+DEF_OP_VV (shift, 32, uint32_t, >>)
+DEF_OP_VV (shift, 64, uint32_t, >>)
+DEF_OP_VV (shift, 128, uint32_t, >>)
+DEF_OP_VV (shift, 256, uint32_t, >>)
+DEF_OP_VV (shift, 512, uint32_t, >>)
+DEF_OP_VV (shift, 1024, uint32_t, >>)
+
+DEF_OP_VV (shift, 1, uint64_t, >>)
+DEF_OP_VV (shift, 2, uint64_t, >>)
+DEF_OP_VV (shift, 4, uint64_t, >>)
+DEF_OP_VV (shift, 8, uint64_t, >>)
+DEF_OP_VV (shift, 16, uint64_t, >>)
+DEF_OP_VV (shift, 32, uint64_t, >>)
+DEF_OP_VV (shift, 64, uint64_t, >>)
+DEF_OP_VV (shift, 128, uint64_t, >>)
+DEF_OP_VV (shift, 256, uint64_t, >>)
+DEF_OP_VV (shift, 512, uint64_t, >>)
+
+/* { dg-final { scan-assembler-times {vsrl\.vv\s+v[0-9]+,\s*v[0-9]+,\s*v[0-9]+} 39 } } */
+/* { dg-final { scan-assembler-not {csrr} } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 -fno-schedule-insns -fno-schedule-insns2 --param=riscv-autovec-lmul=m8" } */
+
+#include "def.h"
+
+DEF_OP_VV (shift, 1, int8_t, <<)
+DEF_OP_VV (shift, 2, int8_t, <<)
+DEF_OP_VV (shift, 4, int8_t, <<)
+DEF_OP_VV (shift, 8, int8_t, <<)
+DEF_OP_VV (shift, 16, int8_t, <<)
+DEF_OP_VV (shift, 32, int8_t, <<)
+DEF_OP_VV (shift, 64, int8_t, <<)
+DEF_OP_VV (shift, 128, int8_t, <<)
+DEF_OP_VV (shift, 256, int8_t, <<)
+DEF_OP_VV (shift, 512, int8_t, <<)
+DEF_OP_VV (shift, 1024, int8_t, <<)
+DEF_OP_VV (shift, 2048, int8_t, <<)
+DEF_OP_VV (shift, 4096, int8_t, <<)
+
+DEF_OP_VV (shift, 1, int16_t, <<)
+DEF_OP_VV (shift, 2, int16_t, <<)
+DEF_OP_VV (shift, 4, int16_t, <<)
+DEF_OP_VV (shift, 8, int16_t, <<)
+DEF_OP_VV (shift, 16, int16_t, <<)
+DEF_OP_VV (shift, 32, int16_t, <<)
+DEF_OP_VV (shift, 64, int16_t, <<)
+DEF_OP_VV (shift, 128, int16_t, <<)
+DEF_OP_VV (shift, 256, int16_t, <<)
+DEF_OP_VV (shift, 512, int16_t, <<)
+DEF_OP_VV (shift, 1024, int16_t, <<)
+DEF_OP_VV (shift, 2048, int16_t, <<)
+
+DEF_OP_VV (shift, 1, int32_t, <<)
+DEF_OP_VV (shift, 2, int32_t, <<)
+DEF_OP_VV (shift, 4, int32_t, <<)
+DEF_OP_VV (shift, 8, int32_t, <<)
+DEF_OP_VV (shift, 16, int32_t, <<)
+DEF_OP_VV (shift, 32, int32_t, <<)
+DEF_OP_VV (shift, 64, int32_t, <<)
+DEF_OP_VV (shift, 128, int32_t, <<)
+DEF_OP_VV (shift, 256, int32_t, <<)
+DEF_OP_VV (shift, 512, int32_t, <<)
+DEF_OP_VV (shift, 1024, int32_t, <<)
+
+DEF_OP_VV (shift, 1, int64_t, <<)
+DEF_OP_VV (shift, 2, int64_t, <<)
+DEF_OP_VV (shift, 4, int64_t, <<)
+DEF_OP_VV (shift, 8, int64_t, <<)
+DEF_OP_VV (shift, 16, int64_t, <<)
+DEF_OP_VV (shift, 32, int64_t, <<)
+DEF_OP_VV (shift, 64, int64_t, <<)
+DEF_OP_VV (shift, 128, int64_t, <<)
+DEF_OP_VV (shift, 256, int64_t, <<)
+DEF_OP_VV (shift, 512, int64_t, <<)
+
+/* { dg-final { scan-assembler-times {vsll\.vv\s+v[0-9]+,\s*v[0-9]+,\s*v[0-9]+} 41 } } */
+/* TODO: Ideally, we should make sure there is no "csrr vlenb". However, we still have 'csrr vlenb' for some cases since we don't support VLS mode conversion which are needed by division. */
+/* { dg-final { scan-assembler-times {csrr} 18 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 -fno-schedule-insns -fno-schedule-insns2 --param=riscv-autovec-lmul=m8" } */
+
+#include "def.h"
+
+DEF_OP_VI_7 (shift, 1, int8_t, >>)
+DEF_OP_VI_7 (shift, 2, int8_t, >>)
+DEF_OP_VI_7 (shift, 4, int8_t, >>)
+DEF_OP_VI_7 (shift, 8, int8_t, >>)
+DEF_OP_VI_7 (shift, 16, int8_t, >>)
+DEF_OP_VI_7 (shift, 32, int8_t, >>)
+DEF_OP_VI_7 (shift, 64, int8_t, >>)
+DEF_OP_VI_7 (shift, 128, int8_t, >>)
+DEF_OP_VI_7 (shift, 256, int8_t, >>)
+DEF_OP_VI_7 (shift, 512, int8_t, >>)
+DEF_OP_VI_7 (shift, 1024, int8_t, >>)
+DEF_OP_VI_7 (shift, 2048, int8_t, >>)
+DEF_OP_VI_7 (shift, 4096, int8_t, >>)
+
+DEF_OP_VI_7 (shift, 1, int16_t, >>)
+DEF_OP_VI_7 (shift, 2, int16_t, >>)
+DEF_OP_VI_7 (shift, 4, int16_t, >>)
+DEF_OP_VI_7 (shift, 8, int16_t, >>)
+DEF_OP_VI_7 (shift, 16, int16_t, >>)
+DEF_OP_VI_7 (shift, 32, int16_t, >>)
+DEF_OP_VI_7 (shift, 64, int16_t, >>)
+DEF_OP_VI_7 (shift, 128, int16_t, >>)
+DEF_OP_VI_7 (shift, 256, int16_t, >>)
+DEF_OP_VI_7 (shift, 512, int16_t, >>)
+DEF_OP_VI_7 (shift, 1024, int16_t, >>)
+DEF_OP_VI_7 (shift, 2048, int16_t, >>)
+
+DEF_OP_VI_7 (shift, 1, int32_t, >>)
+DEF_OP_VI_7 (shift, 2, int32_t, >>)
+DEF_OP_VI_7 (shift, 4, int32_t, >>)
+DEF_OP_VI_7 (shift, 8, int32_t, >>)
+DEF_OP_VI_7 (shift, 16, int32_t, >>)
+DEF_OP_VI_7 (shift, 32, int32_t, >>)
+DEF_OP_VI_7 (shift, 64, int32_t, >>)
+DEF_OP_VI_7 (shift, 128, int32_t, >>)
+DEF_OP_VI_7 (shift, 256, int32_t, >>)
+DEF_OP_VI_7 (shift, 512, int32_t, >>)
+DEF_OP_VI_7 (shift, 1024, int32_t, >>)
+
+DEF_OP_VI_7 (shift, 1, int64_t, >>)
+DEF_OP_VI_7 (shift, 2, int64_t, >>)
+DEF_OP_VI_7 (shift, 4, int64_t, >>)
+DEF_OP_VI_7 (shift, 8, int64_t, >>)
+DEF_OP_VI_7 (shift, 16, int64_t, >>)
+DEF_OP_VI_7 (shift, 32, int64_t, >>)
+DEF_OP_VI_7 (shift, 64, int64_t, >>)
+DEF_OP_VI_7 (shift, 128, int64_t, >>)
+DEF_OP_VI_7 (shift, 256, int64_t, >>)
+DEF_OP_VI_7 (shift, 512, int64_t, >>)
+
+/* { dg-final { scan-assembler-times {vsra\.vi\s+v[0-9]+,\s*v[0-9]+,\s*7} 42 } } */
+/* { dg-final { scan-assembler-not {csrr} } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 -fno-schedule-insns -fno-schedule-insns2 --param=riscv-autovec-lmul=m8" } */
+
+#include "def.h"
+
+DEF_OP_VI_7 (shift, 1, uint8_t, >>)
+DEF_OP_VI_7 (shift, 2, uint8_t, >>)
+DEF_OP_VI_7 (shift, 4, uint8_t, >>)
+DEF_OP_VI_7 (shift, 8, uint8_t, >>)
+DEF_OP_VI_7 (shift, 16, uint8_t, >>)
+DEF_OP_VI_7 (shift, 32, uint8_t, >>)
+DEF_OP_VI_7 (shift, 64, uint8_t, >>)
+DEF_OP_VI_7 (shift, 128, uint8_t, >>)
+DEF_OP_VI_7 (shift, 256, uint8_t, >>)
+DEF_OP_VI_7 (shift, 512, uint8_t, >>)
+DEF_OP_VI_7 (shift, 1024, uint8_t, >>)
+DEF_OP_VI_7 (shift, 2048, uint8_t, >>)
+DEF_OP_VI_7 (shift, 4096, uint8_t, >>)
+
+DEF_OP_VI_7 (shift, 1, uint16_t, >>)
+DEF_OP_VI_7 (shift, 2, uint16_t, >>)
+DEF_OP_VI_7 (shift, 4, uint16_t, >>)
+DEF_OP_VI_7 (shift, 8, uint16_t, >>)
+DEF_OP_VI_7 (shift, 16, uint16_t, >>)
+DEF_OP_VI_7 (shift, 32, uint16_t, >>)
+DEF_OP_VI_7 (shift, 64, uint16_t, >>)
+DEF_OP_VI_7 (shift, 128, uint16_t, >>)
+DEF_OP_VI_7 (shift, 256, uint16_t, >>)
+DEF_OP_VI_7 (shift, 512, uint16_t, >>)
+DEF_OP_VI_7 (shift, 1024, uint16_t, >>)
+DEF_OP_VI_7 (shift, 2048, uint16_t, >>)
+
+DEF_OP_VI_7 (shift, 1, uint32_t, >>)
+DEF_OP_VI_7 (shift, 2, uint32_t, >>)
+DEF_OP_VI_7 (shift, 4, uint32_t, >>)
+DEF_OP_VI_7 (shift, 8, uint32_t, >>)
+DEF_OP_VI_7 (shift, 16, uint32_t, >>)
+DEF_OP_VI_7 (shift, 32, uint32_t, >>)
+DEF_OP_VI_7 (shift, 64, uint32_t, >>)
+DEF_OP_VI_7 (shift, 128, uint32_t, >>)
+DEF_OP_VI_7 (shift, 256, uint32_t, >>)
+DEF_OP_VI_7 (shift, 512, uint32_t, >>)
+DEF_OP_VI_7 (shift, 1024, uint32_t, >>)
+
+DEF_OP_VI_7 (shift, 1, uint64_t, >>)
+DEF_OP_VI_7 (shift, 2, uint64_t, >>)
+DEF_OP_VI_7 (shift, 4, uint64_t, >>)
+DEF_OP_VI_7 (shift, 8, uint64_t, >>)
+DEF_OP_VI_7 (shift, 16, uint64_t, >>)
+DEF_OP_VI_7 (shift, 32, uint64_t, >>)
+DEF_OP_VI_7 (shift, 64, uint64_t, >>)
+DEF_OP_VI_7 (shift, 128, uint64_t, >>)
+DEF_OP_VI_7 (shift, 256, uint64_t, >>)
+DEF_OP_VI_7 (shift, 512, uint64_t, >>)
+
+/* { dg-final { scan-assembler-times {vsrl\.vi\s+v[0-9]+,\s*v[0-9]+,\s*7} 42 } } */
+/* { dg-final { scan-assembler-not {csrr} } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 -fno-schedule-insns -fno-schedule-insns2 --param=riscv-autovec-lmul=m8" } */
+
+#include "def.h"
+
+DEF_OP_VI_7 (shift, 1, int8_t, <<)
+DEF_OP_VI_7 (shift, 2, int8_t, <<)
+DEF_OP_VI_7 (shift, 4, int8_t, <<)
+DEF_OP_VI_7 (shift, 8, int8_t, <<)
+DEF_OP_VI_7 (shift, 16, int8_t, <<)
+DEF_OP_VI_7 (shift, 32, int8_t, <<)
+DEF_OP_VI_7 (shift, 64, int8_t, <<)
+DEF_OP_VI_7 (shift, 128, int8_t, <<)
+DEF_OP_VI_7 (shift, 256, int8_t, <<)
+DEF_OP_VI_7 (shift, 512, int8_t, <<)
+DEF_OP_VI_7 (shift, 1024, int8_t, <<)
+DEF_OP_VI_7 (shift, 2048, int8_t, <<)
+DEF_OP_VI_7 (shift, 4096, int8_t, <<)
+
+DEF_OP_VI_7 (shift, 1, int16_t, <<)
+DEF_OP_VI_7 (shift, 2, int16_t, <<)
+DEF_OP_VI_7 (shift, 4, int16_t, <<)
+DEF_OP_VI_7 (shift, 8, int16_t, <<)
+DEF_OP_VI_7 (shift, 16, int16_t, <<)
+DEF_OP_VI_7 (shift, 32, int16_t, <<)
+DEF_OP_VI_7 (shift, 64, int16_t, <<)
+DEF_OP_VI_7 (shift, 128, int16_t, <<)
+DEF_OP_VI_7 (shift, 256, int16_t, <<)
+DEF_OP_VI_7 (shift, 512, int16_t, <<)
+DEF_OP_VI_7 (shift, 1024, int16_t, <<)
+DEF_OP_VI_7 (shift, 2048, int16_t, <<)
+
+DEF_OP_VI_7 (shift, 1, int32_t, <<)
+DEF_OP_VI_7 (shift, 2, int32_t, <<)
+DEF_OP_VI_7 (shift, 4, int32_t, <<)
+DEF_OP_VI_7 (shift, 8, int32_t, <<)
+DEF_OP_VI_7 (shift, 16, int32_t, <<)
+DEF_OP_VI_7 (shift, 32, int32_t, <<)
+DEF_OP_VI_7 (shift, 64, int32_t, <<)
+DEF_OP_VI_7 (shift, 128, int32_t, <<)
+DEF_OP_VI_7 (shift, 256, int32_t, <<)
+DEF_OP_VI_7 (shift, 512, int32_t, <<)
+DEF_OP_VI_7 (shift, 1024, int32_t, <<)
+
+DEF_OP_VI_7 (shift, 1, int64_t, <<)
+DEF_OP_VI_7 (shift, 2, int64_t, <<)
+DEF_OP_VI_7 (shift, 4, int64_t, <<)
+DEF_OP_VI_7 (shift, 8, int64_t, <<)
+DEF_OP_VI_7 (shift, 16, int64_t, <<)
+DEF_OP_VI_7 (shift, 32, int64_t, <<)
+DEF_OP_VI_7 (shift, 64, int64_t, <<)
+DEF_OP_VI_7 (shift, 128, int64_t, <<)
+DEF_OP_VI_7 (shift, 256, int64_t, <<)
+DEF_OP_VI_7 (shift, 512, int64_t, <<)
+
+/* { dg-final { scan-assembler-times {vsll\.vi\s+v[0-9]+,\s*v[0-9]+,\s*7} 42 } } */
+/* { dg-final { scan-assembler-not {csrr} } } */