Skip to content

Commit 6fd182a

Browse files
authored
[RISCV] Support fixed vector vp.reverse/splice with Zvfhmin/Zvfbfmin. (#145596)
Fix the names of some tests I accidentally misspelled.
1 parent e8abdfc commit 6fd182a

File tree

4 files changed

+98
-11
lines changed

4 files changed

+98
-11
lines changed

llvm/lib/Target/RISCV/RISCVISelLowering.cpp

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -756,8 +756,7 @@ RISCVTargetLowering::RISCVTargetLowering(const TargetMachine &TM,
756756
ISD::VP_FROUNDEVEN, ISD::VP_FCOPYSIGN, ISD::VP_FROUNDTOZERO,
757757
ISD::VP_FRINT, ISD::VP_FNEARBYINT, ISD::VP_IS_FPCLASS,
758758
ISD::VP_FMINIMUM, ISD::VP_FMAXIMUM, ISD::VP_LRINT,
759-
ISD::VP_LLRINT, ISD::EXPERIMENTAL_VP_REVERSE,
760-
ISD::EXPERIMENTAL_VP_SPLICE, ISD::VP_REDUCE_FMINIMUM,
759+
ISD::VP_LLRINT, ISD::VP_REDUCE_FMINIMUM,
761760
ISD::VP_REDUCE_FMAXIMUM, ISD::EXPERIMENTAL_VP_SPLAT};
762761

763762
static const unsigned IntegerVecReduceOps[] = {
@@ -1112,6 +1111,8 @@ RISCVTargetLowering::RISCVTargetLowering(const TargetMachine &TM,
11121111
setOperationAction(ISD::VECTOR_INTERLEAVE, VT, Custom);
11131112

11141113
setOperationAction({ISD::VECTOR_REVERSE, ISD::VECTOR_SPLICE}, VT, Custom);
1114+
setOperationAction(ISD::EXPERIMENTAL_VP_SPLICE, VT, Custom);
1115+
setOperationAction(ISD::EXPERIMENTAL_VP_REVERSE, VT, Custom);
11151116

11161117
setOperationAction(FloatingPointVPOps, VT, Custom);
11171118

@@ -1420,6 +1421,8 @@ RISCVTargetLowering::RISCVTargetLowering(const TargetMachine &TM,
14201421
ISD::EXTRACT_SUBVECTOR, ISD::VECTOR_REVERSE,
14211422
ISD::VECTOR_SHUFFLE, ISD::VECTOR_COMPRESS},
14221423
VT, Custom);
1424+
setOperationAction(ISD::EXPERIMENTAL_VP_SPLICE, VT, Custom);
1425+
setOperationAction(ISD::EXPERIMENTAL_VP_REVERSE, VT, Custom);
14231426

14241427
setOperationAction({ISD::VECTOR_INTERLEAVE, ISD::VECTOR_DEINTERLEAVE},
14251428
VT, Custom);

llvm/test/CodeGen/RISCV/rvv/fixed-vectors-vp-reverser-float.ll renamed to llvm/test/CodeGen/RISCV/rvv/fixed-vectors-vp-reverse-float.ll

Lines changed: 32 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,7 @@
11
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2-
; RUN: llc -mtriple=riscv64 -mattr=+m,+f,+d,+v,+zvfh -verify-machineinstrs -riscv-v-vector-bits-min=128 \
2+
; RUN: llc -mtriple=riscv64 -mattr=+m,+f,+d,+v,+zvfh,+zvfbfmin -verify-machineinstrs -riscv-v-vector-bits-min=128 \
3+
; RUN: < %s | FileCheck %s
4+
; RUN: llc -mtriple=riscv64 -mattr=+m,+f,+d,+v,+zvfhmin,+zvfbfmin -verify-machineinstrs -riscv-v-vector-bits-min=128 \
35
; RUN: < %s | FileCheck %s
46

57
define <2 x double> @test_vp_reverse_v2f64_masked(<2 x double> %src, <2 x i1> %mask, i32 zeroext %evl) {
@@ -88,3 +90,32 @@ define <4 x half> @test_vp_reverse_v4f16(<4 x half> %src, i32 zeroext %evl) {
8890
%dst = call <4 x half> @llvm.experimental.vp.reverse.v4f16(<4 x half> %src, <4 x i1> splat (i1 1), i32 %evl)
8991
ret <4 x half> %dst
9092
}
93+
94+
define <4 x bfloat> @test_vp_reverse_v4bf16_masked(<4 x bfloat> %src, <4 x i1> %mask, i32 zeroext %evl) {
95+
; CHECK-LABEL: test_vp_reverse_v4bf16_masked:
96+
; CHECK: # %bb.0:
97+
; CHECK-NEXT: vsetvli zero, a0, e16, mf2, ta, ma
98+
; CHECK-NEXT: vid.v v9, v0.t
99+
; CHECK-NEXT: addi a0, a0, -1
100+
; CHECK-NEXT: vrsub.vx v10, v9, a0, v0.t
101+
; CHECK-NEXT: vrgather.vv v9, v8, v10, v0.t
102+
; CHECK-NEXT: vmv1r.v v8, v9
103+
; CHECK-NEXT: ret
104+
%dst = call <4 x bfloat> @llvm.experimental.vp.reverse.v4bf16(<4 x bfloat> %src, <4 x i1> %mask, i32 %evl)
105+
ret <4 x bfloat> %dst
106+
}
107+
108+
define <4 x bfloat> @test_vp_reverse_v4bf16(<4 x bfloat> %src, i32 zeroext %evl) {
109+
; CHECK-LABEL: test_vp_reverse_v4bf16:
110+
; CHECK: # %bb.0:
111+
; CHECK-NEXT: addi a1, a0, -1
112+
; CHECK-NEXT: vsetvli zero, a0, e16, mf2, ta, ma
113+
; CHECK-NEXT: vid.v v9
114+
; CHECK-NEXT: vrsub.vx v10, v9, a1
115+
; CHECK-NEXT: vrgather.vv v9, v8, v10
116+
; CHECK-NEXT: vmv1r.v v8, v9
117+
; CHECK-NEXT: ret
118+
119+
%dst = call <4 x bfloat> @llvm.experimental.vp.reverse.v4bf16(<4 x bfloat> %src, <4 x i1> splat (i1 1), i32 %evl)
120+
ret <4 x bfloat> %dst
121+
}

llvm/test/CodeGen/RISCV/rvv/fixed-vectors-vp-splice.ll

Lines changed: 61 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,8 @@
11
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2-
; RUN: llc -mtriple riscv64 -mattr=+f,+d,+v,+zvfh -verify-machineinstrs -riscv-v-vector-bits-min=128 \
3-
; RUN: < %s | FileCheck %s
2+
; RUN: llc -mtriple riscv64 -mattr=+f,+d,+v,+zvfh,+zvfbfmin -verify-machineinstrs -riscv-v-vector-bits-min=128 \
3+
; RUN: < %s | FileCheck %s --check-prefixes=CHECK,ZVFH
4+
; RUN: llc -mtriple riscv64 -mattr=+f,+d,+v,+zvfhmin,+zvfbfmin -verify-machineinstrs -riscv-v-vector-bits-min=128 \
5+
; RUN: < %s | FileCheck %s --check-prefixes=CHECK,ZVFHMIN
46

57
define <2 x i64> @test_vp_splice_v2i64(<2 x i64> %va, <2 x i64> %vb, i32 zeroext %evla, i32 zeroext %evlb) {
68
; CHECK-LABEL: test_vp_splice_v2i64:
@@ -338,13 +340,64 @@ define <4 x float> @test_vp_splice_nxv2f32_with_firstelt(float %first, <4 x floa
338340
}
339341

340342
define <4 x half> @test_vp_splice_nxv2f16_with_firstelt(half %first, <4 x half> %vb, <4 x i1> %mask, i32 zeroext %evl) {
341-
; CHECK-LABEL: test_vp_splice_nxv2f16_with_firstelt:
342-
; CHECK: # %bb.0:
343-
; CHECK-NEXT: vsetvli zero, a0, e16, mf2, ta, ma
344-
; CHECK-NEXT: vfslide1up.vf v9, v8, fa0, v0.t
345-
; CHECK-NEXT: vmv1r.v v8, v9
346-
; CHECK-NEXT: ret
343+
; ZVFH-LABEL: test_vp_splice_nxv2f16_with_firstelt:
344+
; ZVFH: # %bb.0:
345+
; ZVFH-NEXT: vsetvli zero, a0, e16, mf2, ta, ma
346+
; ZVFH-NEXT: vfslide1up.vf v9, v8, fa0, v0.t
347+
; ZVFH-NEXT: vmv1r.v v8, v9
348+
; ZVFH-NEXT: ret
349+
;
350+
; ZVFHMIN-LABEL: test_vp_splice_nxv2f16_with_firstelt:
351+
; ZVFHMIN: # %bb.0:
352+
; ZVFHMIN-NEXT: fmv.x.w a1, fa0
353+
; ZVFHMIN-NEXT: vsetivli zero, 4, e16, m1, ta, ma
354+
; ZVFHMIN-NEXT: vmv.s.x v9, a1
355+
; ZVFHMIN-NEXT: vsetvli zero, a0, e16, mf2, ta, mu
356+
; ZVFHMIN-NEXT: vslideup.vi v9, v8, 1, v0.t
357+
; ZVFHMIN-NEXT: vmv1r.v v8, v9
358+
; ZVFHMIN-NEXT: ret
347359
%va = insertelement <4 x half> poison, half %first, i32 0
348360
%v = call <4 x half> @llvm.experimental.vp.splice.nxv2f16(<4 x half> %va, <4 x half> %vb, i32 0, <4 x i1> %mask, i32 1, i32 %evl)
349361
ret <4 x half> %v
350362
}
363+
364+
define <8 x bfloat> @test_vp_splice_v8bf16(<8 x bfloat> %va, <8 x bfloat> %vb, i32 zeroext %evla, i32 zeroext %evlb) {
365+
; CHECK-LABEL: test_vp_splice_v8bf16:
366+
; CHECK: # %bb.0:
367+
; CHECK-NEXT: addi a0, a0, -5
368+
; CHECK-NEXT: vsetvli zero, a0, e16, m1, ta, ma
369+
; CHECK-NEXT: vslidedown.vi v8, v8, 5
370+
; CHECK-NEXT: vsetvli zero, a1, e16, m1, ta, ma
371+
; CHECK-NEXT: vslideup.vx v8, v9, a0
372+
; CHECK-NEXT: ret
373+
374+
%v = call <8 x bfloat> @llvm.experimental.vp.splice.v8bf16(<8 x bfloat> %va, <8 x bfloat> %vb, i32 5, <8 x i1> splat (i1 1), i32 %evla, i32 %evlb)
375+
ret <8 x bfloat> %v
376+
}
377+
378+
define <8 x bfloat> @test_vp_splice_v8bf16_negative_offset(<8 x bfloat> %va, <8 x bfloat> %vb, i32 zeroext %evla, i32 zeroext %evlb) {
379+
; CHECK-LABEL: test_vp_splice_v8bf16_negative_offset:
380+
; CHECK: # %bb.0:
381+
; CHECK-NEXT: addi a0, a0, -5
382+
; CHECK-NEXT: vsetivli zero, 5, e16, m1, ta, ma
383+
; CHECK-NEXT: vslidedown.vx v8, v8, a0
384+
; CHECK-NEXT: vsetvli zero, a1, e16, m1, ta, ma
385+
; CHECK-NEXT: vslideup.vi v8, v9, 5
386+
; CHECK-NEXT: ret
387+
388+
%v = call <8 x bfloat> @llvm.experimental.vp.splice.v8bf16(<8 x bfloat> %va, <8 x bfloat> %vb, i32 -5, <8 x i1> splat (i1 1), i32 %evla, i32 %evlb)
389+
ret <8 x bfloat> %v
390+
}
391+
392+
define <8 x bfloat> @test_vp_splice_v8bf16_masked(<8 x bfloat> %va, <8 x bfloat> %vb, <8 x i1> %mask, i32 zeroext %evla, i32 zeroext %evlb) {
393+
; CHECK-LABEL: test_vp_splice_v8bf16_masked:
394+
; CHECK: # %bb.0:
395+
; CHECK-NEXT: addi a0, a0, -5
396+
; CHECK-NEXT: vsetvli zero, a0, e16, m1, ta, ma
397+
; CHECK-NEXT: vslidedown.vi v8, v8, 5, v0.t
398+
; CHECK-NEXT: vsetvli zero, a1, e16, m1, ta, mu
399+
; CHECK-NEXT: vslideup.vx v8, v9, a0, v0.t
400+
; CHECK-NEXT: ret
401+
%v = call <8 x bfloat> @llvm.experimental.vp.splice.v8bf16(<8 x bfloat> %va, <8 x bfloat> %vb, i32 5, <8 x i1> %mask, i32 %evla, i32 %evlb)
402+
ret <8 x bfloat> %v
403+
}

0 commit comments

Comments
 (0)