@@ -23,19 +23,19 @@ define half @reduce_fadd_half(<8 x half> %in) {
23
23
; CHECK-EMPTY:
24
24
; CHECK-NEXT: // %bb.0:
25
25
; CHECK-NEXT: ld.param.v4.u32 {%r1, %r2, %r3, %r4}, [reduce_fadd_half_param_0];
26
- ; CHECK-NEXT: mov.b32 {%rs1, %rs2}, %r4 ;
27
- ; CHECK-NEXT: mov.b32 { %rs3, %rs4}, %r3 ;
28
- ; CHECK-NEXT: mov.b32 {%rs5 , %rs6} , %r2 ;
29
- ; CHECK-NEXT: mov.b32 {%rs7 , %rs8} , %r1 ;
30
- ; CHECK-NEXT: mov.b16 %rs9, 0x0000 ;
31
- ; CHECK-NEXT: add.rn.f16 %rs10 , %rs7 , %rs9 ;
32
- ; CHECK-NEXT: add.rn.f16 %rs11 , %rs10 , %rs8 ;
33
- ; CHECK-NEXT: add.rn.f16 %rs12 , %rs11, %rs5 ;
34
- ; CHECK-NEXT: add.rn.f16 %rs13 , %rs12 , %rs6 ;
35
- ; CHECK-NEXT: add.rn.f16 %rs14 , %rs13 , %rs3 ;
36
- ; CHECK-NEXT: add.rn.f16 %rs15 , %rs14 , %rs4 ;
37
- ; CHECK-NEXT: add.rn.f16 %rs16, %rs15 , %rs1 ;
38
- ; CHECK-NEXT: add.rn.f16 %rs17, %rs16, %rs2 ;
26
+ ; CHECK-NEXT: mov.b32 {%rs1, %rs2}, %r1 ;
27
+ ; CHECK-NEXT: mov.b16 %rs3, 0x0000 ;
28
+ ; CHECK-NEXT: add.rn.f16 %rs4 , %rs1 , %rs3 ;
29
+ ; CHECK-NEXT: add.rn.f16 %rs5 , %rs4 , %rs2 ;
30
+ ; CHECK-NEXT: mov.b32 {%rs6, %rs7}, %r2 ;
31
+ ; CHECK-NEXT: add.rn.f16 %rs8 , %rs5 , %rs6 ;
32
+ ; CHECK-NEXT: add.rn.f16 %rs9 , %rs8 , %rs7 ;
33
+ ; CHECK-NEXT: mov.b32 {%rs10 , %rs11} , %r3 ;
34
+ ; CHECK-NEXT: add.rn.f16 %rs12 , %rs9 , %rs10 ;
35
+ ; CHECK-NEXT: add.rn.f16 %rs13 , %rs12 , %rs11 ;
36
+ ; CHECK-NEXT: mov.b32 {%rs14 , %rs15} , %r4 ;
37
+ ; CHECK-NEXT: add.rn.f16 %rs16, %rs13 , %rs14 ;
38
+ ; CHECK-NEXT: add.rn.f16 %rs17, %rs16, %rs15 ;
39
39
; CHECK-NEXT: st.param.b16 [func_retval0], %rs17;
40
40
; CHECK-NEXT: ret;
41
41
%res = call half @llvm.vector.reduce.fadd (half 0 .0 , <8 x half > %in )
@@ -174,17 +174,17 @@ define half @reduce_fmul_half(<8 x half> %in) {
174
174
; CHECK-EMPTY:
175
175
; CHECK-NEXT: // %bb.0:
176
176
; CHECK-NEXT: ld.param.v4.u32 {%r1, %r2, %r3, %r4}, [reduce_fmul_half_param_0];
177
- ; CHECK-NEXT: mov.b32 {%rs1, %rs2}, %r4 ;
178
- ; CHECK-NEXT: mov.b32 {%rs3, %rs4}, %r3 ;
179
- ; CHECK-NEXT: mov.b32 { %rs5, %rs6} , %r2 ;
180
- ; CHECK-NEXT: mov.b32 {%rs7 , %rs8} , %r1 ;
181
- ; CHECK-NEXT: mul.rn.f16 %rs9 , %rs7 , %rs8 ;
182
- ; CHECK-NEXT: mul.rn.f16 %rs10 , %rs9, %rs5 ;
183
- ; CHECK-NEXT: mul.rn.f16 %rs11 , %rs10 , %rs6 ;
184
- ; CHECK-NEXT: mul.rn.f16 %rs12 , %rs11 , %rs3 ;
185
- ; CHECK-NEXT: mul.rn.f16 %rs13 , %rs12 , %rs4 ;
186
- ; CHECK-NEXT: mul.rn.f16 %rs14, %rs13 , %rs1 ;
187
- ; CHECK-NEXT: mul.rn.f16 %rs15, %rs14, %rs2 ;
177
+ ; CHECK-NEXT: mov.b32 {%rs1, %rs2}, %r2 ;
178
+ ; CHECK-NEXT: mov.b32 {%rs3, %rs4}, %r1 ;
179
+ ; CHECK-NEXT: mul.rn.f16 %rs5, %rs3 , %rs4 ;
180
+ ; CHECK-NEXT: mul.rn.f16 %rs6 , %rs5 , %rs1 ;
181
+ ; CHECK-NEXT: mul.rn.f16 %rs7 , %rs6 , %rs2 ;
182
+ ; CHECK-NEXT: mov.b32 {%rs8 , %rs9} , %r3 ;
183
+ ; CHECK-NEXT: mul.rn.f16 %rs10 , %rs7 , %rs8 ;
184
+ ; CHECK-NEXT: mul.rn.f16 %rs11 , %rs10 , %rs9 ;
185
+ ; CHECK-NEXT: mov.b32 {%rs12 , %rs13} , %r4 ;
186
+ ; CHECK-NEXT: mul.rn.f16 %rs14, %rs11 , %rs12 ;
187
+ ; CHECK-NEXT: mul.rn.f16 %rs15, %rs14, %rs13 ;
188
188
; CHECK-NEXT: st.param.b16 [func_retval0], %rs15;
189
189
; CHECK-NEXT: ret;
190
190
%res = call half @llvm.vector.reduce.fmul (half 1 .0 , <8 x half > %in )
0 commit comments