@@ -4913,12 +4913,10 @@ define inreg <20 x i32> @bitcast_v40i16_to_v20i32_scalar(<40 x i16> inreg %a, i3
4913
4913
; GFX11-TRUE16-LABEL: bitcast_v40i16_to_v20i32_scalar:
4914
4914
; GFX11-TRUE16: ; %bb.0:
4915
4915
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
4916
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.h, 0
4917
4916
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
4918
4917
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.l, v1.h
4919
4918
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.l, v0.h
4920
4919
; GFX11-TRUE16-NEXT: v_and_b32_e32 v35, 0xffff, v0
4921
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.h, v32.h
4922
4920
; GFX11-TRUE16-NEXT: v_and_b32_e32 v34, 0xffff, v1
4923
4921
; GFX11-TRUE16-NEXT: s_lshr_b32 s41, s29, 16
4924
4922
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s28, 16
@@ -8342,12 +8340,10 @@ define inreg <20 x i32> @bitcast_v40f16_to_v20i32_scalar(<40 x half> inreg %a, i
8342
8340
; GFX11-TRUE16-LABEL: bitcast_v40f16_to_v20i32_scalar:
8343
8341
; GFX11-TRUE16: ; %bb.0:
8344
8342
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
8345
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.h, 0
8346
8343
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
8347
8344
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.l, v1.h
8348
8345
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.l, v0.h
8349
8346
; GFX11-TRUE16-NEXT: v_and_b32_e32 v35, 0xffff, v0
8350
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.h, v32.h
8351
8347
; GFX11-TRUE16-NEXT: v_and_b32_e32 v34, 0xffff, v1
8352
8348
; GFX11-TRUE16-NEXT: s_lshr_b32 s41, s29, 16
8353
8349
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s28, 16
@@ -12629,12 +12625,10 @@ define inreg <20 x float> @bitcast_v40i16_to_v20f32_scalar(<40 x i16> inreg %a,
12629
12625
; GFX11-TRUE16-LABEL: bitcast_v40i16_to_v20f32_scalar:
12630
12626
; GFX11-TRUE16: ; %bb.0:
12631
12627
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
12632
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.h, 0
12633
12628
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
12634
12629
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.l, v1.h
12635
12630
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.l, v0.h
12636
12631
; GFX11-TRUE16-NEXT: v_and_b32_e32 v35, 0xffff, v0
12637
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.h, v32.h
12638
12632
; GFX11-TRUE16-NEXT: v_and_b32_e32 v34, 0xffff, v1
12639
12633
; GFX11-TRUE16-NEXT: s_lshr_b32 s41, s29, 16
12640
12634
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s28, 16
@@ -16043,12 +16037,10 @@ define inreg <20 x float> @bitcast_v40f16_to_v20f32_scalar(<40 x half> inreg %a,
16043
16037
; GFX11-TRUE16-LABEL: bitcast_v40f16_to_v20f32_scalar:
16044
16038
; GFX11-TRUE16: ; %bb.0:
16045
16039
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
16046
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.h, 0
16047
16040
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
16048
16041
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.l, v1.h
16049
16042
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.l, v0.h
16050
16043
; GFX11-TRUE16-NEXT: v_and_b32_e32 v35, 0xffff, v0
16051
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.h, v32.h
16052
16044
; GFX11-TRUE16-NEXT: v_and_b32_e32 v34, 0xffff, v1
16053
16045
; GFX11-TRUE16-NEXT: s_lshr_b32 s41, s29, 16
16054
16046
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s28, 16
@@ -19655,12 +19647,10 @@ define inreg <10 x i64> @bitcast_v40i16_to_v10i64_scalar(<40 x i16> inreg %a, i3
19655
19647
; GFX11-TRUE16-LABEL: bitcast_v40i16_to_v10i64_scalar:
19656
19648
; GFX11-TRUE16: ; %bb.0:
19657
19649
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
19658
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.h, 0
19659
19650
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
19660
19651
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.l, v1.h
19661
19652
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.l, v0.h
19662
19653
; GFX11-TRUE16-NEXT: v_and_b32_e32 v35, 0xffff, v0
19663
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.h, v32.h
19664
19654
; GFX11-TRUE16-NEXT: v_and_b32_e32 v34, 0xffff, v1
19665
19655
; GFX11-TRUE16-NEXT: s_lshr_b32 s41, s29, 16
19666
19656
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s28, 16
@@ -23094,12 +23084,10 @@ define inreg <10 x i64> @bitcast_v40f16_to_v10i64_scalar(<40 x half> inreg %a, i
23094
23084
; GFX11-TRUE16-LABEL: bitcast_v40f16_to_v10i64_scalar:
23095
23085
; GFX11-TRUE16: ; %bb.0:
23096
23086
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
23097
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.h, 0
23098
23087
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
23099
23088
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.l, v1.h
23100
23089
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.l, v0.h
23101
23090
; GFX11-TRUE16-NEXT: v_and_b32_e32 v35, 0xffff, v0
23102
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.h, v32.h
23103
23091
; GFX11-TRUE16-NEXT: v_and_b32_e32 v34, 0xffff, v1
23104
23092
; GFX11-TRUE16-NEXT: s_lshr_b32 s41, s29, 16
23105
23093
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s28, 16
@@ -25911,12 +25899,10 @@ define inreg <10 x double> @bitcast_v40i16_to_v10f64_scalar(<40 x i16> inreg %a,
25911
25899
; GFX11-TRUE16-LABEL: bitcast_v40i16_to_v10f64_scalar:
25912
25900
; GFX11-TRUE16: ; %bb.0:
25913
25901
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
25914
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.h, 0
25915
25902
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
25916
25903
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.l, v1.h
25917
25904
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.l, v0.h
25918
25905
; GFX11-TRUE16-NEXT: v_and_b32_e32 v35, 0xffff, v0
25919
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.h, v32.h
25920
25906
; GFX11-TRUE16-NEXT: v_and_b32_e32 v34, 0xffff, v1
25921
25907
; GFX11-TRUE16-NEXT: s_lshr_b32 s41, s29, 16
25922
25908
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s28, 16
@@ -29258,12 +29244,10 @@ define inreg <10 x double> @bitcast_v40f16_to_v10f64_scalar(<40 x half> inreg %a
29258
29244
; GFX11-TRUE16-LABEL: bitcast_v40f16_to_v10f64_scalar:
29259
29245
; GFX11-TRUE16: ; %bb.0:
29260
29246
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
29261
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.h, 0
29262
29247
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
29263
29248
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v32.l, v1.h
29264
29249
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.l, v0.h
29265
29250
; GFX11-TRUE16-NEXT: v_and_b32_e32 v35, 0xffff, v0
29266
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v33.h, v32.h
29267
29251
; GFX11-TRUE16-NEXT: v_and_b32_e32 v34, 0xffff, v1
29268
29252
; GFX11-TRUE16-NEXT: s_lshr_b32 s41, s29, 16
29269
29253
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s28, 16
@@ -31057,12 +31041,10 @@ define inreg <40 x half> @bitcast_v40i16_to_v40f16_scalar(<40 x i16> inreg %a, i
31057
31041
; GFX11-TRUE16-LABEL: bitcast_v40i16_to_v40f16_scalar:
31058
31042
; GFX11-TRUE16: ; %bb.0:
31059
31043
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
31060
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v19.h, 0
31061
31044
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
31062
31045
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v19.l, v1.h
31063
31046
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v18.l, v0.h
31064
31047
; GFX11-TRUE16-NEXT: s_lshr_b32 s45, s29, 16
31065
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v18.h, v19.h
31066
31048
; GFX11-TRUE16-NEXT: s_lshr_b32 s44, s28, 16
31067
31049
; GFX11-TRUE16-NEXT: s_lshr_b32 s43, s27, 16
31068
31050
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s26, 16
@@ -31074,12 +31056,12 @@ define inreg <40 x half> @bitcast_v40i16_to_v40f16_scalar(<40 x i16> inreg %a, i
31074
31056
; GFX11-TRUE16-NEXT: s_lshr_b32 s12, s20, 16
31075
31057
; GFX11-TRUE16-NEXT: s_lshr_b32 s11, s19, 16
31076
31058
; GFX11-TRUE16-NEXT: s_lshr_b32 s10, s18, 16
31077
- ; GFX11-TRUE16-NEXT: s_lshr_b32 s8 , s17, 16
31059
+ ; GFX11-TRUE16-NEXT: s_lshr_b32 s9 , s17, 16
31078
31060
; GFX11-TRUE16-NEXT: s_lshr_b32 s7, s16, 16
31079
31061
; GFX11-TRUE16-NEXT: s_lshr_b32 s6, s3, 16
31080
31062
; GFX11-TRUE16-NEXT: s_lshr_b32 s5, s2, 16
31081
31063
; GFX11-TRUE16-NEXT: s_lshr_b32 s4, s1, 16
31082
- ; GFX11-TRUE16-NEXT: s_lshr_b32 s9 , s0, 16
31064
+ ; GFX11-TRUE16-NEXT: s_lshr_b32 s8 , s0, 16
31083
31065
; GFX11-TRUE16-NEXT: s_mov_b32 s46, 0
31084
31066
; GFX11-TRUE16-NEXT: s_and_b32 s47, vcc_lo, exec_lo
31085
31067
; GFX11-TRUE16-NEXT: s_cbranch_scc0 .LBB57_3
@@ -31103,11 +31085,11 @@ define inreg <40 x half> @bitcast_v40i16_to_v40f16_scalar(<40 x i16> inreg %a, i
31103
31085
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s12, s20, s12
31104
31086
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s11, s19, s11
31105
31087
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s10, s18, s10
31106
- ; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s8 , s17, s8
31088
+ ; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s9 , s17, s9
31107
31089
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s7, s16, s7
31108
31090
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s3, s3, s6
31109
31091
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s2, s2, s5
31110
- ; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s0, s0, s9
31092
+ ; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s0, s0, s8
31111
31093
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s1, s1, s4
31112
31094
; GFX11-TRUE16-NEXT: v_pk_add_u16 v15, s29, 3 op_sel_hi:[1,0]
31113
31095
; GFX11-TRUE16-NEXT: v_pk_add_u16 v16, s28, 3 op_sel_hi:[1,0]
@@ -31123,7 +31105,7 @@ define inreg <40 x half> @bitcast_v40i16_to_v40f16_scalar(<40 x i16> inreg %a, i
31123
31105
; GFX11-TRUE16-NEXT: v_pk_add_u16 v6, s12, 3 op_sel_hi:[1,0]
31124
31106
; GFX11-TRUE16-NEXT: v_pk_add_u16 v7, s11, 3 op_sel_hi:[1,0]
31125
31107
; GFX11-TRUE16-NEXT: v_pk_add_u16 v8, s10, 3 op_sel_hi:[1,0]
31126
- ; GFX11-TRUE16-NEXT: v_pk_add_u16 v9, s8 , 3 op_sel_hi:[1,0]
31108
+ ; GFX11-TRUE16-NEXT: v_pk_add_u16 v9, s9 , 3 op_sel_hi:[1,0]
31127
31109
; GFX11-TRUE16-NEXT: v_pk_add_u16 v21, s0, 3 op_sel_hi:[1,0]
31128
31110
; GFX11-TRUE16-NEXT: v_pk_add_u16 v20, s1, 3 op_sel_hi:[1,0]
31129
31111
; GFX11-TRUE16-NEXT: v_pk_add_u16 v4, s2, 3 op_sel_hi:[1,0]
@@ -31168,9 +31150,9 @@ define inreg <40 x half> @bitcast_v40i16_to_v40f16_scalar(<40 x i16> inreg %a, i
31168
31150
; GFX11-TRUE16-NEXT: v_dual_mov_b32 v28, s15 :: v_dual_mov_b32 v29, s14
31169
31151
; GFX11-TRUE16-NEXT: v_dual_mov_b32 v30, s13 :: v_dual_mov_b32 v31, s12
31170
31152
; GFX11-TRUE16-NEXT: v_dual_mov_b32 v32, s11 :: v_dual_mov_b32 v33, s10
31171
- ; GFX11-TRUE16-NEXT: v_dual_mov_b32 v34, s8 :: v_dual_mov_b32 v35, s7
31153
+ ; GFX11-TRUE16-NEXT: v_dual_mov_b32 v34, s9 :: v_dual_mov_b32 v35, s7
31172
31154
; GFX11-TRUE16-NEXT: v_dual_mov_b32 v36, s6 :: v_dual_mov_b32 v37, s5
31173
- ; GFX11-TRUE16-NEXT: v_dual_mov_b32 v38, s4 :: v_dual_mov_b32 v39, s9
31155
+ ; GFX11-TRUE16-NEXT: v_dual_mov_b32 v38, s4 :: v_dual_mov_b32 v39, s8
31174
31156
; GFX11-TRUE16-NEXT: .LBB57_5: ; %end
31175
31157
; GFX11-TRUE16-NEXT: v_and_b32_e32 v4, 0xffff, v4
31176
31158
; GFX11-TRUE16-NEXT: v_and_b32_e32 v49, 0xffff, v2
@@ -32879,12 +32861,10 @@ define inreg <40 x i16> @bitcast_v40f16_to_v40i16_scalar(<40 x half> inreg %a, i
32879
32861
; GFX11-TRUE16-LABEL: bitcast_v40f16_to_v40i16_scalar:
32880
32862
; GFX11-TRUE16: ; %bb.0:
32881
32863
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
32882
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v19.h, 0
32883
32864
; GFX11-TRUE16-NEXT: v_cmp_ne_u32_e32 vcc_lo, 0, v2
32884
32865
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v19.l, v1.h
32885
32866
; GFX11-TRUE16-NEXT: v_mov_b16_e32 v18.l, v0.h
32886
32867
; GFX11-TRUE16-NEXT: s_lshr_b32 s45, s29, 16
32887
- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v18.h, v19.h
32888
32868
; GFX11-TRUE16-NEXT: s_lshr_b32 s44, s28, 16
32889
32869
; GFX11-TRUE16-NEXT: s_lshr_b32 s43, s27, 16
32890
32870
; GFX11-TRUE16-NEXT: s_lshr_b32 s42, s26, 16
@@ -32896,12 +32876,12 @@ define inreg <40 x i16> @bitcast_v40f16_to_v40i16_scalar(<40 x half> inreg %a, i
32896
32876
; GFX11-TRUE16-NEXT: s_lshr_b32 s12, s20, 16
32897
32877
; GFX11-TRUE16-NEXT: s_lshr_b32 s11, s19, 16
32898
32878
; GFX11-TRUE16-NEXT: s_lshr_b32 s10, s18, 16
32899
- ; GFX11-TRUE16-NEXT: s_lshr_b32 s8 , s17, 16
32879
+ ; GFX11-TRUE16-NEXT: s_lshr_b32 s9 , s17, 16
32900
32880
; GFX11-TRUE16-NEXT: s_lshr_b32 s7, s16, 16
32901
32881
; GFX11-TRUE16-NEXT: s_lshr_b32 s6, s3, 16
32902
32882
; GFX11-TRUE16-NEXT: s_lshr_b32 s5, s2, 16
32903
32883
; GFX11-TRUE16-NEXT: s_lshr_b32 s4, s1, 16
32904
- ; GFX11-TRUE16-NEXT: s_lshr_b32 s9 , s0, 16
32884
+ ; GFX11-TRUE16-NEXT: s_lshr_b32 s8 , s0, 16
32905
32885
; GFX11-TRUE16-NEXT: s_mov_b32 s46, 0
32906
32886
; GFX11-TRUE16-NEXT: s_and_b32 s47, vcc_lo, exec_lo
32907
32887
; GFX11-TRUE16-NEXT: s_cbranch_scc0 .LBB59_3
@@ -32925,11 +32905,11 @@ define inreg <40 x i16> @bitcast_v40f16_to_v40i16_scalar(<40 x half> inreg %a, i
32925
32905
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s12, s20, s12
32926
32906
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s11, s19, s11
32927
32907
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s10, s18, s10
32928
- ; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s8 , s17, s8
32908
+ ; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s9 , s17, s9
32929
32909
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s7, s16, s7
32930
32910
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s3, s3, s6
32931
32911
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s2, s2, s5
32932
- ; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s0, s0, s9
32912
+ ; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s0, s0, s8
32933
32913
; GFX11-TRUE16-NEXT: s_pack_ll_b32_b16 s1, s1, s4
32934
32914
; GFX11-TRUE16-NEXT: v_pk_add_f16 v15, 0x200, s29 op_sel_hi:[0,1]
32935
32915
; GFX11-TRUE16-NEXT: v_pk_add_f16 v16, 0x200, s28 op_sel_hi:[0,1]
@@ -32945,7 +32925,7 @@ define inreg <40 x i16> @bitcast_v40f16_to_v40i16_scalar(<40 x half> inreg %a, i
32945
32925
; GFX11-TRUE16-NEXT: v_pk_add_f16 v6, 0x200, s12 op_sel_hi:[0,1]
32946
32926
; GFX11-TRUE16-NEXT: v_pk_add_f16 v7, 0x200, s11 op_sel_hi:[0,1]
32947
32927
; GFX11-TRUE16-NEXT: v_pk_add_f16 v8, 0x200, s10 op_sel_hi:[0,1]
32948
- ; GFX11-TRUE16-NEXT: v_pk_add_f16 v9, 0x200, s8 op_sel_hi:[0,1]
32928
+ ; GFX11-TRUE16-NEXT: v_pk_add_f16 v9, 0x200, s9 op_sel_hi:[0,1]
32949
32929
; GFX11-TRUE16-NEXT: v_pk_add_f16 v21, 0x200, s0 op_sel_hi:[0,1]
32950
32930
; GFX11-TRUE16-NEXT: v_pk_add_f16 v20, 0x200, s1 op_sel_hi:[0,1]
32951
32931
; GFX11-TRUE16-NEXT: v_pk_add_f16 v4, 0x200, s2 op_sel_hi:[0,1]
@@ -32990,9 +32970,9 @@ define inreg <40 x i16> @bitcast_v40f16_to_v40i16_scalar(<40 x half> inreg %a, i
32990
32970
; GFX11-TRUE16-NEXT: v_dual_mov_b32 v28, s15 :: v_dual_mov_b32 v29, s14
32991
32971
; GFX11-TRUE16-NEXT: v_dual_mov_b32 v30, s13 :: v_dual_mov_b32 v31, s12
32992
32972
; GFX11-TRUE16-NEXT: v_dual_mov_b32 v32, s11 :: v_dual_mov_b32 v33, s10
32993
- ; GFX11-TRUE16-NEXT: v_dual_mov_b32 v34, s8 :: v_dual_mov_b32 v35, s7
32973
+ ; GFX11-TRUE16-NEXT: v_dual_mov_b32 v34, s9 :: v_dual_mov_b32 v35, s7
32994
32974
; GFX11-TRUE16-NEXT: v_dual_mov_b32 v36, s6 :: v_dual_mov_b32 v37, s5
32995
- ; GFX11-TRUE16-NEXT: v_dual_mov_b32 v38, s4 :: v_dual_mov_b32 v39, s9
32975
+ ; GFX11-TRUE16-NEXT: v_dual_mov_b32 v38, s4 :: v_dual_mov_b32 v39, s8
32996
32976
; GFX11-TRUE16-NEXT: .LBB59_5: ; %end
32997
32977
; GFX11-TRUE16-NEXT: v_and_b32_e32 v4, 0xffff, v4
32998
32978
; GFX11-TRUE16-NEXT: v_and_b32_e32 v49, 0xffff, v2
0 commit comments