@@ -28,7 +28,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_bf16_dst_sel_1(ptr addrspace(1)
28
28
; GFX950: ; %bb.0:
29
29
; GFX950-NEXT: global_load_dword v5, v[0:1], off
30
30
; GFX950-NEXT: s_waitcnt vmcnt(0)
31
- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_bf16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
31
+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_bf16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
32
32
; GFX950-NEXT: global_store_dword v[0:1], v5, off
33
33
; GFX950-NEXT: s_endpgm
34
34
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -42,7 +42,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_bf16_dst_sel_2(ptr addrspace(1)
42
42
; GFX950: ; %bb.0:
43
43
; GFX950-NEXT: global_load_dword v5, v[0:1], off
44
44
; GFX950-NEXT: s_waitcnt vmcnt(0)
45
- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_bf16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
45
+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_bf16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
46
46
; GFX950-NEXT: global_store_dword v[0:1], v5, off
47
47
; GFX950-NEXT: s_endpgm
48
48
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -84,7 +84,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_f16_dst_sel_1(ptr addrspace(1) %
84
84
; GFX950: ; %bb.0:
85
85
; GFX950-NEXT: global_load_dword v5, v[0:1], off
86
86
; GFX950-NEXT: s_waitcnt vmcnt(0)
87
- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
87
+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
88
88
; GFX950-NEXT: global_store_dword v[0:1], v5, off
89
89
; GFX950-NEXT: s_endpgm
90
90
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -98,7 +98,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_f16_dst_sel_2(ptr addrspace(1) %
98
98
; GFX950: ; %bb.0:
99
99
; GFX950-NEXT: global_load_dword v5, v[0:1], off
100
100
; GFX950-NEXT: s_waitcnt vmcnt(0)
101
- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
101
+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
102
102
; GFX950-NEXT: global_store_dword v[0:1], v5, off
103
103
; GFX950-NEXT: s_endpgm
104
104
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -140,7 +140,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_f32_dst_sel_1(ptr addrspace(1) %
140
140
; GFX950: ; %bb.0:
141
141
; GFX950-NEXT: global_load_dword v5, v[0:1], off
142
142
; GFX950-NEXT: s_waitcnt vmcnt(0)
143
- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f32 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
143
+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f32 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
144
144
; GFX950-NEXT: global_store_dword v[0:1], v5, off
145
145
; GFX950-NEXT: s_endpgm
146
146
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -154,7 +154,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_f32_dst_sel_2(ptr addrspace(1) %
154
154
; GFX950: ; %bb.0:
155
155
; GFX950-NEXT: global_load_dword v5, v[0:1], off
156
156
; GFX950-NEXT: s_waitcnt vmcnt(0)
157
- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f32 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
157
+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f32 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
158
158
; GFX950-NEXT: global_store_dword v[0:1], v5, off
159
159
; GFX950-NEXT: s_endpgm
160
160
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -196,7 +196,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_bf16_dst_sel_1(ptr addrspace(1)
196
196
; GFX950: ; %bb.0:
197
197
; GFX950-NEXT: global_load_dword v5, v[0:1], off
198
198
; GFX950-NEXT: s_waitcnt vmcnt(0)
199
- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_bf16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
199
+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_bf16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
200
200
; GFX950-NEXT: global_store_dword v[0:1], v5, off
201
201
; GFX950-NEXT: s_endpgm
202
202
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -210,7 +210,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_bf16_dst_sel_2(ptr addrspace(1)
210
210
; GFX950: ; %bb.0:
211
211
; GFX950-NEXT: global_load_dword v5, v[0:1], off
212
212
; GFX950-NEXT: s_waitcnt vmcnt(0)
213
- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_bf16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
213
+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_bf16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
214
214
; GFX950-NEXT: global_store_dword v[0:1], v5, off
215
215
; GFX950-NEXT: s_endpgm
216
216
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -252,7 +252,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_f16_dst_sel_1(ptr addrspace(1) %
252
252
; GFX950: ; %bb.0:
253
253
; GFX950-NEXT: global_load_dword v5, v[0:1], off
254
254
; GFX950-NEXT: s_waitcnt vmcnt(0)
255
- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
255
+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
256
256
; GFX950-NEXT: global_store_dword v[0:1], v5, off
257
257
; GFX950-NEXT: s_endpgm
258
258
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -266,7 +266,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_f16_dst_sel_2(ptr addrspace(1) %
266
266
; GFX950: ; %bb.0:
267
267
; GFX950-NEXT: global_load_dword v5, v[0:1], off
268
268
; GFX950-NEXT: s_waitcnt vmcnt(0)
269
- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
269
+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
270
270
; GFX950-NEXT: global_store_dword v[0:1], v5, off
271
271
; GFX950-NEXT: s_endpgm
272
272
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -308,7 +308,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_f32_dst_sel_1(ptr addrspace(1) %
308
308
; GFX950: ; %bb.0:
309
309
; GFX950-NEXT: global_load_dword v5, v[0:1], off
310
310
; GFX950-NEXT: s_waitcnt vmcnt(0)
311
- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f32 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
311
+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f32 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
312
312
; GFX950-NEXT: global_store_dword v[0:1], v5, off
313
313
; GFX950-NEXT: s_endpgm
314
314
%old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -322,7 +322,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_f32_dst_sel_2(ptr addrspace(1) %
322
322
; GFX950: ; %bb.0:
323
323
; GFX950-NEXT: global_load_dword v5, v[0:1], off
324
324
; GFX950-NEXT: s_waitcnt vmcnt(0)
325
- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f32 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
325
+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f32 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
326
326
; GFX950-NEXT: global_store_dword v[0:1], v5, off
327
327
; GFX950-NEXT: s_endpgm
328
328
%old = load i32 , ptr addrspace (1 ) %out , align 4
0 commit comments