Skip to content

Commit 482bcd2

Browse files
committed
[AMDGPU] WMMA convergent flag fix
Fixed test
1 parent 45b5989 commit 482bcd2

File tree

1 file changed

+9
-45
lines changed

1 file changed

+9
-45
lines changed

llvm/test/CodeGen/AMDGPU/wmma-gfx12-convergent.mir

Lines changed: 9 additions & 45 deletions
Original file line numberDiff line numberDiff line change
@@ -1,30 +1,13 @@
11
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 6
22
# RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx12-generic -run-pass=machine-sink %s -o - | FileCheck %s
33

4-
--- |
5-
; ModuleID = 'test-wmma-convergent'
6-
target triple = "amdgcn-amd-amdhsa"
7-
8-
define void @wmma_test() {
9-
entry:
10-
br label %if.then
11-
12-
if.then:
13-
br label %if.end
14-
15-
if.end:
16-
ret void
17-
}
18-
19-
...
204
---
215
name: wmma_test
22-
alignment: 1
236
tracksRegLiveness: true
247
body: |
258
; CHECK-LABEL: name: wmma_test
26-
; CHECK: bb.0.entry:
27-
; CHECK-NEXT: successors: %bb.1(0x40000000), %bb.2(0x40000000)
9+
; CHECK: bb.0:
10+
; CHECK-NEXT: successors: %bb.2(0x40000000), %bb.1(0x40000000)
2811
; CHECK-NEXT: {{ $}}
2912
; CHECK-NEXT: [[DEF:%[0-9]+]]:vreg_128 = IMPLICIT_DEF
3013
; CHECK-NEXT: [[DEF1:%[0-9]+]]:vreg_128 = IMPLICIT_DEF
@@ -33,45 +16,26 @@ body: |
3316
; CHECK-NEXT: [[SI_IF:%[0-9]+]]:sreg_32 = SI_IF [[DEF2]], %bb.2, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
3417
; CHECK-NEXT: S_BRANCH %bb.1
3518
; CHECK-NEXT: {{ $}}
36-
; CHECK-NEXT: bb.1.if.then:
19+
; CHECK-NEXT: bb.1:
3720
; CHECK-NEXT: successors: %bb.2(0x80000000)
3821
; CHECK-NEXT: {{ $}}
39-
; CHECK-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY %3.sub1
40-
; CHECK-NEXT: [[COPY1:%[0-9]+]]:vgpr_32 = COPY %3.sub3
41-
; CHECK-NEXT: [[COPY2:%[0-9]+]]:vgpr_32 = COPY %3.sub5
42-
; CHECK-NEXT: [[COPY3:%[0-9]+]]:vgpr_32 = COPY %3.sub7
43-
; CHECK-NEXT: [[COPY4:%[0-9]+]]:vgpr_32 = COPY %3.sub6
44-
; CHECK-NEXT: [[COPY5:%[0-9]+]]:vgpr_32 = COPY %3.sub4
45-
; CHECK-NEXT: [[COPY6:%[0-9]+]]:vgpr_32 = COPY %3.sub2
46-
; CHECK-NEXT: [[COPY7:%[0-9]+]]:vgpr_32 = COPY %3.sub0
22+
; CHECK-NEXT: [[COPY:%[0-9]+]]:vreg_256 = COPY %3.sub1
4723
; CHECK-NEXT: {{ $}}
48-
; CHECK-NEXT: bb.2.if.end:
24+
; CHECK-NEXT: bb.2:
4925
; CHECK-NEXT: SI_END_CF [[SI_IF]], implicit-def dead $exec, implicit-def dead $scc, implicit $exec
5026
; CHECK-NEXT: S_ENDPGM 0
51-
52-
bb.0.entry:
53-
successors: %bb.1, %bb.2
54-
27+
bb.0:
5528
%0:vreg_128 = IMPLICIT_DEF
5629
%1:vreg_128 = IMPLICIT_DEF
5730
%2:sreg_32 = IMPLICIT_DEF
5831
early-clobber %3:vreg_256 = V_WMMA_F32_16X16X16_F16_w32_threeaddr 8, %0:vreg_128, 8, %1:vreg_128, 8, 0, 0, 0, implicit $exec
5932
%4:sreg_32 = SI_IF %2:sreg_32, %bb.2, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
6033
S_BRANCH %bb.1
6134
62-
bb.1.if.then:
63-
successors: %bb.2
64-
65-
%5:vgpr_32 = COPY %3.sub1:vreg_256
66-
%6:vgpr_32 = COPY %3.sub3:vreg_256
67-
%7:vgpr_32 = COPY %3.sub5:vreg_256
68-
%8:vgpr_32 = COPY %3.sub7:vreg_256
69-
%9:vgpr_32 = COPY %3.sub6:vreg_256
70-
%10:vgpr_32 = COPY %3.sub4:vreg_256
71-
%11:vgpr_32 = COPY %3.sub2:vreg_256
72-
%12:vgpr_32 = COPY %3.sub0:vreg_256
35+
bb.1:
36+
%5:vreg_256 = COPY %3.sub1:vreg_256
7337
74-
bb.2.if.end:
38+
bb.2:
7539
SI_END_CF %4:sreg_32, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
7640
S_ENDPGM 0
7741

0 commit comments

Comments
 (0)