@@ -7646,9 +7646,9 @@ define amdgpu_kernel void @local_ds_fadd(ptr addrspace(1) %out, ptr addrspace(3)
7646
7646
; GFX7-NEXT: s_or_b64 s[8:9], s[0:1], s[8:9]
7647
7647
; GFX7-NEXT: s_andn2_b64 exec, exec, s[8:9]
7648
7648
; GFX7-NEXT: s_cbranch_execnz .LBB28_2
7649
- ; GFX7-NEXT: ; %bb.3: ; %Flow23
7649
+ ; GFX7-NEXT: ; %bb.3: ; %Flow22
7650
7650
; GFX7-NEXT: s_or_b64 exec, exec, s[8:9]
7651
- ; GFX7-NEXT: .LBB28_4: ; %Flow24
7651
+ ; GFX7-NEXT: .LBB28_4: ; %Flow23
7652
7652
; GFX7-NEXT: s_or_b64 exec, exec, s[6:7]
7653
7653
; GFX7-NEXT: s_mov_b64 s[8:9], exec
7654
7654
; GFX7-NEXT: v_readfirstlane_b32 s10, v1
@@ -7676,7 +7676,7 @@ define amdgpu_kernel void @local_ds_fadd(ptr addrspace(1) %out, ptr addrspace(3)
7676
7676
; GFX7-NEXT: v_mov_b32_e32 v3, v4
7677
7677
; GFX7-NEXT: s_andn2_b64 exec, exec, s[8:9]
7678
7678
; GFX7-NEXT: s_cbranch_execnz .LBB28_6
7679
- ; GFX7-NEXT: .LBB28_7: ; %Flow22
7679
+ ; GFX7-NEXT: .LBB28_7: ; %Flow21
7680
7680
; GFX7-NEXT: s_or_b64 exec, exec, s[6:7]
7681
7681
; GFX7-NEXT: v_cvt_f32_ubyte0_e32 v0, v0
7682
7682
; GFX7-NEXT: v_mul_f32_e32 v0, 0x42280000, v0
@@ -7725,7 +7725,7 @@ define amdgpu_kernel void @local_ds_fadd(ptr addrspace(1) %out, ptr addrspace(3)
7725
7725
; GFX7-NEXT: s_cbranch_execnz .LBB28_11
7726
7726
; GFX7-NEXT: ; %bb.12: ; %Flow
7727
7727
; GFX7-NEXT: s_or_b64 exec, exec, s[2:3]
7728
- ; GFX7-NEXT: .LBB28_13: ; %Flow20
7728
+ ; GFX7-NEXT: .LBB28_13: ; %Flow19
7729
7729
; GFX7-NEXT: s_or_b64 exec, exec, s[6:7]
7730
7730
; GFX7-NEXT: s_load_dwordx2 s[0:1], s[4:5], 0x0
7731
7731
; GFX7-NEXT: v_readfirstlane_b32 s4, v2
@@ -7770,9 +7770,9 @@ define amdgpu_kernel void @local_ds_fadd(ptr addrspace(1) %out, ptr addrspace(3)
7770
7770
; GFX6-NEXT: s_or_b64 s[8:9], s[0:1], s[8:9]
7771
7771
; GFX6-NEXT: s_andn2_b64 exec, exec, s[8:9]
7772
7772
; GFX6-NEXT: s_cbranch_execnz .LBB28_2
7773
- ; GFX6-NEXT: ; %bb.3: ; %Flow21
7773
+ ; GFX6-NEXT: ; %bb.3: ; %Flow20
7774
7774
; GFX6-NEXT: s_or_b64 exec, exec, s[8:9]
7775
- ; GFX6-NEXT: .LBB28_4: ; %Flow22
7775
+ ; GFX6-NEXT: .LBB28_4: ; %Flow21
7776
7776
; GFX6-NEXT: s_or_b64 exec, exec, s[6:7]
7777
7777
; GFX6-NEXT: s_mov_b64 s[8:9], exec
7778
7778
; GFX6-NEXT: v_readfirstlane_b32 s10, v1
@@ -7800,7 +7800,7 @@ define amdgpu_kernel void @local_ds_fadd(ptr addrspace(1) %out, ptr addrspace(3)
7800
7800
; GFX6-NEXT: v_mov_b32_e32 v3, v4
7801
7801
; GFX6-NEXT: s_andn2_b64 exec, exec, s[8:9]
7802
7802
; GFX6-NEXT: s_cbranch_execnz .LBB28_6
7803
- ; GFX6-NEXT: .LBB28_7: ; %Flow20
7803
+ ; GFX6-NEXT: .LBB28_7: ; %Flow19
7804
7804
; GFX6-NEXT: s_or_b64 exec, exec, s[6:7]
7805
7805
; GFX6-NEXT: v_cvt_f32_ubyte0_e32 v0, v0
7806
7806
; GFX6-NEXT: v_mul_f32_e32 v0, 0x42280000, v0
@@ -7849,7 +7849,7 @@ define amdgpu_kernel void @local_ds_fadd(ptr addrspace(1) %out, ptr addrspace(3)
7849
7849
; GFX6-NEXT: s_cbranch_execnz .LBB28_11
7850
7850
; GFX6-NEXT: ; %bb.12: ; %Flow
7851
7851
; GFX6-NEXT: s_or_b64 exec, exec, s[2:3]
7852
- ; GFX6-NEXT: .LBB28_13: ; %Flow18
7852
+ ; GFX6-NEXT: .LBB28_13: ; %Flow17
7853
7853
; GFX6-NEXT: s_or_b64 exec, exec, s[6:7]
7854
7854
; GFX6-NEXT: s_load_dwordx2 s[0:1], s[4:5], 0x0
7855
7855
; GFX6-NEXT: v_readfirstlane_b32 s4, v2
@@ -8483,9 +8483,9 @@ define amdgpu_kernel void @local_ds_fadd_one_as(ptr addrspace(1) %out, ptr addrs
8483
8483
; GFX7-NEXT: s_or_b64 s[8:9], s[0:1], s[8:9]
8484
8484
; GFX7-NEXT: s_andn2_b64 exec, exec, s[8:9]
8485
8485
; GFX7-NEXT: s_cbranch_execnz .LBB29_2
8486
- ; GFX7-NEXT: ; %bb.3: ; %Flow23
8486
+ ; GFX7-NEXT: ; %bb.3: ; %Flow22
8487
8487
; GFX7-NEXT: s_or_b64 exec, exec, s[8:9]
8488
- ; GFX7-NEXT: .LBB29_4: ; %Flow24
8488
+ ; GFX7-NEXT: .LBB29_4: ; %Flow23
8489
8489
; GFX7-NEXT: s_or_b64 exec, exec, s[6:7]
8490
8490
; GFX7-NEXT: s_mov_b64 s[8:9], exec
8491
8491
; GFX7-NEXT: v_readfirstlane_b32 s10, v1
@@ -8513,7 +8513,7 @@ define amdgpu_kernel void @local_ds_fadd_one_as(ptr addrspace(1) %out, ptr addrs
8513
8513
; GFX7-NEXT: v_mov_b32_e32 v3, v4
8514
8514
; GFX7-NEXT: s_andn2_b64 exec, exec, s[8:9]
8515
8515
; GFX7-NEXT: s_cbranch_execnz .LBB29_6
8516
- ; GFX7-NEXT: .LBB29_7: ; %Flow22
8516
+ ; GFX7-NEXT: .LBB29_7: ; %Flow21
8517
8517
; GFX7-NEXT: s_or_b64 exec, exec, s[6:7]
8518
8518
; GFX7-NEXT: v_cvt_f32_ubyte0_e32 v0, v0
8519
8519
; GFX7-NEXT: v_mul_f32_e32 v0, 0x42280000, v0
@@ -8562,7 +8562,7 @@ define amdgpu_kernel void @local_ds_fadd_one_as(ptr addrspace(1) %out, ptr addrs
8562
8562
; GFX7-NEXT: s_cbranch_execnz .LBB29_11
8563
8563
; GFX7-NEXT: ; %bb.12: ; %Flow
8564
8564
; GFX7-NEXT: s_or_b64 exec, exec, s[2:3]
8565
- ; GFX7-NEXT: .LBB29_13: ; %Flow20
8565
+ ; GFX7-NEXT: .LBB29_13: ; %Flow19
8566
8566
; GFX7-NEXT: s_or_b64 exec, exec, s[6:7]
8567
8567
; GFX7-NEXT: s_load_dwordx2 s[0:1], s[4:5], 0x0
8568
8568
; GFX7-NEXT: v_readfirstlane_b32 s4, v2
@@ -8607,9 +8607,9 @@ define amdgpu_kernel void @local_ds_fadd_one_as(ptr addrspace(1) %out, ptr addrs
8607
8607
; GFX6-NEXT: s_or_b64 s[8:9], s[0:1], s[8:9]
8608
8608
; GFX6-NEXT: s_andn2_b64 exec, exec, s[8:9]
8609
8609
; GFX6-NEXT: s_cbranch_execnz .LBB29_2
8610
- ; GFX6-NEXT: ; %bb.3: ; %Flow21
8610
+ ; GFX6-NEXT: ; %bb.3: ; %Flow20
8611
8611
; GFX6-NEXT: s_or_b64 exec, exec, s[8:9]
8612
- ; GFX6-NEXT: .LBB29_4: ; %Flow22
8612
+ ; GFX6-NEXT: .LBB29_4: ; %Flow21
8613
8613
; GFX6-NEXT: s_or_b64 exec, exec, s[6:7]
8614
8614
; GFX6-NEXT: s_mov_b64 s[8:9], exec
8615
8615
; GFX6-NEXT: v_readfirstlane_b32 s10, v1
@@ -8637,7 +8637,7 @@ define amdgpu_kernel void @local_ds_fadd_one_as(ptr addrspace(1) %out, ptr addrs
8637
8637
; GFX6-NEXT: v_mov_b32_e32 v3, v4
8638
8638
; GFX6-NEXT: s_andn2_b64 exec, exec, s[8:9]
8639
8639
; GFX6-NEXT: s_cbranch_execnz .LBB29_6
8640
- ; GFX6-NEXT: .LBB29_7: ; %Flow20
8640
+ ; GFX6-NEXT: .LBB29_7: ; %Flow19
8641
8641
; GFX6-NEXT: s_or_b64 exec, exec, s[6:7]
8642
8642
; GFX6-NEXT: v_cvt_f32_ubyte0_e32 v0, v0
8643
8643
; GFX6-NEXT: v_mul_f32_e32 v0, 0x42280000, v0
@@ -8686,7 +8686,7 @@ define amdgpu_kernel void @local_ds_fadd_one_as(ptr addrspace(1) %out, ptr addrs
8686
8686
; GFX6-NEXT: s_cbranch_execnz .LBB29_11
8687
8687
; GFX6-NEXT: ; %bb.12: ; %Flow
8688
8688
; GFX6-NEXT: s_or_b64 exec, exec, s[2:3]
8689
- ; GFX6-NEXT: .LBB29_13: ; %Flow18
8689
+ ; GFX6-NEXT: .LBB29_13: ; %Flow17
8690
8690
; GFX6-NEXT: s_or_b64 exec, exec, s[6:7]
8691
8691
; GFX6-NEXT: s_load_dwordx2 s[0:1], s[4:5], 0x0
8692
8692
; GFX6-NEXT: v_readfirstlane_b32 s4, v2
0 commit comments