| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py |
| ; RUN: opt -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -S -passes=infer-address-spaces --verify-each %s | FileCheck %s |
| |
| ; Inst can use a value multiple time. When we're inserting an addrspacecast to flat, |
| ; it's important all the identical uses use an indentical replacement, especially |
| ; for PHIs. |
| |
| define amdgpu_kernel void @test_phi() { |
| ; CHECK-LABEL: @test_phi( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[LOADED_PTR:%.*]] = load ptr, ptr addrspace(4) null, align 8 |
| ; CHECK-NEXT: [[TMP0:%.*]] = addrspacecast ptr [[LOADED_PTR]] to ptr addrspace(1) |
| ; CHECK-NEXT: br label [[BB0:%.*]] |
| ; CHECK: bb0: |
| ; CHECK-NEXT: [[GEP:%.*]] = getelementptr i64, ptr addrspace(1) [[TMP0]], i64 3 |
| ; CHECK-NEXT: [[TMP1:%.*]] = addrspacecast ptr addrspace(1) [[GEP]] to ptr |
| ; CHECK-NEXT: switch i32 0, label [[END:%.*]] [ |
| ; CHECK-NEXT: i32 1, label [[END]] |
| ; CHECK-NEXT: i32 4, label [[END]] |
| ; CHECK-NEXT: i32 5, label [[BB1:%.*]] |
| ; CHECK-NEXT: ] |
| ; CHECK: bb1: |
| ; CHECK-NEXT: [[TMP2:%.*]] = load double, ptr addrspace(1) [[GEP]], align 16 |
| ; CHECK-NEXT: br label [[END]] |
| ; CHECK: end: |
| ; CHECK-NEXT: [[RETVAL_SROA_0_0_I569_PH:%.*]] = phi ptr [ null, [[BB1]] ], [ [[TMP1]], [[BB0]] ], [ [[TMP1]], [[BB0]] ], [ [[TMP1]], [[BB0]] ] |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| %loaded.ptr = load ptr, ptr addrspace(4) null, align 8 |
| br label %bb0 |
| |
| bb0: |
| %gep = getelementptr i64, ptr %loaded.ptr, i64 3 |
| switch i32 0, label %end [ |
| i32 1, label %end |
| i32 4, label %end |
| i32 5, label %bb1 |
| ] |
| |
| bb1: |
| %0 = load double, ptr %gep, align 16 |
| br label %end |
| |
| end: |
| %retval.sroa.0.0.i569.ph = phi ptr [ null, %bb1 ], [ %gep, %bb0 ], [ %gep, %bb0 ], [ %gep, %bb0 ] |
| ret void |
| } |
| |
| declare void @uses_ptrs(ptr, ptr, ptr) |
| |
| ; We shouldn't treat PHIs differently, even other users should have the same treatment. |
| ; All occurences of %gep are replaced with an identical value. |
| define amdgpu_kernel void @test_other() { |
| ; CHECK-LABEL: @test_other( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[LOADED_PTR:%.*]] = load ptr, ptr addrspace(4) null, align 8 |
| ; CHECK-NEXT: [[TMP0:%.*]] = addrspacecast ptr [[LOADED_PTR]] to ptr addrspace(1) |
| ; CHECK-NEXT: [[TMP1:%.*]] = addrspacecast ptr addrspace(1) [[TMP0]] to ptr |
| ; CHECK-NEXT: [[GEP:%.*]] = getelementptr i64, ptr [[TMP1]], i64 3 |
| ; CHECK-NEXT: call void @uses_ptrs(ptr [[GEP]], ptr [[GEP]], ptr [[GEP]]) |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| %loaded.ptr = load ptr, ptr addrspace(4) null, align 8 |
| %gep = getelementptr i64, ptr %loaded.ptr, i64 3 |
| call void @uses_ptrs(ptr %gep, ptr %gep, ptr %gep) |
| ret void |
| } |