43 lines
1.0 KiB
LLVM
43 lines
1.0 KiB
LLVM
; RUN: opt -S -codegenprepare < %s | FileCheck %s
|
|
|
|
target datalayout = "e-i64:64-v16:16-v32:32-n16:32:64"
|
|
target triple = "nvptx64-nvidia-cuda"
|
|
|
|
|
|
; ptrtoint/inttoptr combinations can introduce semantically-meaningful address space casts
|
|
; which we can't sink into an addrspacecast
|
|
|
|
; CHECK-LABEL: @test
|
|
define void @test(ptr %input_ptr) {
|
|
; CHECK-LABEL: l1:
|
|
; CHECK-NOT: addrspacecast
|
|
%intptr = ptrtoint ptr %input_ptr to i64
|
|
%ptr = inttoptr i64 %intptr to ptr addrspace(3)
|
|
|
|
br label %l1
|
|
l1:
|
|
|
|
store atomic i32 1, ptr addrspace(3) %ptr unordered, align 4
|
|
ret void
|
|
}
|
|
|
|
|
|
; we still should be able to look through multiple sequences of inttoptr/ptrtoint
|
|
|
|
; CHECK-LABEL: @test2
|
|
define void @test2(ptr %input_ptr) {
|
|
; CHECK-LABEL: l2:
|
|
; CHECK-NEXT: store
|
|
%intptr = ptrtoint ptr %input_ptr to i64
|
|
%ptr = inttoptr i64 %intptr to ptr addrspace(3)
|
|
|
|
%intptr2 = ptrtoint ptr addrspace(3) %ptr to i64
|
|
%ptr2 = inttoptr i64 %intptr2 to ptr
|
|
|
|
br label %l2
|
|
l2:
|
|
|
|
store atomic i32 1, ptr %ptr2 unordered, align 4
|
|
ret void
|
|
}
|