forked from llvm-mirror/llvm
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
------------------------------------------------------------------------ r259558 | Matthew.Arsenault | 2016-02-02 12:28:10 -0800 (Tue, 02 Feb 2016) | 4 lines AMDGPU: Handle promoting memmove Also add missing tests for the others. ------------------------------------------------------------------------ git-svn-id: https://llvm.org/svn/llvm-project/llvm/branches/release_38@271593 91177308-0d34-0410-b5e6-96231b3b80d8
- Loading branch information
1 parent
c7c7ff0
commit 5a2d99b
Showing
2 changed files
with
89 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,65 @@ | ||
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -amdgpu-promote-alloca < %s | FileCheck %s | ||
|
||
; llvm.memcpy declarations used by @promote_with_memcpy, one per copy direction: | ||
; addrspace(1) source into a default-address-space destination, and the reverse. | ||
declare void @llvm.memcpy.p0i8.p1i8.i32(i8* nocapture, i8 addrspace(1)* nocapture, i32, i32, i1) #0 | ||
declare void @llvm.memcpy.p1i8.p0i8.i32(i8 addrspace(1)* nocapture, i8* nocapture, i32, i32, i1) #0 | ||
|
||
; llvm.memmove declarations used by @promote_with_memmove, mirroring the two | ||
; memcpy address-space combinations declared above. | ||
declare void @llvm.memmove.p0i8.p1i8.i32(i8* nocapture, i8 addrspace(1)* nocapture, i32, i32, i1) #0 | ||
declare void @llvm.memmove.p1i8.p0i8.i32(i8 addrspace(1)* nocapture, i8* nocapture, i32, i32, i1) #0 | ||
|
||
; llvm.memset declaration (default-address-space destination) used by | ||
; @promote_with_memset. | ||
declare void @llvm.memset.p0i8.i32(i8* nocapture, i8, i32, i32, i1) #0 | ||
|
||
; llvm.objectsize declaration used by @promote_with_objectsize; it is the only | ||
; declaration in this file that uses attribute group #1. | ||
declare i32 @llvm.objectsize.i32.p0i8(i8*, i1) #1 | ||
|
||
; Test: a [17 x i32] alloca (17 * 4 = 68 bytes) is filled from %in and then | ||
; copied out to %out by two 68-byte llvm.memcpy calls made through an i8* | ||
; bitcast of the alloca. | ||
; The FileCheck directives below expect a getelementptr into a | ||
; [256 x [17 x i32]] addrspace(3) global named @alloca, and both memcpy calls | ||
; rewritten so that the alloca-side pointer is an addrspace(3) pointer. | ||
; CHECK-LABEL: @promote_with_memcpy( | ||
; CHECK: getelementptr [256 x [17 x i32]], [256 x [17 x i32]] addrspace(3)* @alloca, i32 0, i32 %{{[0-9]+}} | ||
; CHECK: call void @llvm.memcpy.p3i8.p1i8.i32(i8 addrspace(3)* %alloca.bc, i8 addrspace(1)* %in.bc, i32 68, i32 4, i1 false) | ||
; CHECK: call void @llvm.memcpy.p1i8.p3i8.i32(i8 addrspace(1)* %out.bc, i8 addrspace(3)* %alloca.bc, i32 68, i32 4, i1 false) | ||
define void @promote_with_memcpy(i32 addrspace(1)* %out, i32 addrspace(1)* %in) #0 { | ||
%alloca = alloca [17 x i32], align 16 | ||
%alloca.bc = bitcast [17 x i32]* %alloca to i8* | ||
%in.bc = bitcast i32 addrspace(1)* %in to i8 addrspace(1)* | ||
%out.bc = bitcast i32 addrspace(1)* %out to i8 addrspace(1)* | ||
call void @llvm.memcpy.p0i8.p1i8.i32(i8* %alloca.bc, i8 addrspace(1)* %in.bc, i32 68, i32 4, i1 false) | ||
call void @llvm.memcpy.p1i8.p0i8.i32(i8 addrspace(1)* %out.bc, i8* %alloca.bc, i32 68, i32 4, i1 false) | ||
ret void | ||
} | ||
|
||
; Test: same shape as @promote_with_memcpy, but the two 68-byte transfers | ||
; between the [17 x i32] alloca and the addrspace(1) arguments use llvm.memmove. | ||
; The FileCheck directives below expect a getelementptr into the addrspace(3) | ||
; global @alloca.1 and both memmove calls rewritten so that the alloca-side | ||
; pointer is an addrspace(3) pointer. | ||
; CHECK-LABEL: @promote_with_memmove( | ||
; CHECK: getelementptr [256 x [17 x i32]], [256 x [17 x i32]] addrspace(3)* @alloca.1, i32 0, i32 %{{[0-9]+}} | ||
; CHECK: call void @llvm.memmove.p3i8.p1i8.i32(i8 addrspace(3)* %alloca.bc, i8 addrspace(1)* %in.bc, i32 68, i32 4, i1 false) | ||
; CHECK: call void @llvm.memmove.p1i8.p3i8.i32(i8 addrspace(1)* %out.bc, i8 addrspace(3)* %alloca.bc, i32 68, i32 4, i1 false) | ||
define void @promote_with_memmove(i32 addrspace(1)* %out, i32 addrspace(1)* %in) #0 { | ||
%alloca = alloca [17 x i32], align 16 | ||
%alloca.bc = bitcast [17 x i32]* %alloca to i8* | ||
%in.bc = bitcast i32 addrspace(1)* %in to i8 addrspace(1)* | ||
%out.bc = bitcast i32 addrspace(1)* %out to i8 addrspace(1)* | ||
call void @llvm.memmove.p0i8.p1i8.i32(i8* %alloca.bc, i8 addrspace(1)* %in.bc, i32 68, i32 4, i1 false) | ||
call void @llvm.memmove.p1i8.p0i8.i32(i8 addrspace(1)* %out.bc, i8* %alloca.bc, i32 68, i32 4, i1 false) | ||
ret void | ||
} | ||
|
||
; Test: a [17 x i32] alloca is filled with the byte value 7 over 68 bytes by a | ||
; single llvm.memset call made through an i8* bitcast. | ||
; The FileCheck directives below expect a getelementptr into the addrspace(3) | ||
; global @alloca.2 and the memset rewritten to take an addrspace(3) pointer. | ||
; NOTE(review): %in.bc and %out.bc are defined but not used by any instruction | ||
; in this function; they look like leftovers from the memcpy/memmove tests. | ||
; CHECK-LABEL: @promote_with_memset( | ||
; CHECK: getelementptr [256 x [17 x i32]], [256 x [17 x i32]] addrspace(3)* @alloca.2, i32 0, i32 %{{[0-9]+}} | ||
; CHECK: call void @llvm.memset.p3i8.i32(i8 addrspace(3)* %alloca.bc, i8 7, i32 68, i32 4, i1 false) | ||
define void @promote_with_memset(i32 addrspace(1)* %out, i32 addrspace(1)* %in) #0 { | ||
%alloca = alloca [17 x i32], align 16 | ||
%alloca.bc = bitcast [17 x i32]* %alloca to i8* | ||
%in.bc = bitcast i32 addrspace(1)* %in to i8 addrspace(1)* | ||
%out.bc = bitcast i32 addrspace(1)* %out to i8 addrspace(1)* | ||
call void @llvm.memset.p0i8.i32(i8* %alloca.bc, i8 7, i32 68, i32 4, i1 false) | ||
ret void | ||
} | ||
|
||
; Test: llvm.objectsize is called on an i8* bitcast of a [17 x i32] alloca and | ||
; its i32 result is stored to %out. | ||
; The FileCheck directives below expect a getelementptr into the addrspace(3) | ||
; global @alloca.3 and the objectsize call rewritten to the p3i8 variant. | ||
; NOTE(review): the PTR variable captured by the first directive is not | ||
; referenced by any later directive in this file. | ||
; CHECK-LABEL: @promote_with_objectsize( | ||
; CHECK: [[PTR:%[0-9]+]] = getelementptr [256 x [17 x i32]], [256 x [17 x i32]] addrspace(3)* @alloca.3, i32 0, i32 %{{[0-9]+}} | ||
; CHECK: call i32 @llvm.objectsize.i32.p3i8(i8 addrspace(3)* %alloca.bc, i1 false) | ||
define void @promote_with_objectsize(i32 addrspace(1)* %out) #0 { | ||
%alloca = alloca [17 x i32], align 16 | ||
%alloca.bc = bitcast [17 x i32]* %alloca to i8* | ||
%size = call i32 @llvm.objectsize.i32.p0i8(i8* %alloca.bc, i1 false) | ||
store i32 %size, i32 addrspace(1)* %out | ||
ret void | ||
} | ||
|
||
; Attribute groups: #0 is attached to the memcpy/memmove/memset declarations | ||
; and to all four test functions; #1 is attached to the llvm.objectsize | ||
; declaration only. | ||
attributes #0 = { nounwind } | ||
attributes #1 = { nounwind readnone } |