forked from llvm-mirror/llvm
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
This patch improves the performance of vector creation in caseiswhere where several of the lanes in the vector are a constant floating point value. It also includes new patterns to fold together some of the instructions when the value is 0.0f. Test cases included. rdar://16349427 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@206496 91177308-0d34-0410-b5e6-96231b3b80d8
Showing
3 changed files
with
38 additions
and
2 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,33 @@ | ||
; RUN: llc -march=arm64 -mcpu=generic < %s | FileCheck %s | ||
|
||
define void @test0f(float* nocapture %x, float %a) #0 { | ||
entry: | ||
%0 = insertelement <4 x float> <float undef, float 0.000000e+00, float 0.000000e+00, float 0.000000e+00>, float %a, i32 0 | ||
%1 = bitcast float* %x to <4 x float>* | ||
store <4 x float> %0, <4 x float>* %1, align 16 | ||
ret void | ||
|
||
; CHECK-LABEL: test0f | ||
; CHECK: movi.2d v[[TEMP:[0-9]+]], #0000000000000000 | ||
; CHECK: ins.s v[[TEMP]][0], v{{[0-9]+}}[0] | ||
; CHECK: str q[[TEMP]], [x0] | ||
; CHECK: ret | ||
|
||
|
||
} | ||
|
||
|
||
define void @test1f(float* nocapture %x, float %a) #0 { | ||
entry: | ||
%0 = insertelement <4 x float> <float undef, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00>, float %a, i32 0 | ||
%1 = bitcast float* %x to <4 x float>* | ||
store <4 x float> %0, <4 x float>* %1, align 16 | ||
ret void | ||
|
||
; CHECK-LABEL: test1f | ||
; CHECK: fmov s[[TEMP:[0-9]+]], #1.000000e+00 | ||
; CHECK: dup.4s v[[TEMP2:[0-9]+]], v[[TEMP]][0] | ||
; CHECK: ins.s v[[TEMP2]][0], v0[0] | ||
; CHECK: str q[[TEMP2]], [x0] | ||
; CHECK: ret | ||
} |