src - FreeBSD source tree

diff options


context:
space:
mode:

author	Dimitry Andric <dim@FreeBSD.org>	2017-04-16 16:01:22 +0000
committer	Dimitry Andric <dim@FreeBSD.org>	2017-04-16 16:01:22 +0000
commit	71d5a2540a98c81f5bcaeb48805e0e2881f530ef (patch)
tree	5343938942df402b49ec7300a1c25a2d4ccd5821 /test/CodeGen/AMDGPU/coalescer-subrange-crash.ll
parent	31bbf64f3a4974a2d6c8b3b27ad2f519caf74057 (diff)
download	src-71d5a2540a98c81f5bcaeb48805e0e2881f530ef.tar.gz src-71d5a2540a98c81f5bcaeb48805e0e2881f530ef.zip

Vendor import of llvm trunk r300422 (tag vendor/llvm/llvm-trunk-r300422):

https://llvm.org/svn/llvm-project/llvm/trunk@300422

Notes

Notes: svn path=/vendor/llvm/dist/; revision=317017
Notes: svn path=/vendor/llvm/llvm-trunk-r300422/; revision=317018; tag=vendor/llvm/llvm-trunk-r300422

Diffstat (limited to 'test/CodeGen/AMDGPU/coalescer-subrange-crash.ll')

-rw-r--r--

test/CodeGen/AMDGPU/coalescer-subrange-crash.ll

1 file changed, 18 insertions, 14 deletions

diff --git a/test/CodeGen/AMDGPU/coalescer-subrange-crash.ll b/test/CodeGen/AMDGPU/coalescer-subrange-crash.ll
index 7ff133b86e72..ef1b3d25f883 100644
--- a/test/CodeGen/AMDGPU/coalescer-subrange-crash.ll
+++ b/test/CodeGen/AMDGPU/coalescer-subrange-crash.ll

@@ -1,5 +1,4 @@

-; RUN: llc -march=amdgcn < %s | FileCheck %s

-; REQUIRES: asserts

+; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck %s

;

; This testcase used to cause the following crash:

;

@@ -18,14 +17,16 @@

;

; Test for a valid output:

; CHECK: image_sample_c_d_o

-target triple = "amdgcn--"

define amdgpu_ps <{ i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, float, float, float, float, float, float, float, float, float, float, float, float, float, float }> @main([17 x <16 x i8>] addrspace(2)* byval dereferenceable(18446744073709551615) %arg, [16 x <16 x i8>] addrspace(2)* byval dereferenceable(18446744073709551615) %arg1, [32 x <8 x i32>] addrspace(2)* byval dereferenceable(18446744073709551615) %arg2, [16 x <8 x i32>] addrspace(2)* byval dereferenceable(18446744073709551615) %arg3, [16 x <4 x i32>] addrspace(2)* byval dereferenceable(18446744073709551615) %arg4, float inreg %arg5, i32 inreg %arg6, <2 x i32> %arg7, <2 x i32> %arg8, <2 x i32> %arg9, <3 x i32> %arg10, <2 x i32> %arg11, <2 x i32> %arg12, <2 x i32> %arg13, float %arg14, float %arg15, float %arg16, float %arg17, float %arg18, i32 %arg19, i32 %arg20, float %arg21, i32 %arg22) #0 {

main_body:

- %tmp = call float @llvm.SI.fs.interp(i32 3, i32 0, i32 %arg6, <2 x i32> %arg8)

- %tmp23 = fadd float %tmp, 0xBFA99999A0000000

- %tmp24 = fadd float %tmp, 0x3FA99999A0000000

+ %i.i = extractelement <2 x i32> %arg8, i32 0

+ %j.i = extractelement <2 x i32> %arg8, i32 1

+ %i.f.i = bitcast i32 %i.i to float

+ %j.f.i = bitcast i32 %j.i to float

+ %p1.i = call float @llvm.amdgcn.interp.p1(float %i.f.i, i32 3, i32 0, i32 %arg6) #1

+ %p2.i = call float @llvm.amdgcn.interp.p2(float %p1.i, float %j.f.i, i32 3, i32 0, i32 %arg6) #1

+ %tmp23 = fadd float %p2.i, 0xBFA99999A0000000

+ %tmp24 = fadd float %p2.i, 0x3FA99999A0000000

%tmp25 = bitcast float %tmp23 to i32

%tmp26 = insertelement <16 x i32> <i32 212739, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>, i32 %tmp25, i32 1

%tmp27 = insertelement <16 x i32> %tmp26, i32 undef, i32 2

@@ -35,7 +36,8 @@ main_body:

%tmp31 = insertelement <16 x i32> %tmp30, i32 undef, i32 6

%tmp32 = insertelement <16 x i32> %tmp31, i32 undef, i32 7

%tmp33 = insertelement <16 x i32> %tmp32, i32 undef, i32 8

- %tmp34 = call <4 x float> @llvm.SI.image.sample.c.d.o.v16i32(<16 x i32> %tmp33, <8 x i32> undef, <4 x i32> undef, i32 15, i32 0, i32 0, i32 1, i32 0, i32 0, i32 0, i32 0)

+ %tmp33.bc = bitcast <16 x i32> %tmp33 to <16 x float>

+ %tmp34 = call <4 x float> @llvm.amdgcn.image.sample.c.d.o.v4f32.v16f32.v8i32(<16 x float> %tmp33.bc, <8 x i32> undef, <4 x i32> undef, i32 15, i1 false, i1 false, i1 false, i1 false, i1 true)

%tmp35 = extractelement <4 x float> %tmp34, i32 0

%tmp36 = bitcast float %tmp24 to i32

%tmp37 = insertelement <16 x i32> <i32 212739, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>, i32 %tmp36, i32 1

@@ -46,7 +48,8 @@ main_body:

%tmp42 = insertelement <16 x i32> %tmp41, i32 undef, i32 6

%tmp43 = insertelement <16 x i32> %tmp42, i32 undef, i32 7

%tmp44 = insertelement <16 x i32> %tmp43, i32 undef, i32 8

- %tmp45 = call <4 x float> @llvm.SI.image.sample.c.d.o.v16i32(<16 x i32> %tmp44, <8 x i32> undef, <4 x i32> undef, i32 15, i32 0, i32 0, i32 1, i32 0, i32 0, i32 0, i32 0)

+ %tmp44.bc = bitcast <16 x i32> %tmp44 to <16 x float>

+ %tmp45 = call <4 x float> @llvm.amdgcn.image.sample.c.d.o.v4f32.v16f32.v8i32(<16 x float> %tmp44.bc, <8 x i32> undef, <4 x i32> undef, i32 15, i1 false, i1 false, i1 false, i1 false, i1 true)

%tmp46 = extractelement <4 x float> %tmp45, i32 0

%tmp47 = fmul float %tmp35, %tmp46

%tmp48 = insertvalue <{ i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, float, float, float, float, float, float, float, float, float, float, float, float, float, float }> undef, float %tmp47, 14

@@ -54,9 +57,10 @@ main_body:

ret <{ i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, float, float, float, float, float, float, float, float, float, float, float, float, float, float }> %tmp49

}

-declare float @llvm.SI.fs.interp(i32, i32, i32, <2 x i32>) #1

-declare float @llvm.SI.load.const(<16 x i8>, i32) #1

-declare <4 x float> @llvm.SI.image.sample.c.d.o.v16i32(<16 x i32>, <8 x i32>, <4 x i32>, i32, i32, i32, i32, i32, i32, i32, i32) #1

+declare float @llvm.amdgcn.interp.p1(float, i32, i32, i32) #1

+declare float @llvm.amdgcn.interp.p2(float, float, i32, i32, i32) #1

+declare <4 x float> @llvm.amdgcn.image.sample.c.d.o.v4f32.v16f32.v8i32(<16 x float>, <8 x i32>, <4 x i32>, i32, i1, i1, i1, i1, i1) #2

-attributes #0 = { "InitialPSInputAddr"="36983" "target-cpu"="tonga" }

+attributes #0 = { nounwind }

attributes #1 = { nounwind readnone }

+attributes #2 = { nounwind readonly }