Strength reduction improvements.

- Avoid attempting stride-reuse in the case that there are users that aren't addresses. In that case, there will be places where the multiplications won't be folded away, so it's better to try to strength-reduce them. - Several SSE intrinsics have operands that strength-reduction can treat as addresses. The previous item makes this more visible, as any non-address use of an IV can inhibit stride-reuse. - Make ValidStride aware of whether there's likely to be a base register in the address computation. This prevents it from thinking that things like stride 9 are valid on x86 when the base register is already occupied. Also, XFAIL the 2007-08-10-LEA16Use32.ll test; the new logic to avoid stride-reuse eliminates the LEA in the loop, so the test is no longer testing what it was intended to test. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@43231 91177308-0d34-0410-b5e6-96231b3b80d8
author: Dan Gohman <gohman@apple.com> 2007-10-22 20:40:42 +0000
committer: Dan Gohman <gohman@apple.com> 2007-10-22 20:40:42 +0000
commit: 02e4fa7d5fb4edd2ce9c7ede29c74d50cb126d7d (patch)
tree: dd1a099ed5fe939eef704a76816872cdf6323a71 /test/CodeGen/X86/stride-nine-with-base-reg.ll
parent: 8368805e255d53a68f89e341b69ed0f7022509c4 (diff)
download: llvm-02e4fa7d5fb4edd2ce9c7ede29c74d50cb126d7d.tar.gz
llvm-02e4fa7d5fb4edd2ce9c7ede29c74d50cb126d7d.tar.bz2
llvm-02e4fa7d5fb4edd2ce9c7ede29c74d50cb126d7d.tar.xz
1 files changed, 34 insertions, 0 deletions
diff --git a/test/CodeGen/X86/stride-nine-with-base-reg.ll b/test/CodeGen/X86/stride-nine-with-base-reg.ll
new file mode 100644
index 0000000000..f443c76015
--- /dev/null
+++ b/test/CodeGen/X86/stride-nine-with-base-reg.ll
@@ -0,0 +1,34 @@
+; RUN: llvm-as < %s | llc -march=x86 | grep lea | count 1
+; RUN: llvm-as < %s | llc -march=x86-64 | not grep lea
+
+; For x86 there's an lea above the loop. In both cases, there shouldn't
+; be any lea instructions inside the loop.
+
+@B = external global [1000 x i8], align 32
+@A = external global [1000 x i8], align 32
+@P = external global [1000 x i8], align 32
+
+define void @foo(i32 %m, i32 %p) {  ; %m: loop bound; %p: value added to the @P index
+entry:
+	%tmp1 = icmp sgt i32 %m, 0  ; signed test: enter the loop only when %m > 0
+	br i1 %tmp1, label %bb, label %return
+
+bb:  ; loop body; branches back to itself until %indvar.next == %m
+	%i.019.0 = phi i32 [ %indvar.next, %bb ], [ 0, %entry ]  ; induction variable i: 0 on entry, i+1 on the back edge
+	%tmp2 = getelementptr [1000 x i8]* @B, i32 0, i32 %i.019.0  ; address of B[i]
+	%tmp3 = load i8* %tmp2, align 4
+	%tmp4 = mul i8 %tmp3, 2  ; B[i] * 2
+	%tmp5 = getelementptr [1000 x i8]* @A, i32 0, i32 %i.019.0  ; address of A[i]
+	store i8 %tmp4, i8* %tmp5, align 4  ; A[i] = B[i] * 2
+	%tmp8 = mul i32 %i.019.0, 9  ; i * 9: the stride-nine use of the induction variable
+        %tmp0 = add i32 %tmp8, %p  ; i * 9 + %p
+	%tmp10 = getelementptr [1000 x i8]* @P, i32 0, i32 %tmp0  ; address of P[i * 9 + %p]
+	store i8 17, i8* %tmp10, align 4  ; P[i * 9 + %p] = 17
+	%indvar.next = add i32 %i.019.0, 1  ; i + 1
+	%exitcond = icmp eq i32 %indvar.next, %m  ; leave the loop once i + 1 equals %m
+	br i1 %exitcond, label %return, label %bb
+
+return:  ; reached from %entry when %m <= 0, or from %bb when the loop finishes
+	ret void
+}
+
author	Dan Gohman <gohman@apple.com>	2007-10-22 20:40:42 +0000
committer	Dan Gohman <gohman@apple.com>	2007-10-22 20:40:42 +0000
commit	02e4fa7d5fb4edd2ce9c7ede29c74d50cb126d7d (patch)
tree	dd1a099ed5fe939eef704a76816872cdf6323a71 /test/CodeGen/X86/stride-nine-with-base-reg.ll
parent	8368805e255d53a68f89e341b69ed0f7022509c4 (diff)
download	llvm-02e4fa7d5fb4edd2ce9c7ede29c74d50cb126d7d.tar.gz llvm-02e4fa7d5fb4edd2ce9c7ede29c74d50cb126d7d.tar.bz2 llvm-02e4fa7d5fb4edd2ce9c7ede29c74d50cb126d7d.tar.xz