Teach valuetracking that byval arguments with a specified alignment are

aligned. Teach memcpyopt to not give up all hope when confronted with an underaligned memcpy feeding an overaligned byval. If the *source* of the memcpy can be determined to be adequately aligned, or if it can be forced to be, we can eliminate the memcpy. This addresses PR9794. We now compile the example into: define i32 @f(%struct.p* nocapture byval align 8 %q) nounwind ssp { entry: %call = call i32 @g(%struct.p* byval align 8 %q) nounwind ret i32 %call } in both x86-64 and x86-32 mode. We still don't get a tailcall though, because tailcalls apparently can't handle byval. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@131884 91177308-0d34-0410-b5e6-96231b3b80d8
author: Chris Lattner <sabre@nondot.org> 2011-05-23 00:03:39 +0000
committer: Chris Lattner <sabre@nondot.org> 2011-05-23 00:03:39 +0000
commit: b3f0673d52b72f34434dec13c4e2044c82012ef6 (patch)
tree: e2c468a159ebf2b8586cef5e319a9fce91c05068 /lib/Transforms/Scalar
parent: ae441cc33cee83a598f74e3d0447fe02157b0389 (diff)
download: llvm-b3f0673d52b72f34434dec13c4e2044c82012ef6.tar.gz
llvm-b3f0673d52b72f34434dec13c4e2044c82012ef6.tar.bz2
llvm-b3f0673d52b72f34434dec13c4e2044c82012ef6.tar.xz
1 files changed, 10 insertions, 5 deletions
diff --git a/lib/Transforms/Scalar/MemCpyOptimizer.cpp b/lib/Transforms/Scalar/MemCpyOptimizer.cpp
index 04edfd43a2..360639ec95 100644
--- a/lib/Transforms/Scalar/MemCpyOptimizer.cpp
+++ b/lib/Transforms/Scalar/MemCpyOptimizer.cpp
@@ -23,6 +23,7 @@
 #include "llvm/Analysis/AliasAnalysis.h"
 #include "llvm/Analysis/MemoryDependenceAnalysis.h"
 #include "llvm/Analysis/ValueTracking.h"
+#include "llvm/Transforms/Utils/Local.h"
 #include "llvm/Support/Debug.h"
 #include "llvm/Support/GetElementPtrTypeIterator.h"
 #include "llvm/Support/IRBuilder.h"
@@ -866,12 +867,16 @@ bool MemCpyOpt::processByValArgument(CallSite CS, unsigned ArgNo) {
   if (C1 == 0 || C1->getValue().getZExtValue() < ByValSize)
     return false;
 
-  // Get the alignment of the byval.  If it is greater than the memcpy, then we
-  // can't do the substitution.  If the call doesn't specify the alignment, then
-  // it is some target specific value that we can't know.
+  // Get the alignment of the byval.  If the call doesn't specify the alignment,
+  // then it is some target specific value that we can't know.
   unsigned ByValAlign = CS.getParamAlignment(ArgNo+1);
-  if (ByValAlign == 0 || MDep->getAlignment() < ByValAlign)
-    return false;  
+  if (ByValAlign == 0) return false;
+  
+  // If it is greater than the memcpy, then we check to see if we can force the
+  // source of the memcpy to the alignment we need.  If we fail, we bail out.
+  if (MDep->getAlignment() < ByValAlign &&
+      getOrEnforceKnownAlignment(MDep->getSource(),ByValAlign, TD) < ByValAlign)
+    return false;
   
   // Verify that the copied-from memory doesn't change in between the memcpy and
   // the byval call.
author	Chris Lattner <sabre@nondot.org>	2011-05-23 00:03:39 +0000
committer	Chris Lattner <sabre@nondot.org>	2011-05-23 00:03:39 +0000
commit	b3f0673d52b72f34434dec13c4e2044c82012ef6 (patch)
tree	e2c468a159ebf2b8586cef5e319a9fce91c05068 /lib/Transforms/Scalar
parent	ae441cc33cee83a598f74e3d0447fe02157b0389 (diff)
download	llvm-b3f0673d52b72f34434dec13c4e2044c82012ef6.tar.gz llvm-b3f0673d52b72f34434dec13c4e2044c82012ef6.tar.bz2 llvm-b3f0673d52b72f34434dec13c4e2044c82012ef6.tar.xz