diff options
author | Tim Northover <tnorthover@apple.com> | 2014-02-19 10:37:05 +0000 |
---|---|---|
committer | Tim Northover <tnorthover@apple.com> | 2014-02-19 10:37:05 +0000 |
commit | 45de76ea91e590f63496f49468fa51dcf4b2ba2a (patch) | |
tree | e47d449653fdf6c922a9ac961f57319ff74ef19b /utils | |
parent | 69ca34421886443df2def063e5029439c3abead5 (diff) | |
download | clang-45de76ea91e590f63496f49468fa51dcf4b2ba2a.tar.gz clang-45de76ea91e590f63496f49468fa51dcf4b2ba2a.tar.bz2 clang-45de76ea91e590f63496f49468fa51dcf4b2ba2a.tar.xz |
ARM & AArch64: merge the semantic checking of NEON intrinsics
There are two kinds of automatically generated tests for NEON intrinsics, both
of which can be merged without adversely affecting users.
1. We check that a valid kind of __builtin_neon_XYZ overload is requested (e.g.
we're not asking for a float32x4_t version when it only accepts integers. Since
the __builtin_neon_XYZ intrinsics should only be used in arm_neon.h, relaxing
this test and permitting AArch64 types for AArch32 should not cause a problem.
The extra arm_neon.h definitions should be #ifdefed out anyway.
2. We check that intrinsics which take immediates are actually given
compile-time constants within range. Since all NEON intrinsics should be
backwards compatible, these tests should be identical on AArch64 and AArch32
anyway.
This patch, therefore, merges the separate AArch64 and 32-bit checks.
rdar://problem/16035743
git-svn-id: https://llvm.org/svn/llvm-project/cfe/trunk@201659 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'utils')
-rw-r--r-- | utils/TableGen/NeonEmitter.cpp | 143 |
1 files changed, 50 insertions, 93 deletions
diff --git a/utils/TableGen/NeonEmitter.cpp b/utils/TableGen/NeonEmitter.cpp index db954b2183..5b0084afdb 100644 --- a/utils/TableGen/NeonEmitter.cpp +++ b/utils/TableGen/NeonEmitter.cpp @@ -375,12 +375,8 @@ private: void emitIntrinsic(raw_ostream &OS, Record *R, StringMap<ClassKind> &EmittedMap); void genBuiltinsDef(raw_ostream &OS); - void genOverloadTypeCheckCode(raw_ostream &OS, - StringMap<ClassKind> &A64IntrinsicMap, - bool isA64TypeCheck); - void genIntrinsicRangeCheckCode(raw_ostream &OS, - StringMap<ClassKind> &A64IntrinsicMap, - bool isA64RangeCheck); + void genOverloadTypeCheckCode(raw_ostream &OS); + void genIntrinsicRangeCheckCode(raw_ostream &OS); void genTargetTest(raw_ostream &OS, StringMap<OpKind> &EmittedMap, bool isA64TestGen); }; @@ -2911,17 +2907,12 @@ static unsigned RangeScalarShiftImm(const char mod, StringRef typestr) { /// Generate the ARM and AArch64 intrinsic range checking code for /// shift/lane immediates, checking for unique declarations. void -NeonEmitter::genIntrinsicRangeCheckCode(raw_ostream &OS, - StringMap<ClassKind> &A64IntrinsicMap, - bool isA64RangeCheck) { +NeonEmitter::genIntrinsicRangeCheckCode(raw_ostream &OS) { std::vector<Record *> RV = Records.getAllDerivedDefinitions("Inst"); StringMap<OpKind> EmittedMap; // Generate the intrinsic range checking code for shift/lane immediates. - if (isA64RangeCheck) - OS << "#ifdef GET_NEON_AARCH64_IMMEDIATE_CHECK\n"; - else - OS << "#ifdef GET_NEON_IMMEDIATE_CHECK\n"; + OS << "#ifdef GET_NEON_IMMEDIATE_CHECK\n"; for (unsigned i = 0, e = RV.size(); i != e; ++i) { Record *R = RV[i]; @@ -2956,19 +2947,6 @@ NeonEmitter::genIntrinsicRangeCheckCode(raw_ostream &OS, if (!ProtoHasScalar(Proto)) ck = ClassB; - // Do not include AArch64 range checks if not generating code for AArch64. - bool isA64 = R->getValueAsBit("isA64"); - if (!isA64RangeCheck && isA64) - continue; - - // Include ARM range checks in AArch64 but only if ARM intrinsics are not - // redefined by AArch64 to handle new types. - if (isA64RangeCheck && !isA64 && A64IntrinsicMap.count(Rename)) { - ClassKind &A64CK = A64IntrinsicMap[Rename]; - if (A64CK == ck && ck != ClassNone) - continue; - } - for (unsigned ti = 0, te = TypeVec.size(); ti != te; ++ti) { std::string namestr, shiftstr, rangestr; @@ -3070,16 +3048,22 @@ NeonEmitter::genIntrinsicRangeCheckCode(raw_ostream &OS, /// Generate the ARM and AArch64 overloaded type checking code for /// SemaChecking.cpp, checking for unique builtin declarations. void -NeonEmitter::genOverloadTypeCheckCode(raw_ostream &OS, - StringMap<ClassKind> &A64IntrinsicMap, - bool isA64TypeCheck) { +NeonEmitter::genOverloadTypeCheckCode(raw_ostream &OS) { std::vector<Record *> RV = Records.getAllDerivedDefinitions("Inst"); // Generate the overloaded type checking code for SemaChecking.cpp - if (isA64TypeCheck) - OS << "#ifdef GET_NEON_AARCH64_OVERLOAD_CHECK\n"; - else - OS << "#ifdef GET_NEON_OVERLOAD_CHECK\n"; + OS << "#ifdef GET_NEON_OVERLOAD_CHECK\n"; + + // We record each overload check line before emitting because subsequent Inst + // definitions may extend the number of permitted types (i.e. augment the + // Mask). Use std::map to avoid sorting the table by hash number. + struct OverloadInfo { + uint64_t Mask; + int PtrArgNum; + bool HasConstPtr; + }; + std::map<std::string, OverloadInfo> OverloadMap; + typedef std::map<std::string, OverloadInfo>::iterator OverloadIterator; for (unsigned i = 0, e = RV.size(); i != e; ++i) { Record *R = RV[i]; @@ -3108,21 +3092,6 @@ NeonEmitter::genOverloadTypeCheckCode(raw_ostream &OS, if (R->getSuperClasses().size() < 2) PrintFatalError(R->getLoc(), "Builtin has no class kind"); - // Do not include AArch64 type checks if not generating code for AArch64. - bool isA64 = R->getValueAsBit("isA64"); - if (!isA64TypeCheck && isA64) - continue; - - // Include ARM type check in AArch64 but only if ARM intrinsics - // are not redefined in AArch64 to handle new types, e.g. "vabd" is a SIntr - // redefined in AArch64 to handle an additional 2 x f64 type. - ClassKind ck = ClassMap[R->getSuperClasses()[1]]; - if (isA64TypeCheck && !isA64 && A64IntrinsicMap.count(Rename)) { - ClassKind &A64CK = A64IntrinsicMap[Rename]; - if (A64CK == ck && ck != ClassNone) - continue; - } - int si = -1, qi = -1; uint64_t mask = 0, qmask = 0; for (unsigned ti = 0, te = TypeVec.size(); ti != te; ++ti) { @@ -3170,26 +3139,41 @@ NeonEmitter::genOverloadTypeCheckCode(raw_ostream &OS, } if (mask) { - OS << "case NEON::BI__builtin_neon_"; - OS << MangleName(name, TypeVec[si], ClassB) << ": mask = " - << "0x" << utohexstr(mask) << "ULL"; - if (PtrArgNum >= 0) - OS << "; PtrArgNum = " << PtrArgNum; - if (HasConstPtr) - OS << "; HasConstPtr = true"; - OS << "; break;\n"; + std::pair<OverloadIterator, bool> I = OverloadMap.insert(std::make_pair( + MangleName(name, TypeVec[si], ClassB), OverloadInfo())); + OverloadInfo &Record = I.first->second; + if (!I.second) + assert(Record.PtrArgNum == PtrArgNum && + Record.HasConstPtr == HasConstPtr); + Record.Mask |= mask; + Record.PtrArgNum = PtrArgNum; + Record.HasConstPtr = HasConstPtr; } if (qmask) { - OS << "case NEON::BI__builtin_neon_"; - OS << MangleName(name, TypeVec[qi], ClassB) << ": mask = " - << "0x" << utohexstr(qmask) << "ULL"; - if (PtrArgNum >= 0) - OS << "; PtrArgNum = " << PtrArgNum; - if (HasConstPtr) - OS << "; HasConstPtr = true"; - OS << "; break;\n"; + std::pair<OverloadIterator, bool> I = OverloadMap.insert(std::make_pair( + MangleName(name, TypeVec[qi], ClassB), OverloadInfo())); + OverloadInfo &Record = I.first->second; + if (!I.second) + assert(Record.PtrArgNum == PtrArgNum && + Record.HasConstPtr == HasConstPtr); + Record.Mask |= qmask; + Record.PtrArgNum = PtrArgNum; + Record.HasConstPtr = HasConstPtr; } } + + for (OverloadIterator I = OverloadMap.begin(), E = OverloadMap.end(); I != E; + ++I) { + OverloadInfo &BuiltinOverloads = I->second; + OS << "case NEON::BI__builtin_neon_" << I->first << ": "; + OS << "mask = " << "0x" << utohexstr(BuiltinOverloads.Mask) << "ULL"; + if (BuiltinOverloads.PtrArgNum >= 0) + OS << "; PtrArgNum = " << BuiltinOverloads.PtrArgNum; + if (BuiltinOverloads.HasConstPtr) + OS << "; HasConstPtr = true"; + OS << "; break;\n"; + } + OS << "#endif\n\n"; } @@ -3248,41 +3232,14 @@ void NeonEmitter::genBuiltinsDef(raw_ostream &OS) { void NeonEmitter::runHeader(raw_ostream &OS) { std::vector<Record *> RV = Records.getAllDerivedDefinitions("Inst"); - // build a map of AArch64 intriniscs to be used in uniqueness checks. - StringMap<ClassKind> A64IntrinsicMap; - for (unsigned i = 0, e = RV.size(); i != e; ++i) { - Record *R = RV[i]; - - bool isA64 = R->getValueAsBit("isA64"); - if (!isA64) - continue; - - ClassKind CK = ClassNone; - if (R->getSuperClasses().size() >= 2) - CK = ClassMap[R->getSuperClasses()[1]]; - - std::string Name = R->getValueAsString("Name"); - std::string Proto = R->getValueAsString("Prototype"); - std::string Rename = Name + "@" + Proto; - if (A64IntrinsicMap.count(Rename)) - continue; - A64IntrinsicMap[Rename] = CK; - } - // Generate shared BuiltinsXXX.def genBuiltinsDef(OS); // Generate ARM overloaded type checking code for SemaChecking.cpp - genOverloadTypeCheckCode(OS, A64IntrinsicMap, false); - - // Generate AArch64 overloaded type checking code for SemaChecking.cpp - genOverloadTypeCheckCode(OS, A64IntrinsicMap, true); + genOverloadTypeCheckCode(OS); // Generate ARM range checking code for shift/lane immediates. - genIntrinsicRangeCheckCode(OS, A64IntrinsicMap, false); - - // Generate the AArch64 range checking code for shift/lane immediates. - genIntrinsicRangeCheckCode(OS, A64IntrinsicMap, true); + genIntrinsicRangeCheckCode(OS); } /// GenTest - Write out a test for the intrinsic specified by the name and |