Change -mno-mmx to be more compatible with gcc. Specifically, -mno-mmx should not imply -mno-sse.

Note that because we don't usually touch the MMX registers anyway, all -mno-mmx needs to do is tweak the x86-32 calling convention a little for vectors that look like MMX vectors, and prevent the definition of __MMX__.

clang doesn't actually stop the user from using MMX inline asm operands or MMX builtins in -mno-mmx mode; as a QOI issue, it would be nice to diagnose, but I doubt it really matters much.

<rdar://problem/9694837>



git-svn-id: https://llvm.org/svn/llvm-project/cfe/trunk@134770 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
Eli Friedman 2011-07-08 23:31:17 +00:00
Родитель 528a8c7b4c
Коммит c3e0fb406f
6 изменённых файлов: 84 добавлений и 50 удалений

Просмотреть файл

@ -1110,18 +1110,18 @@ const TargetInfo::AddlRegName AddlRegNames[] = {
// most of the implementation can be shared. // most of the implementation can be shared.
class X86TargetInfo : public TargetInfo { class X86TargetInfo : public TargetInfo {
enum X86SSEEnum { enum X86SSEEnum {
NoMMXSSE, MMX, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42 NoSSE, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42
} SSELevel; } SSELevel;
enum AMD3DNowEnum { enum MMX3DNowEnum {
NoAMD3DNow, AMD3DNow, AMD3DNowAthlon NoMMX3DNow, MMX, AMD3DNow, AMD3DNowAthlon
} AMD3DNowLevel; } MMX3DNowLevel;
bool HasAES; bool HasAES;
bool HasAVX; bool HasAVX;
public: public:
X86TargetInfo(const std::string& triple) X86TargetInfo(const std::string& triple)
: TargetInfo(triple), SSELevel(NoMMXSSE), AMD3DNowLevel(NoAMD3DNow), : TargetInfo(triple), SSELevel(NoSSE), MMX3DNowLevel(NoMMX3DNow),
HasAES(false), HasAVX(false) { HasAES(false), HasAVX(false) {
LongDoubleFormat = &llvm::APFloat::x87DoubleExtended; LongDoubleFormat = &llvm::APFloat::x87DoubleExtended;
} }
@ -1159,6 +1159,9 @@ public:
virtual void getDefaultFeatures(const std::string &CPU, virtual void getDefaultFeatures(const std::string &CPU,
llvm::StringMap<bool> &Features) const; llvm::StringMap<bool> &Features) const;
virtual void HandleTargetFeatures(std::vector<std::string> &Features); virtual void HandleTargetFeatures(std::vector<std::string> &Features);
virtual const char* getABI() const {
return MMX3DNowLevel == NoMMX3DNow ? "no-mmx" : "";
}
}; };
void X86TargetInfo::getDefaultFeatures(const std::string &CPU, void X86TargetInfo::getDefaultFeatures(const std::string &CPU,
@ -1190,23 +1193,31 @@ void X86TargetInfo::getDefaultFeatures(const std::string &CPU,
; ;
else if (CPU == "pentium-mmx" || CPU == "pentium2") else if (CPU == "pentium-mmx" || CPU == "pentium2")
setFeatureEnabled(Features, "mmx", true); setFeatureEnabled(Features, "mmx", true);
else if (CPU == "pentium3") else if (CPU == "pentium3") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "sse", true); setFeatureEnabled(Features, "sse", true);
else if (CPU == "pentium-m" || CPU == "pentium4" || CPU == "x86-64") } else if (CPU == "pentium-m" || CPU == "pentium4" || CPU == "x86-64") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "sse2", true); setFeatureEnabled(Features, "sse2", true);
else if (CPU == "yonah" || CPU == "prescott" || CPU == "nocona") } else if (CPU == "yonah" || CPU == "prescott" || CPU == "nocona") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "sse3", true); setFeatureEnabled(Features, "sse3", true);
else if (CPU == "core2") } else if (CPU == "core2") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "ssse3", true); setFeatureEnabled(Features, "ssse3", true);
else if (CPU == "penryn") { } else if (CPU == "penryn") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "sse4", true); setFeatureEnabled(Features, "sse4", true);
Features["sse42"] = false; Features["sse42"] = false;
} else if (CPU == "atom") } else if (CPU == "atom") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "sse3", true); setFeatureEnabled(Features, "sse3", true);
else if (CPU == "corei7") { } else if (CPU == "corei7") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "sse4", true); setFeatureEnabled(Features, "sse4", true);
setFeatureEnabled(Features, "aes", true); setFeatureEnabled(Features, "aes", true);
} else if (CPU == "corei7-avx") { } else if (CPU == "corei7-avx") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "sse4", true); setFeatureEnabled(Features, "sse4", true);
setFeatureEnabled(Features, "aes", true); setFeatureEnabled(Features, "aes", true);
// setFeatureEnabled(Features, "avx", true); // setFeatureEnabled(Features, "avx", true);
@ -1214,7 +1225,6 @@ void X86TargetInfo::getDefaultFeatures(const std::string &CPU,
setFeatureEnabled(Features, "mmx", true); setFeatureEnabled(Features, "mmx", true);
else if (CPU == "k6-2" || CPU == "k6-3" || CPU == "athlon" || else if (CPU == "k6-2" || CPU == "k6-3" || CPU == "athlon" ||
CPU == "athlon-tbird" || CPU == "winchip2" || CPU == "c3") { CPU == "athlon-tbird" || CPU == "winchip2" || CPU == "c3") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "3dnow", true); setFeatureEnabled(Features, "3dnow", true);
} else if (CPU == "athlon-4" || CPU == "athlon-xp" || CPU == "athlon-mp") { } else if (CPU == "athlon-4" || CPU == "athlon-xp" || CPU == "athlon-mp") {
setFeatureEnabled(Features, "sse", true); setFeatureEnabled(Features, "sse", true);
@ -1226,8 +1236,10 @@ void X86TargetInfo::getDefaultFeatures(const std::string &CPU,
} else if (CPU == "k8-sse3") { } else if (CPU == "k8-sse3") {
setFeatureEnabled(Features, "sse3", true); setFeatureEnabled(Features, "sse3", true);
setFeatureEnabled(Features, "3dnowa", true); setFeatureEnabled(Features, "3dnowa", true);
} else if (CPU == "c3-2") } else if (CPU == "c3-2") {
setFeatureEnabled(Features, "mmx", true);
setFeatureEnabled(Features, "sse", true); setFeatureEnabled(Features, "sse", true);
}
} }
bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features, bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features,
@ -1243,34 +1255,31 @@ bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features,
if (Name == "mmx") if (Name == "mmx")
Features["mmx"] = true; Features["mmx"] = true;
else if (Name == "sse") else if (Name == "sse")
Features["mmx"] = Features["sse"] = true; Features["sse"] = true;
else if (Name == "sse2") else if (Name == "sse2")
Features["mmx"] = Features["sse"] = Features["sse2"] = true; Features["sse"] = Features["sse2"] = true;
else if (Name == "sse3") else if (Name == "sse3")
Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse"] = Features["sse2"] = Features["sse3"] = true;
Features["sse3"] = true;
else if (Name == "ssse3") else if (Name == "ssse3")
Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] = Features["sse"] = Features["sse2"] = Features["sse3"] =
Features["ssse3"] = true; Features["ssse3"] = true;
else if (Name == "sse4" || Name == "sse4.2") else if (Name == "sse4" || Name == "sse4.2")
Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] = Features["sse"] = Features["sse2"] = Features["sse3"] =
Features["ssse3"] = Features["sse41"] = Features["sse42"] = true; Features["ssse3"] = Features["sse41"] = Features["sse42"] = true;
else if (Name == "sse4.1") else if (Name == "sse4.1")
Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] = Features["sse"] = Features["sse2"] = Features["sse3"] =
Features["ssse3"] = Features["sse41"] = true; Features["ssse3"] = Features["sse41"] = true;
else if (Name == "3dnow") else if (Name == "3dnow")
Features["3dnowa"] = true; Features["mmx"] = Features["3dnow"] = true;
else if (Name == "3dnowa") else if (Name == "3dnowa")
Features["3dnow"] = Features["3dnowa"] = true; Features["mmx"] = Features["3dnow"] = Features["3dnowa"] = true;
else if (Name == "aes") else if (Name == "aes")
Features["aes"] = true; Features["aes"] = true;
else if (Name == "avx") else if (Name == "avx")
Features["avx"] = true; Features["avx"] = true;
} else { } else {
if (Name == "mmx") if (Name == "mmx")
Features["mmx"] = Features["3dnow"] = Features["3dnowa"] = Features["mmx"] = Features["3dnow"] = Features["3dnowa"] = false;
Features["sse"] = Features["sse2"] = Features["sse3"] =
Features["ssse3"] = Features["sse41"] = Features["sse42"] = false;
else if (Name == "sse") else if (Name == "sse")
Features["sse"] = Features["sse2"] = Features["sse3"] = Features["sse"] = Features["sse2"] = Features["sse3"] =
Features["ssse3"] = Features["sse41"] = Features["sse42"] = false; Features["ssse3"] = Features["sse41"] = Features["sse42"] = false;
@ -1328,18 +1337,25 @@ void X86TargetInfo::HandleTargetFeatures(std::vector<std::string> &Features) {
.Case("sse3", SSE3) .Case("sse3", SSE3)
.Case("sse2", SSE2) .Case("sse2", SSE2)
.Case("sse", SSE1) .Case("sse", SSE1)
.Case("mmx", MMX) .Default(NoSSE);
.Default(NoMMXSSE);
SSELevel = std::max(SSELevel, Level); SSELevel = std::max(SSELevel, Level);
AMD3DNowEnum ThreeDNowLevel = MMX3DNowEnum ThreeDNowLevel =
llvm::StringSwitch<AMD3DNowEnum>(Features[i].substr(1)) llvm::StringSwitch<MMX3DNowEnum>(Features[i].substr(1))
.Case("3dnowa", AMD3DNowAthlon) .Case("3dnowa", AMD3DNowAthlon)
.Case("3dnow", AMD3DNow) .Case("3dnow", AMD3DNow)
.Default(NoAMD3DNow); .Case("mmx", MMX)
.Default(NoMMX3DNow);
AMD3DNowLevel = std::max(AMD3DNowLevel, ThreeDNowLevel); MMX3DNowLevel = std::max(MMX3DNowLevel, ThreeDNowLevel);
} }
// Don't tell the backend if we're turning off mmx; it will end up disabling
// SSE, which we don't want.
std::vector<std::string>::iterator it;
it = std::find(Features.begin(), Features.end(), "-mmx");
if (it != Features.end())
Features.erase(it);
} }
/// X86TargetInfo::getTargetDefines - Return a set of the X86-specific #defines /// X86TargetInfo::getTargetDefines - Return a set of the X86-specific #defines
@ -1394,9 +1410,7 @@ void X86TargetInfo::getTargetDefines(const LangOptions &Opts,
case SSE1: case SSE1:
Builder.defineMacro("__SSE__"); Builder.defineMacro("__SSE__");
Builder.defineMacro("__SSE_MATH__"); // -mfp-math=sse always implied. Builder.defineMacro("__SSE_MATH__"); // -mfp-math=sse always implied.
case MMX: case NoSSE:
Builder.defineMacro("__MMX__");
case NoMMXSSE:
break; break;
} }
@ -1418,12 +1432,14 @@ void X86TargetInfo::getTargetDefines(const LangOptions &Opts,
} }
// Each case falls through to the previous one here. // Each case falls through to the previous one here.
switch (AMD3DNowLevel) { switch (MMX3DNowLevel) {
case AMD3DNowAthlon: case AMD3DNowAthlon:
Builder.defineMacro("__3dNOW_A__"); Builder.defineMacro("__3dNOW_A__");
case AMD3DNow: case AMD3DNow:
Builder.defineMacro("__3dNOW__"); Builder.defineMacro("__3dNOW__");
case NoAMD3DNow: case MMX:
Builder.defineMacro("__MMX__");
case NoMMX3DNow:
break; break;
} }
} }

Просмотреть файл

@ -374,6 +374,7 @@ class X86_32ABIInfo : public ABIInfo {
bool IsDarwinVectorABI; bool IsDarwinVectorABI;
bool IsSmallStructInRegABI; bool IsSmallStructInRegABI;
bool IsMMXDisabled;
static bool isRegisterSize(unsigned Size) { static bool isRegisterSize(unsigned Size) {
return (Size == 8 || Size == 16 || Size == 32 || Size == 64); return (Size == 8 || Size == 16 || Size == 32 || Size == 64);
@ -403,14 +404,15 @@ public:
virtual llvm::Value *EmitVAArg(llvm::Value *VAListAddr, QualType Ty, virtual llvm::Value *EmitVAArg(llvm::Value *VAListAddr, QualType Ty,
CodeGenFunction &CGF) const; CodeGenFunction &CGF) const;
X86_32ABIInfo(CodeGen::CodeGenTypes &CGT, bool d, bool p) X86_32ABIInfo(CodeGen::CodeGenTypes &CGT, bool d, bool p, bool m)
: ABIInfo(CGT), IsDarwinVectorABI(d), IsSmallStructInRegABI(p) {} : ABIInfo(CGT), IsDarwinVectorABI(d), IsSmallStructInRegABI(p),
IsMMXDisabled(m) {}
}; };
class X86_32TargetCodeGenInfo : public TargetCodeGenInfo { class X86_32TargetCodeGenInfo : public TargetCodeGenInfo {
public: public:
X86_32TargetCodeGenInfo(CodeGen::CodeGenTypes &CGT, bool d, bool p) X86_32TargetCodeGenInfo(CodeGen::CodeGenTypes &CGT, bool d, bool p, bool m)
:TargetCodeGenInfo(new X86_32ABIInfo(CGT, d, p)) {} :TargetCodeGenInfo(new X86_32ABIInfo(CGT, d, p, m)) {}
void SetTargetAttributes(const Decl *D, llvm::GlobalValue *GV, void SetTargetAttributes(const Decl *D, llvm::GlobalValue *GV,
CodeGen::CodeGenModule &CGM) const; CodeGen::CodeGenModule &CGM) const;
@ -701,6 +703,9 @@ ABIArgInfo X86_32ABIInfo::classifyArgumentType(QualType Ty) const {
const llvm::Type *IRType = CGT.ConvertTypeRecursive(Ty); const llvm::Type *IRType = CGT.ConvertTypeRecursive(Ty);
if (UseX86_MMXType(IRType)) { if (UseX86_MMXType(IRType)) {
if (IsMMXDisabled)
return ABIArgInfo::getDirect(llvm::IntegerType::get(getVMContext(),
64));
ABIArgInfo AAI = ABIArgInfo::getDirect(IRType); ABIArgInfo AAI = ABIArgInfo::getDirect(IRType);
AAI.setCoerceToType(llvm::Type::getX86_MMXTy(getVMContext())); AAI.setCoerceToType(llvm::Type::getX86_MMXTy(getVMContext()));
return AAI; return AAI;
@ -3006,10 +3011,12 @@ const TargetCodeGenInfo &CodeGenModule::getTargetCodeGenInfo() {
case llvm::Triple::msp430: case llvm::Triple::msp430:
return *(TheTargetCodeGenInfo = new MSP430TargetCodeGenInfo(Types)); return *(TheTargetCodeGenInfo = new MSP430TargetCodeGenInfo(Types));
case llvm::Triple::x86: case llvm::Triple::x86: {
bool DisableMMX = strcmp(getContext().Target.getABI(), "no-mmx") == 0;
if (Triple.isOSDarwin()) if (Triple.isOSDarwin())
return *(TheTargetCodeGenInfo = return *(TheTargetCodeGenInfo =
new X86_32TargetCodeGenInfo(Types, true, true)); new X86_32TargetCodeGenInfo(Types, true, true, DisableMMX));
switch (Triple.getOS()) { switch (Triple.getOS()) {
case llvm::Triple::Cygwin: case llvm::Triple::Cygwin:
@ -3020,12 +3027,13 @@ const TargetCodeGenInfo &CodeGenModule::getTargetCodeGenInfo() {
case llvm::Triple::OpenBSD: case llvm::Triple::OpenBSD:
case llvm::Triple::NetBSD: case llvm::Triple::NetBSD:
return *(TheTargetCodeGenInfo = return *(TheTargetCodeGenInfo =
new X86_32TargetCodeGenInfo(Types, false, true)); new X86_32TargetCodeGenInfo(Types, false, true, DisableMMX));
default: default:
return *(TheTargetCodeGenInfo = return *(TheTargetCodeGenInfo =
new X86_32TargetCodeGenInfo(Types, false, false)); new X86_32TargetCodeGenInfo(Types, false, false, DisableMMX));
} }
}
case llvm::Triple::x86_64: case llvm::Triple::x86_64:
switch (Triple.getOS()) { switch (Triple.getOS()) {

Просмотреть файл

@ -1,5 +1,4 @@
// RUN: %clang_cc1 -w -fblocks -triple i386-apple-darwin9 -emit-llvm -o %t %s // RUN: %clang_cc1 -w -fblocks -triple i386-apple-darwin9 -target-cpu yonah -emit-llvm -o - %s | FileCheck %s
// RUN: FileCheck < %t %s
// CHECK: define signext i8 @f0() // CHECK: define signext i8 @f0()
char f0(void) { char f0(void) {

Просмотреть файл

@ -1,4 +1,4 @@
// RUN: %clang_cc1 -w -fblocks -triple i386-pc-linux-gnu -emit-llvm -o %t %s // RUN: %clang_cc1 -w -fblocks -triple i386-pc-linux-gnu -target-cpu pentium4 -emit-llvm -o %t %s
// RUN: FileCheck < %t %s // RUN: FileCheck < %t %s
// CHECK: define void @f56( // CHECK: define void @f56(

Просмотреть файл

@ -0,0 +1,11 @@
// RUN: %clang_cc1 -target-feature -mmx -target-feature +sse2 -triple i686-pc-linux-gnu -emit-llvm -o - %s | FileCheck %s
// no-mmx should put mmx into memory
typedef int __attribute__((vector_size (8))) i32v2;
int a(i32v2 x) { return x[0]; }
// CHECK: define i32 @a(i64 %x.coerce)
// but SSE2 vectors should still go into an SSE2 register
typedef int __attribute__((vector_size (16))) i32v4;
int b(i32v4 x) { return x[0]; }
// CHECK: define i32 @b(<4 x i32> %x.coerce)

Просмотреть файл

@ -1,5 +1,5 @@
// RUN: %clang_cc1 -ffreestanding -fsyntax-only -target-feature +ssse3 -verify -triple x86_64-pc-linux-gnu %s // RUN: %clang_cc1 -ffreestanding -fsyntax-only -target-feature +ssse3 -target-feature +mmx -verify -triple x86_64-pc-linux-gnu %s
// RUN: %clang_cc1 -ffreestanding -fsyntax-only -target-feature +ssse3 -verify -triple i686-apple-darwin10 %s // RUN: %clang_cc1 -ffreestanding -fsyntax-only -target-feature +ssse3 -target-feature +mmx -verify -triple i686-apple-darwin10 %s
#include <tmmintrin.h> #include <tmmintrin.h>