зеркало из https://github.com/microsoft/clang.git
Skip extra copy from aggregate where it isn't necessary; rdar://problem/8139919 . This shouldn't make much of a difference at -O3, but should substantially reduce the number of generated memcpy's at -O0.
git-svn-id: https://llvm.org/svn/llvm-project/cfe/trunk@130717 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
Родитель
35bdbf4062
Коммит
b5a03b6217
|
@ -1166,6 +1166,15 @@ void CodeGenFunction::EmitCallArg(CallArgList &args, const Expr *E,
|
|||
return args.add(EmitReferenceBindingToExpr(E, /*InitializedDecl=*/0),
|
||||
type);
|
||||
|
||||
if (hasAggregateLLVMType(type) && isa<ImplicitCastExpr>(E) &&
|
||||
cast<CastExpr>(E)->getCastKind() == CK_LValueToRValue) {
|
||||
LValue L = EmitLValue(cast<CastExpr>(E)->getSubExpr());
|
||||
assert(L.isSimple());
|
||||
args.add(RValue::getAggregate(L.getAddress(), L.isVolatileQualified()),
|
||||
type, /*NeedsCopy*/true);
|
||||
return;
|
||||
}
|
||||
|
||||
args.add(EmitAnyExprToTemp(E), type);
|
||||
}
|
||||
|
||||
|
@ -1231,6 +1240,10 @@ RValue CodeGenFunction::EmitCall(const CGFunctionInfo &CallInfo,
|
|||
Alignment, I->Ty);
|
||||
else
|
||||
StoreComplexToAddr(RV.getComplexVal(), Args.back(), false);
|
||||
} else if (I->NeedsCopy && !ArgInfo.getIndirectByVal()) {
|
||||
Args.push_back(CreateMemTemp(I->Ty));
|
||||
EmitAggregateCopy(Args.back(), RV.getAggregateAddr(), I->Ty,
|
||||
RV.isVolatileQualified());
|
||||
} else {
|
||||
Args.push_back(RV.getAggregateAddr());
|
||||
}
|
||||
|
|
|
@ -47,8 +47,9 @@ namespace CodeGen {
|
|||
struct CallArg {
|
||||
RValue RV;
|
||||
QualType Ty;
|
||||
CallArg(RValue rv, QualType ty)
|
||||
: RV(rv), Ty(ty)
|
||||
bool NeedsCopy;
|
||||
CallArg(RValue rv, QualType ty, bool needscopy)
|
||||
: RV(rv), Ty(ty), NeedsCopy(needscopy)
|
||||
{ }
|
||||
};
|
||||
|
||||
|
@ -57,8 +58,8 @@ namespace CodeGen {
|
|||
class CallArgList :
|
||||
public llvm::SmallVector<CallArg, 16> {
|
||||
public:
|
||||
void add(RValue rvalue, QualType type) {
|
||||
push_back(CallArg(rvalue, type));
|
||||
void add(RValue rvalue, QualType type, bool needscopy = false) {
|
||||
push_back(CallArg(rvalue, type, needscopy));
|
||||
}
|
||||
};
|
||||
|
||||
|
|
|
@ -0,0 +1,20 @@
|
|||
// RUN: %clang_cc1 -emit-llvm -triple x86_64-apple-darwin10 < %s | FileCheck %s
|
||||
|
||||
struct Test1S {
|
||||
long NumDecls;
|
||||
long X;
|
||||
long Y;
|
||||
};
|
||||
struct Test2S {
|
||||
long NumDecls;
|
||||
long X;
|
||||
};
|
||||
|
||||
// Make sure we don't generate extra memcpy for lvalues
|
||||
void test1a(struct Test1S, struct Test2S);
|
||||
// CHECK: define void @test1(
|
||||
// CHECK-NOT: memcpy
|
||||
// CHECK: call void @test1a
|
||||
void test1(struct Test1S *A, struct Test2S *B) {
|
||||
test1a(*A, *B);
|
||||
}
|
Загрузка…
Ссылка в новой задаче