Skip extra copy from aggregate where it isn't necessary; rdar://problem/8139919 . This shouldn't make much of a difference at -O3, but should substantially reduce the number of generated memcpy's at -O0.

git-svn-id: https://llvm.org/svn/llvm-project/cfe/trunk@130717 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
Eli Friedman 2011-05-02 20:24:29 +00:00
Родитель 35bdbf4062
Коммит b5a03b6217
3 изменённых файлов: 38 добавлений и 4 удалений

Просмотреть файл

@ -1166,6 +1166,15 @@ void CodeGenFunction::EmitCallArg(CallArgList &args, const Expr *E,
return args.add(EmitReferenceBindingToExpr(E, /*InitializedDecl=*/0),
type);
if (hasAggregateLLVMType(type) && isa<ImplicitCastExpr>(E) &&
cast<CastExpr>(E)->getCastKind() == CK_LValueToRValue) {
LValue L = EmitLValue(cast<CastExpr>(E)->getSubExpr());
assert(L.isSimple());
args.add(RValue::getAggregate(L.getAddress(), L.isVolatileQualified()),
type, /*NeedsCopy*/true);
return;
}
args.add(EmitAnyExprToTemp(E), type);
}
@ -1231,6 +1240,10 @@ RValue CodeGenFunction::EmitCall(const CGFunctionInfo &CallInfo,
Alignment, I->Ty);
else
StoreComplexToAddr(RV.getComplexVal(), Args.back(), false);
} else if (I->NeedsCopy && !ArgInfo.getIndirectByVal()) {
Args.push_back(CreateMemTemp(I->Ty));
EmitAggregateCopy(Args.back(), RV.getAggregateAddr(), I->Ty,
RV.isVolatileQualified());
} else {
Args.push_back(RV.getAggregateAddr());
}

Просмотреть файл

@ -47,8 +47,9 @@ namespace CodeGen {
struct CallArg {
RValue RV;
QualType Ty;
CallArg(RValue rv, QualType ty)
: RV(rv), Ty(ty)
bool NeedsCopy;
CallArg(RValue rv, QualType ty, bool needscopy)
: RV(rv), Ty(ty), NeedsCopy(needscopy)
{ }
};
@ -57,8 +58,8 @@ namespace CodeGen {
class CallArgList :
public llvm::SmallVector<CallArg, 16> {
public:
void add(RValue rvalue, QualType type) {
push_back(CallArg(rvalue, type));
void add(RValue rvalue, QualType type, bool needscopy = false) {
push_back(CallArg(rvalue, type, needscopy));
}
};

Просмотреть файл

@ -0,0 +1,20 @@
// RUN: %clang_cc1 -emit-llvm -triple x86_64-apple-darwin10 < %s | FileCheck %s
struct Test1S {
long NumDecls;
long X;
long Y;
};
struct Test2S {
long NumDecls;
long X;
};
// Make sure we don't generate extra memcpy for lvalues
void test1a(struct Test1S, struct Test2S);
// CHECK: define void @test1(
// CHECK-NOT: memcpy
// CHECK: call void @test1a
void test1(struct Test1S *A, struct Test2S *B) {
test1a(*A, *B);
}