Index: clang/lib/CodeGen/TargetInfo.cpp =================================================================== --- clang/lib/CodeGen/TargetInfo.cpp +++ clang/lib/CodeGen/TargetInfo.cpp @@ -7418,18 +7418,29 @@ }; class SystemZTargetCodeGenInfo : public TargetCodeGenInfo { + ASTContext &Ctx; + + const SystemZABIInfo &getABIInfo() const { + return static_cast(TargetCodeGenInfo::getABIInfo()); + } + // These are used for speeding up the search for a visible vector ABI. mutable bool HasVisibleVecABIFlag = false; mutable std::set SeenTypes; - // Returns true (the first time) if Ty is or found to make use of a vector - // type (e.g. as a function argument). - bool isVectorTypeBased(const Type *Ty) const; + // Returns true (the first time) if Ty is, or is found to include, a vector + // type that exposes the vector ABI. This is any vector >=16 bytes which + // with vector support are aligned to only 8 bytes. When IsParam is true, + // the type belongs to a value as passed between functions. If it is a + // vector <=16 bytes it will be passed in a register in case of vector + // support. + bool isVectorTypeBased(const Type *Ty, bool IsParam = false) const; public: SystemZTargetCodeGenInfo(CodeGenTypes &CGT, bool HasVector, bool SoftFloatABI) : TargetCodeGenInfo( - std::make_unique(CGT, HasVector, SoftFloatABI)) { + std::make_unique(CGT, HasVector, SoftFloatABI)), + Ctx(CGT.getContext()) { SwiftInfo = std::make_unique(CGT, /*SwiftErrorInRegister=*/false); } @@ -7440,8 +7451,9 @@ // a GNU attribute indicating the vector ABI of the module. Ty is the type // of a variable or function parameter that is globally visible. void handleExternallyVisibleObjABI(const Type *Ty, - CodeGen::CodeGenModule &M) const { - if (!HasVisibleVecABIFlag && isVectorTypeBased(Ty)) { + CodeGen::CodeGenModule &M, + bool IsParam = false) const { + if (!HasVisibleVecABIFlag && isVectorTypeBased(Ty, IsParam)) { M.getModule().addModuleFlag(llvm::Module::Warning, "s390x-visible-vector-ABI", 1); HasVisibleVecABIFlag = true; @@ -7571,17 +7583,18 @@ // If this is a C++ record, check the bases first. if (const CXXRecordDecl *CXXRD = dyn_cast(RD)) - for (const auto &I : CXXRD->bases()) { - QualType Base = I.getType(); + if (CXXRD->hasDefinition()) + for (const auto &I : CXXRD->bases()) { + QualType Base = I.getType(); - // Empty bases don't affect things either way. - if (isEmptyRecord(getContext(), Base, true)) - continue; + // Empty bases don't affect things either way. + if (isEmptyRecord(getContext(), Base, true)) + continue; - if (!Found.isNull()) - return Ty; - Found = GetSingleElementType(Base); - } + if (!Found.isNull()) + return Ty; + Found = GetSingleElementType(Base); + } // Check the fields. for (const auto *FD : RD->fields()) { @@ -7635,7 +7648,8 @@ bool IsVector = false; CharUnits UnpaddedSize; CharUnits DirectAlign; - SZCGI.handleExternallyVisibleObjABI(Ty.getTypePtr(), CGT.getCGM()); + SZCGI.handleExternallyVisibleObjABI(Ty.getTypePtr(), CGT.getCGM(), + /*IsParam*/true); if (IsIndirect) { DirectTy = llvm::PointerType::getUnqual(DirectTy); UnpaddedSize = DirectAlign = CharUnits::fromQuantity(8); @@ -7843,17 +7857,30 @@ // Check if a vararg vector argument is passed, in which case the // vector ABI becomes visible as the va_list could be passed on to // other functions. - SZCGI.handleExternallyVisibleObjABI(I.type.getTypePtr(), CGT.getCGM()); + SZCGI.handleExternallyVisibleObjABI(I.type.getTypePtr(), CGT.getCGM(), + /*IsParam*/true); } } -bool SystemZTargetCodeGenInfo::isVectorTypeBased(const Type *Ty) const { +bool SystemZTargetCodeGenInfo::isVectorTypeBased(const Type *Ty, + bool IsParam) const { while (Ty->isPointerType() || Ty->isArrayType()) Ty = Ty->getPointeeOrArrayElementType(); if (!SeenTypes.insert(Ty).second) return false; - if (Ty->isVectorType()) - return true; + if (Ty->isVectorType()) { + unsigned Bytes = Ctx.getTypeSize(Ty) / 8; + if (Bytes >= 16 || IsParam) + return true; + } + if (IsParam) { + const Type *SingleEltTy = + getABIInfo().GetSingleElementType(QualType(Ty, 0)).getTypePtr(); + if (SingleEltTy != Ty && SingleEltTy->isVectorType() && + Ctx.getTypeSize(SingleEltTy) == Ctx.getTypeSize(Ty)) + return true; + } + if (const auto *RecordTy = Ty->getAs()) { const RecordDecl *RD = RecordTy->getDecl(); if (const CXXRecordDecl *CXXRD = dyn_cast(RD)) @@ -7866,11 +7893,11 @@ return true; } if (const auto *FT = Ty->getAs()) - if (isVectorTypeBased(FT->getReturnType().getTypePtr())) + if (isVectorTypeBased(FT->getReturnType().getTypePtr(), true)) return true; if (const FunctionProtoType *Proto = Ty->getAs()) for (auto ParamType : Proto->getParamTypes()) - if (isVectorTypeBased(ParamType.getTypePtr())) + if (isVectorTypeBased(ParamType.getTypePtr(), true)) return true; return false; } Index: clang/test/CodeGen/SystemZ/vec-abi-gnuattr-03b.c =================================================================== --- /dev/null +++ clang/test/CodeGen/SystemZ/vec-abi-gnuattr-03b.c @@ -0,0 +1,19 @@ +// RUN: %clang_cc1 -triple s390x-ibm-linux -emit-llvm -fzvector -o - %s 2>&1 \ +// RUN: | FileCheck %s +// +// Test that the "s390x-visible-vector-ABI" module flag is emitted. + +// Call to external function with with narrow vector argument. + +typedef __attribute__((vector_size(8))) int v2i32; + +void bar(v2i32 arg); + +void foo() { + v2i32 Var = {0, 0}; + bar(Var); +} + +//CHECK: !llvm.module.flags = !{!0, !1} +//CHECK: !0 = !{i32 2, !"s390x-visible-vector-ABI", i32 1} + Index: clang/test/CodeGen/SystemZ/vec-abi-gnuattr-08b.c =================================================================== --- /dev/null +++ clang/test/CodeGen/SystemZ/vec-abi-gnuattr-08b.c @@ -0,0 +1,22 @@ +// RUN: %clang_cc1 -triple s390x-ibm-linux -emit-llvm -fzvector -o - %s 2>&1 \ +// RUN: | FileCheck %s +// +// Test the emission of the "s390x-visible-vector-ABI" module flag. + +// Passing a single element struct containing a narrow (8 byte) vector element. + +typedef __attribute__((vector_size(8))) int v2i32; + +struct S { + v2i32 B; +}; + +void bar(struct S Arg); + +void foo() { + struct S Var = {{0, 0}}; + bar(Var); +} + +//CHECK: !llvm.module.flags = !{!0, !1} +//CHECK: !0 = !{i32 2, !"s390x-visible-vector-ABI", i32 1} Index: clang/test/CodeGen/SystemZ/vec-abi-gnuattr-09b.c =================================================================== --- /dev/null +++ clang/test/CodeGen/SystemZ/vec-abi-gnuattr-09b.c @@ -0,0 +1,18 @@ +// RUN: %clang_cc1 -triple s390x-ibm-linux -emit-llvm -fzvector -o - %s 2>&1 \ +// RUN: | FileCheck %s +// +// Test the emission of the "s390x-visible-vector-ABI" module flag. + +// Call to vararg function with a narrow (8 bytes) vector argument. + +typedef __attribute__((vector_size(8))) int v2i32; + +void bar(int N, ...); + +void foo() { + v2i32 Var = {0, 0}; + bar(0, Var); +} + +//CHECK: !llvm.module.flags = !{!0, !1} +//CHECK: !0 = !{i32 2, !"s390x-visible-vector-ABI", i32 1} Index: clang/test/CodeGen/SystemZ/vec-abi-gnuattr-17b.c =================================================================== --- /dev/null +++ clang/test/CodeGen/SystemZ/vec-abi-gnuattr-17b.c @@ -0,0 +1,13 @@ +// RUN: %clang_cc1 -triple s390x-ibm-linux -emit-llvm -fzvector -o - %s 2>&1 \ +// RUN: | FileCheck %s +// +// Test that the "s390x-visible-vector-ABI" module flag is emitted. + +// Globally visible function pointer with narrow vector argument. + +typedef __attribute__((vector_size(8))) int v2i32; + +void (*bar)(v2i32 Arg); + +//CHECK: !llvm.module.flags = !{!0, !1} +//CHECK: !0 = !{i32 2, !"s390x-visible-vector-ABI", i32 1} Index: clang/test/CodeGen/SystemZ/vec-abi-gnuattr-24.c =================================================================== --- clang/test/CodeGen/SystemZ/vec-abi-gnuattr-24.c +++ clang/test/CodeGen/SystemZ/vec-abi-gnuattr-24.c @@ -34,4 +34,8 @@ return foo(V)[0] + GlobVal + GlobExtVar; } +// Globally visible vector variable less than 16 bytes in size. +typedef __attribute__((vector_size(8))) int v2i32; +v2i32 NarrowVecVar; + //CHECK-NOT: !{i32 2, !"s390x-visible-vector-ABI", i32 1}