This is an archive of the discontinued LLVM Phabricator instance.

clang/lib/CodeGen/CGBuiltin.cpp
2518	Is it an error here? It should be: if (BuiltinID == Builtin::BImempcpy || BuiltinID == Builtin::BI__builtin_mempcpy) return RValue::get(Builder.CreateGEP(Dest.getPointer(), SizeVal)); else return RValue::get(Dest.getPointer());

@Jim obviously :-) Thanks for spotting that.

serge-sans-paille marked an inline comment as done.Dec 12 2019, 5:07 AM

jedilyn edited reviewers, added: Jim, erik.pilkington; removed: jedilyn.Dec 12 2019, 9:06 PM

Herald added a subscriber: dexonsmith. · View Herald TranscriptDec 12 2019, 9:06 PM

I am curious: what is the difference in code generation after applying your changes?

Please add an IR codegen test.

In D71374#1783032, @Jim wrote:

I am curious: what is the difference in code generation after applying your changes?

[[updated]]
Before, when compiling

#define _GNU_SOURCE
#include <string.h>

void* foo(void* to, void* from, unsigned n) {
  return mempcpy(mempcpy(to, from, n), from, n);
}

We get (clang -O3)

define dso_local i8* @foo(i8* %0, i8* nocapture readonly %1, i32 %2) local_unnamed_addr #0 {
  %4 = zext i32 %2 to i64
  tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 %0, i8* align 1 %1, i64 %4, i1 false) #2
  %5 = getelementptr inbounds i8, i8* %0, i64 %4
  tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 %5, i8* align 1 %1, i64 %4, i1 false) #2
  %6 = getelementptr inbounds i8, i8* %5, i64 %4
  ret i8* %6
}

And we now get

define dso_local i8* @foo(i8* %to, i8* nocapture readonly %from, i32 %n) local_unnamed_addr #0 {
entry:
  %conv = zext i32 %n to i64
  tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 %to, i8* align 1 %from, i64 %conv, i1 false)
  %0 = getelementptr i8, i8* %to, i64 %conv
  tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 %0, i8* align 1 %from, i64 %conv, i1 false)
  %1 = getelementptr i8, i8* %0, i64 %conv
  ret i8* %1
}

So no real change apart from the inbounds keyword that I forgot to add.

LLVM already converts mempcpy to memcpy..

In D71374#1783245, @xbolva00 wrote:

LLVM already converts mempcpy to memcpy..

Indeed, the clang version I was using as base reference was clang-9, and the mempcpy optimisation at IR level got introduced after that.
Nevertheless, this patch does much more than lowering mempcpy: it also triggers new warnings, so it's still useful that clang understands it.

@xbolva00 should I remove the lowering part and leave it to llvm?

[[edited the example to reflect actual state]]

@xbolva00 should I remove the lowering part and leave it to llvm?

Probably okay to leave it + inbounds, but please add a test.

Added test cases + inbounds GEP

@xbolva00 : validation is ok: https://github.com/serge-sans-paille/llvm-project/pull/5/checks

@xbolva00 : gentle reminder :-)

This revision is now accepted and ready to land.Jan 9 2020, 7:36 AM

Closed by commit rGcee4a1c95742: Improve support of GNU mempcpy (authored by serge-sans-paille). · Explain WhyJan 9 2020, 8:31 AM

This revision was automatically updated to reflect the committed changes.

Revision Contents

Path

Size

clang/

include/

clang/

Basic/

Builtins.def

1 line

lib/

AST/

Decl.cpp

7 lines

CodeGen/

CGBuiltin.cpp

10 lines

Sema/

SemaChecking.cpp

7 lines

test/

Analysis/

bstring.c

6 lines

CodeGen/

mempcpy-libcall.c

12 lines

Diff 237097

clang/include/clang/Basic/Builtins.def

	Show First 20 Lines • Show All 978 Lines • ▼ Show 20 Lines

	// Non-C library functions, active in GNU mode only.			// Non-C library functions, active in GNU mode only.
	// Functions with (returns_twice) attribute (marked as "j") are still active in			// Functions with (returns_twice) attribute (marked as "j") are still active in
	// all languages, because losing this attribute would result in miscompilation			// all languages, because losing this attribute would result in miscompilation
	// when these functions are used in non-GNU mode. PR16138.			// when these functions are used in non-GNU mode. PR16138.
	LIBBUILTIN(alloca, "v*z", "f", "stdlib.h", ALL_GNU_LANGUAGES)			LIBBUILTIN(alloca, "v*z", "f", "stdlib.h", ALL_GNU_LANGUAGES)
	// POSIX string.h			// POSIX string.h
	LIBBUILTIN(memccpy, "v*v*vC*iz", "f", "string.h", ALL_GNU_LANGUAGES)			LIBBUILTIN(memccpy, "v*v*vC*iz", "f", "string.h", ALL_GNU_LANGUAGES)
				LIBBUILTIN(mempcpy, "v*v*vC*z", "f", "string.h", ALL_GNU_LANGUAGES)
	LIBBUILTIN(stpcpy, "c*c*cC*", "f", "string.h", ALL_GNU_LANGUAGES)			LIBBUILTIN(stpcpy, "c*c*cC*", "f", "string.h", ALL_GNU_LANGUAGES)
	LIBBUILTIN(stpncpy, "c*c*cC*z", "f", "string.h", ALL_GNU_LANGUAGES)			LIBBUILTIN(stpncpy, "c*c*cC*z", "f", "string.h", ALL_GNU_LANGUAGES)
	LIBBUILTIN(strdup, "c*cC*", "f", "string.h", ALL_GNU_LANGUAGES)			LIBBUILTIN(strdup, "c*cC*", "f", "string.h", ALL_GNU_LANGUAGES)
	LIBBUILTIN(strndup, "c*cC*z", "f", "string.h", ALL_GNU_LANGUAGES)			LIBBUILTIN(strndup, "c*cC*z", "f", "string.h", ALL_GNU_LANGUAGES)
	// POSIX strings.h			// POSIX strings.h
	LIBBUILTIN(index, "c*cC*i", "f", "strings.h", ALL_GNU_LANGUAGES)			LIBBUILTIN(index, "c*cC*i", "f", "strings.h", ALL_GNU_LANGUAGES)
	LIBBUILTIN(rindex, "c*cC*i", "f", "strings.h", ALL_GNU_LANGUAGES)			LIBBUILTIN(rindex, "c*cC*i", "f", "strings.h", ALL_GNU_LANGUAGES)
	LIBBUILTIN(bzero, "vv*z", "f", "strings.h", ALL_GNU_LANGUAGES)			LIBBUILTIN(bzero, "vv*z", "f", "strings.h", ALL_GNU_LANGUAGES)
	▲ Show 20 Lines • Show All 577 Lines • Show Last 20 Lines

clang/lib/AST/Decl.cpp

Show First 20 Lines • Show All 3,873 Lines • ▼ Show 20 Lines	unsigned FunctionDecl::getMemoryFunctionKind() const {
case Builtin::BImemset:		case Builtin::BImemset:
return Builtin::BImemset;		return Builtin::BImemset;

case Builtin::BI__builtin_memcpy:		case Builtin::BI__builtin_memcpy:
case Builtin::BI__builtin___memcpy_chk:		case Builtin::BI__builtin___memcpy_chk:
case Builtin::BImemcpy:		case Builtin::BImemcpy:
return Builtin::BImemcpy;		return Builtin::BImemcpy;

		case Builtin::BI__builtin_mempcpy:
		case Builtin::BI__builtin___mempcpy_chk:
		case Builtin::BImempcpy:
		return Builtin::BImempcpy;

case Builtin::BI__builtin_memmove:		case Builtin::BI__builtin_memmove:
case Builtin::BI__builtin___memmove_chk:		case Builtin::BI__builtin___memmove_chk:
case Builtin::BImemmove:		case Builtin::BImemmove:
return Builtin::BImemmove;		return Builtin::BImemmove;

case Builtin::BIstrlcpy:		case Builtin::BIstrlcpy:
case Builtin::BI__builtin___strlcpy_chk:		case Builtin::BI__builtin___strlcpy_chk:
return Builtin::BIstrlcpy;		return Builtin::BIstrlcpy;
▲ Show 20 Lines • Show All 41 Lines • ▼ Show 20 Lines	case Builtin::BIbzero:
return Builtin::BIbzero;		return Builtin::BIbzero;

default:		default:
if (isExternC()) {		if (isExternC()) {
if (FnInfo->isStr("memset"))		if (FnInfo->isStr("memset"))
return Builtin::BImemset;		return Builtin::BImemset;
else if (FnInfo->isStr("memcpy"))		else if (FnInfo->isStr("memcpy"))
return Builtin::BImemcpy;		return Builtin::BImemcpy;
		else if (FnInfo->isStr("mempcpy"))
		return Builtin::BImempcpy;
else if (FnInfo->isStr("memmove"))		else if (FnInfo->isStr("memmove"))
return Builtin::BImemmove;		return Builtin::BImemmove;
else if (FnInfo->isStr("memcmp"))		else if (FnInfo->isStr("memcmp"))
return Builtin::BImemcmp;		return Builtin::BImemcmp;
else if (FnInfo->isStr("bcmp"))		else if (FnInfo->isStr("bcmp"))
return Builtin::BIbcmp;		return Builtin::BIbcmp;
else if (FnInfo->isStr("strncpy"))		else if (FnInfo->isStr("strncpy"))
return Builtin::BIstrncpy;		return Builtin::BIstrncpy;
▲ Show 20 Lines • Show All 1,029 Lines • Show Last 20 Lines

clang/lib/CodeGen/CGBuiltin.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 2,494 Lines • ▼ Show 20 Lines	case Builtin::BI__builtin_bzero: {
Address Dest = EmitPointerWithAlignment(E->getArg(0));		Address Dest = EmitPointerWithAlignment(E->getArg(0));
Value *SizeVal = EmitScalarExpr(E->getArg(1));		Value *SizeVal = EmitScalarExpr(E->getArg(1));
EmitNonNullArgCheck(RValue::get(Dest.getPointer()), E->getArg(0)->getType(),		EmitNonNullArgCheck(RValue::get(Dest.getPointer()), E->getArg(0)->getType(),
E->getArg(0)->getExprLoc(), FD, 0);		E->getArg(0)->getExprLoc(), FD, 0);
Builder.CreateMemSet(Dest, Builder.getInt8(0), SizeVal, false);		Builder.CreateMemSet(Dest, Builder.getInt8(0), SizeVal, false);
return RValue::get(nullptr);		return RValue::get(nullptr);
}		}
case Builtin::BImemcpy:		case Builtin::BImemcpy:
case Builtin::BI__builtin_memcpy: {		case Builtin::BI__builtin_memcpy:
		case Builtin::BImempcpy:
		case Builtin::BI__builtin_mempcpy: {
Address Dest = EmitPointerWithAlignment(E->getArg(0));		Address Dest = EmitPointerWithAlignment(E->getArg(0));
Address Src = EmitPointerWithAlignment(E->getArg(1));		Address Src = EmitPointerWithAlignment(E->getArg(1));
Value *SizeVal = EmitScalarExpr(E->getArg(2));		Value *SizeVal = EmitScalarExpr(E->getArg(2));
EmitNonNullArgCheck(RValue::get(Dest.getPointer()), E->getArg(0)->getType(),		EmitNonNullArgCheck(RValue::get(Dest.getPointer()), E->getArg(0)->getType(),
E->getArg(0)->getExprLoc(), FD, 0);		E->getArg(0)->getExprLoc(), FD, 0);
EmitNonNullArgCheck(RValue::get(Src.getPointer()), E->getArg(1)->getType(),		EmitNonNullArgCheck(RValue::get(Src.getPointer()), E->getArg(1)->getType(),
E->getArg(1)->getExprLoc(), FD, 1);		E->getArg(1)->getExprLoc(), FD, 1);
Builder.CreateMemCpy(Dest, Src, SizeVal, false);		Builder.CreateMemCpy(Dest, Src, SizeVal, false);
		if (BuiltinID == Builtin::BImempcpy ||
		BuiltinID == Builtin::BI__builtin_mempcpy)
		return RValue::get(Builder.CreateInBoundsGEP(Dest.getPointer(), SizeVal));
		else
return RValue::get(Dest.getPointer());		return RValue::get(Dest.getPointer());
		JimUnsubmitted Done Reply Inline Actions Is it an error here? It should be: if (BuiltinID == Builtin::BImempcpy \|\| BuiltinID == Builtin::BI__builtin_mempcpy) return RValue::get(Builder.CreateGEP(Dest.getPointer(), SizeVal)); else return RValue::get(Dest.getPointer()); Jim: Is it an error here? It should be: ``` if (BuiltinID == Builtin::BImempcpy \|\| BuiltinID…
}		}

case Builtin::BI__builtin_char_memchr:		case Builtin::BI__builtin_char_memchr:
BuiltinID = Builtin::BI__builtin_memchr;		BuiltinID = Builtin::BI__builtin_memchr;
break;		break;

case Builtin::BI__builtin___memcpy_chk: {		case Builtin::BI__builtin___memcpy_chk: {
// fold __builtin_memcpy_chk(x, y, cst1, cst2) to memcpy iff cst1<=cst2.		// fold __builtin_memcpy_chk(x, y, cst1, cst2) to memcpy iff cst1<=cst2.
▲ Show 20 Lines • Show All 12,304 Lines • Show Last 20 Lines

clang/lib/Sema/SemaChecking.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 334 Lines • ▼ Show 20 Lines	void Sema::checkFortifiedBuiltinMemoryFunction(FunctionDecl *FD,
case Builtin::BI__builtin___memcpy_chk:		case Builtin::BI__builtin___memcpy_chk:
case Builtin::BI__builtin___memmove_chk:		case Builtin::BI__builtin___memmove_chk:
case Builtin::BI__builtin___memset_chk:		case Builtin::BI__builtin___memset_chk:
case Builtin::BI__builtin___strlcat_chk:		case Builtin::BI__builtin___strlcat_chk:
case Builtin::BI__builtin___strlcpy_chk:		case Builtin::BI__builtin___strlcpy_chk:
case Builtin::BI__builtin___strncat_chk:		case Builtin::BI__builtin___strncat_chk:
case Builtin::BI__builtin___strncpy_chk:		case Builtin::BI__builtin___strncpy_chk:
case Builtin::BI__builtin___stpncpy_chk:		case Builtin::BI__builtin___stpncpy_chk:
case Builtin::BI__builtin___memccpy_chk: {		case Builtin::BI__builtin___memccpy_chk:
		case Builtin::BI__builtin___mempcpy_chk: {
DiagID = diag::warn_builtin_chk_overflow;		DiagID = diag::warn_builtin_chk_overflow;
IsChkVariant = true;		IsChkVariant = true;
SizeIndex = TheCall->getNumArgs() - 2;		SizeIndex = TheCall->getNumArgs() - 2;
ObjectIndex = TheCall->getNumArgs() - 1;		ObjectIndex = TheCall->getNumArgs() - 1;
break;		break;
}		}

case Builtin::BI__builtin___snprintf_chk:		case Builtin::BI__builtin___snprintf_chk:
Show All 22 Lines	case Builtin::BI__builtin_stpncpy: {
break;		break;
}		}

case Builtin::BImemcpy:		case Builtin::BImemcpy:
case Builtin::BI__builtin_memcpy:		case Builtin::BI__builtin_memcpy:
case Builtin::BImemmove:		case Builtin::BImemmove:
case Builtin::BI__builtin_memmove:		case Builtin::BI__builtin_memmove:
case Builtin::BImemset:		case Builtin::BImemset:
case Builtin::BI__builtin_memset: {		case Builtin::BI__builtin_memset:
		case Builtin::BImempcpy:
		case Builtin::BI__builtin_mempcpy: {
DiagID = diag::warn_fortify_source_overflow;		DiagID = diag::warn_fortify_source_overflow;
SizeIndex = TheCall->getNumArgs() - 1;		SizeIndex = TheCall->getNumArgs() - 1;
ObjectIndex = 0;		ObjectIndex = 0;
break;		break;
}		}
case Builtin::BIsnprintf:		case Builtin::BIsnprintf:
case Builtin::BI__builtin_snprintf:		case Builtin::BI__builtin_snprintf:
case Builtin::BIvsnprintf:		case Builtin::BIvsnprintf:
▲ Show 20 Lines • Show All 14,567 Lines • Show Last 20 Lines

clang/test/Analysis/bstring.c

Show First 20 Lines • Show All 216 Lines • ▼ Show 20 Lines	void mempcpy1 () {
mempcpy(dst, src, 5); // expected-warning{{Memory copy function accesses out-of-bound array element}}		mempcpy(dst, src, 5); // expected-warning{{Memory copy function accesses out-of-bound array element}}
}		}

void mempcpy2 () {		void mempcpy2 () {
char src[] = {1, 2, 3, 4};		char src[] = {1, 2, 3, 4};
char dst[1];		char dst[1];

mempcpy(dst, src, 4); // expected-warning{{Memory copy function overflows destination buffer}}		mempcpy(dst, src, 4); // expected-warning{{Memory copy function overflows destination buffer}}
		#ifndef VARIANT
		// expected-warning@-2{{'mempcpy' will always overflow; destination buffer has size 1, but size argument is 4}}
		#endif
}		}

void mempcpy3 () {		void mempcpy3 () {
char src[] = {1, 2, 3, 4};		char src[] = {1, 2, 3, 4};
char dst[3];		char dst[3];

mempcpy(dst+1, src+2, 2); // no-warning		mempcpy(dst+1, src+2, 2); // no-warning
}		}

void mempcpy4 () {		void mempcpy4 () {
char src[] = {1, 2, 3, 4};		char src[] = {1, 2, 3, 4};
char dst[10];		char dst[10];

mempcpy(dst+2, src+2, 3); // expected-warning{{Memory copy function accesses out-of-bound array element}}		mempcpy(dst+2, src+2, 3); // expected-warning{{Memory copy function accesses out-of-bound array element}}
}		}

void mempcpy5() {		void mempcpy5() {
char src[] = {1, 2, 3, 4};		char src[] = {1, 2, 3, 4};
char dst[3];		char dst[3];

mempcpy(dst+2, src+2, 2); // expected-warning{{Memory copy function overflows destination buffer}}		mempcpy(dst+2, src+2, 2); // expected-warning{{Memory copy function overflows destination buffer}}
		#ifndef VARIANT
		// expected-warning@-2{{'mempcpy' will always overflow; destination buffer has size 1, but size argument is 2}}
		#endif
}		}

void mempcpy6() {		void mempcpy6() {
int a[4] = {0};		int a[4] = {0};
mempcpy(a, a, 8); // expected-warning{{overlapping}}		mempcpy(a, a, 8); // expected-warning{{overlapping}}
}		}

void mempcpy7() {		void mempcpy7() {
▲ Show 20 Lines • Show All 269 Lines • Show Last 20 Lines

clang/test/CodeGen/mempcpy-libcall.c

This file was added.

				// RUN: %clang_cc1 -emit-llvm < %s| FileCheck %s

				typedef __SIZE_TYPE__ size_t;

				void *mempcpy(void *, void const *, size_t);

				char *test(char *d, char *s, size_t n) {
				// CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}} %[[REG1:[^ ]+]], i8* {{.*}} %1, i64 %[[REG2:[^ ]+]], i1 false)
				// CHECK-NEXT: %[[REGr:[^ ]+]] = getelementptr inbounds i8, i8* %[[REG1]], i64 %[[REG2]]
				// CHECK-NEXT: ret i8* %[[REGr]]
				return mempcpy(d, s, n);
				}

This is an archive of the discontinued LLVM Phabricator instance.

Improve support of GNU mempcpyClosedPublic

Details

Diff Detail

Event Timeline