This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
lib/Headers/
-
Headers/
-
altivec.h
-
test/CodeGen/
-
CodeGen/
1/1
builtins-ppc-p9vector.c

Differential D28528

[PowerPC] Fix the wrong implementation of builtin vec_rlnm.
ClosedPublic

Authored by jtony on Jan 10 2017, 12:12 PM.

Download Raw Diff

Details

Reviewers

lei
syzaara
kbarton
sfertile
nemanjai

Summary

vec_rlnm was implemented according to the old ABI, which was wrong. The ABI team has fixed the issue (although the fix has not been published yet). We need to re-implement these builtins according to the new ABI.

From (old implementation):
__builtin_altivec_vrlwnm(a, b) & c;

To (new implementation):
vector unsigned int OneByte = { 0x8, 0x8, 0x8, 0x8 };
__builtin_altivec_vrlwnm(a, ((c << OneByte) | b));

Diff Detail

Event Timeline

jtony updated this revision to Diff 83846.Jan 10 2017, 12:12 PM

jtony retitled this revision from to [PowerPC] [PowerPC] Fix the wrong implementation of builtin vec_rlnm..

jtony updated this object.

jtony added reviewers: nemanjai, kbarton, sfertile, lei, syzaara.

jtony added subscribers: llvm-commits, cfe-commits, hfinkel, echristo.

jtony retitled this revision from [PowerPC] [PowerPC] Fix the wrong implementation of builtin vec_rlnm. to [PowerPC] Fix the wrong implementation of builtin vec_rlnm..Jan 10 2017, 12:16 PM

Please fix the minor issue with the test case and then commit.
LGTM.

test/CodeGen/builtins-ppc-p9vector.c
871	Don't hard-code the names of intermediate results. I imagine this will fail even now on some build bot. Rather specify it as something like: `// CHECK-BE: %[[RES1:.+]] = shl <4 x i32` And feel free to use the saved result as the operand to the next instruction. Like: `// CHECK-BE: %[[RES2:.+]] = or <4 x i32> %[[RES1]]`

This revision is now accepted and ready to land.Jan 11 2017, 12:30 PM

jtony marked an inline comment as done.Jan 11 2017, 12:47 PM

jtony closed this revision.Jan 12 2017, 5:21 PM

Revision Contents

Path

Size

lib/

Headers/

altivec.h

6 lines

test/

CodeGen/

builtins-ppc-p9vector.c

12 lines

Diff 83846

lib/Headers/altivec.h

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 7,658 Lines • ▼ Show 20 Lines	vec_rlmi(vector unsigned long long __a, vector unsigned long long __b,
vector unsigned long long __c) {		vector unsigned long long __c) {
return __builtin_altivec_vrldmi(__a, __c, __b);		return __builtin_altivec_vrldmi(__a, __c, __b);
}		}

/* vec_rlnm */		/* vec_rlnm */
static __inline__ vector unsigned int __ATTRS_o_ai		static __inline__ vector unsigned int __ATTRS_o_ai
vec_rlnm(vector unsigned int __a, vector unsigned int __b,		vec_rlnm(vector unsigned int __a, vector unsigned int __b,
vector unsigned int __c) {		vector unsigned int __c) {
return __builtin_altivec_vrlwnm(__a, __b) & __c;		vector unsigned int OneByte = { 0x8, 0x8, 0x8, 0x8 };
		return __builtin_altivec_vrlwnm(__a, ((__c << OneByte) | __b));
}		}

static __inline__ vector unsigned long long __ATTRS_o_ai		static __inline__ vector unsigned long long __ATTRS_o_ai
vec_rlnm(vector unsigned long long __a, vector unsigned long long __b,		vec_rlnm(vector unsigned long long __a, vector unsigned long long __b,
vector unsigned long long __c) {		vector unsigned long long __c) {
return __builtin_altivec_vrldnm(__a, __b) & __c;		vector unsigned long long OneByte = { 0x8, 0x8 };
		return __builtin_altivec_vrldnm(__a, ((__c << OneByte) | __b));
}		}
#endif		#endif

/* vec_vrlb */		/* vec_vrlb */

static __inline__ vector signed char __ATTRS_o_ai		static __inline__ vector signed char __ATTRS_o_ai
vec_vrlb(vector signed char __a, vector unsigned char __b) {		vec_vrlb(vector signed char __a, vector unsigned char __b) {
return (vector signed char)__builtin_altivec_vrlb((vector char)__a, __b);		return (vector signed char)__builtin_altivec_vrlb((vector char)__a, __b);
▲ Show 20 Lines • Show All 9,050 Lines • Show Last 20 Lines

test/CodeGen/builtins-ppc-p9vector.c

	Show First 20 Lines • Show All 862 Lines • ▼ Show 20 Lines
	vector unsigned long long test76(void) {			vector unsigned long long test76(void) {
	// CHECK-BE: @llvm.ppc.altivec.vrldmi(<2 x i64			// CHECK-BE: @llvm.ppc.altivec.vrldmi(<2 x i64
	// CHECK-BE-NEXT: ret <2 x i64>			// CHECK-BE-NEXT: ret <2 x i64>
	// CHECK: @llvm.ppc.altivec.vrldmi(<2 x i64			// CHECK: @llvm.ppc.altivec.vrldmi(<2 x i64
	// CHECK-NEXT: ret <2 x i64>			// CHECK-NEXT: ret <2 x i64>
	return vec_rlmi(vula, vula, vula);			return vec_rlmi(vula, vula, vula);
	}			}
	vector unsigned int test77(void) {			vector unsigned int test77(void) {
				// CHECK-BE: %shl.i = shl <4 x i32
				nemanjaiUnsubmitted Done Reply Inline Actions Don't hard-code the names of intermediate results. I imagine this will fail even now on some build bot. Rather specify it as something like: `// CHECK-BE: %[[RES1:.+]] = shl <4 x i32` And feel free to use the saved result as the operand to the next instruction. Like: `// CHECK-BE: %[[RES2:.+]] = or <4 x i32> %[[RES1]]` nemanjai: Don't hard-code the names of intermediate results. I imagine this will fail even now on some…
				// CHECK-BE: %or.i = or <4 x i32> %shl.i
	// CHECK-BE: @llvm.ppc.altivec.vrlwnm(<4 x i32			// CHECK-BE: @llvm.ppc.altivec.vrlwnm(<4 x i32
	// CHECK-BE: and <4 x i32
	// CHECK-BE: ret <4 x i32>			// CHECK-BE: ret <4 x i32>
				// CHECK: %shl.i = shl <4 x i32
				// CHECK: %or.i = or <4 x i32> %shl.i
	// CHECK: @llvm.ppc.altivec.vrlwnm(<4 x i32			// CHECK: @llvm.ppc.altivec.vrlwnm(<4 x i32
	// CHECK: and <4 x i32
	// CHECK: ret <4 x i32>			// CHECK: ret <4 x i32>
	return vec_rlnm(vuia, vuia, vuia);			return vec_rlnm(vuia, vuia, vuia);
	}			}
	vector unsigned long long test78(void) {			vector unsigned long long test78(void) {
				// CHECK-BE: %shl.i = shl <2 x i64
				// CHECK-BE: %or.i = or <2 x i64> %shl.i
	// CHECK-BE: @llvm.ppc.altivec.vrldnm(<2 x i64			// CHECK-BE: @llvm.ppc.altivec.vrldnm(<2 x i64
	// CHECK-BE: and <2 x i64
	// CHECK-BE-NEXT: ret <2 x i64>			// CHECK-BE-NEXT: ret <2 x i64>
				// CHECK: %shl.i = shl <2 x i64
				// CHECK: %or.i = or <2 x i64> %shl.i
	// CHECK: @llvm.ppc.altivec.vrldnm(<2 x i64			// CHECK: @llvm.ppc.altivec.vrldnm(<2 x i64
	// CHECK: and <2 x i64
	// CHECK-NEXT: ret <2 x i64>			// CHECK-NEXT: ret <2 x i64>
	return vec_rlnm(vula, vula, vula);			return vec_rlnm(vula, vula, vula);
	}			}
	vector double test79(void) {			vector double test79(void) {
	// CHECK-BE: extractelement <4 x float>			// CHECK-BE: extractelement <4 x float>
	// CHECK-BE: fpext float			// CHECK-BE: fpext float
	// CHECK-BE: insertelement <2 x double>			// CHECK-BE: insertelement <2 x double>
	// CHECK-BE: extractelement <4 x float>			// CHECK-BE: extractelement <4 x float>
	▲ Show 20 Lines • Show All 325 Lines • Show Last 20 Lines