This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
include/clang/Basic/
-
clang/
-
Basic/
-
BuiltinsPPC.def
-
DiagnosticCommonKinds.td
-
lib/
-
Basic/
2/5
Targets.cpp
-
Headers/
1/7
altivec.h
-
test/CodeGen/
-
CodeGen/
-
builtins-ppc-altivec.c
2
builtins-ppc-p8vector.c
-
builtins-ppc-vsx.c

Differential D10972

Add missing builtins to altivec.h for ABI compliance (vol. 3)
ClosedPublic

Authored by nemanjai on Jul 6 2015, 1:55 PM.

Download Raw Diff

Details

Reviewers

wschmidt
echristo
kbarton
seurer
hfinkel

Summary

This patch introduces a number of new vector interfaces to altivec.h.
In doing so, it touches on a number of issues that existed in existing
implementations as well as with how features are treated in the front end.
As a result, this patch accomplishes a few somewhat distinct but related
goals. Namely:

Fixes how features and the related predefined macros are handled. Namely,
because -mvsx is implied by -mpower8-vector and by -mdirect-move, if we are on
a CPU that has those by default and we specify -mno-vsx, it turned off VSX in
the back end, but still left it on in the front end (most notably, the
predefined macro was still on).

Added a number of new interfaces listed in the ABI
Added a VSX path to one of the existing interfaces (vec_round)
Changed the signatures of some existing functions to match the ABI
Fixed how right shifts are generated as the implementation did not match the ABI.

Changed signatures to conform to ABI:
vector short vec_perm(vector signed short, vector signed short, vector unsigned char)
vector int vec_perm(vector signed int, vector signed int, vector unsigned char)
vector long long vec_perm(vector signed long long, vector signed long long, vector unsigned char)
vector signed char vec_sld(vector signed char, vector signed char, const int)
vector unsigned char vec_sld(vector unsigned char, vector unsigned char, const int)
vector bool char vec_sld(vector bool char, vector bool char, const int)
vector unsigned short vec_sld(vector unsigned short, vector unsigned short, const int)
vector signed short vec_sld(vector signed short, vector signed short, const int)
vector signed int vec_sld(vector signed int, vector signed int, const int)
vector unsigned int vec_sld(vector unsigned int, vector unsigned int, const int)
vector float vec_sld(vector float, vector float, const int)
vector signed char vec_splat(vector signed char, const int)
vector unsigned char vec_splat(vector unsigned char, const int)
vector bool char vec_splat(vector bool char, const int)
vector signed short vec_splat(vector signed short, const int)
vector unsigned short vec_splat(vector unsigned short, const int)
vector bool short vec_splat(vector bool short, const int)
vector pixel vec_splat(vector pixel, const int)
vector signed int vec_splat(vector signed int, const int)
vector unsigned int vec_splat(vector unsigned int, const int)
vector bool int vec_splat(vector bool int, const int)
vector float vec_splat(vector float, const int)

Added a VSX path to:
vector float vec_round(vector float)

Added interfaces:
vector signed char vec_eqv(vector signed char, vector signed char)
vector signed char vec_eqv(vector bool char, vector signed char)
vector signed char vec_eqv(vector signed char, vector bool char)
vector unsigned char vec_eqv(vector unsigned char, vector unsigned char)
vector unsigned char vec_eqv(vector bool char, vector unsigned char)
vector unsigned char vec_eqv(vector unsigned char, vector bool char)
vector signed short vec_eqv(vector signed short, vector signed short)
vector signed short vec_eqv(vector bool short, vector signed short)
vector signed short vec_eqv(vector signed short, vector bool short)
vector unsigned short vec_eqv(vector unsigned short, vector unsigned short)
vector unsigned short vec_eqv(vector bool short, vector unsigned short)
vector unsigned short vec_eqv(vector unsigned short, vector bool short)
vector signed int vec_eqv(vector signed int, vector signed int)
vector signed int vec_eqv(vector bool int, vector signed int)
vector signed int vec_eqv(vector signed int, vector bool int)
vector unsigned int vec_eqv(vector unsigned int, vector unsigned int)
vector unsigned int vec_eqv(vector bool int, vector unsigned int)
vector unsigned int vec_eqv(vector unsigned int, vector bool int)
vector signed long long vec_eqv(vector signed long long, vector signed long long)
vector signed long long vec_eqv(vector bool long long, vector signed long long)
vector signed long long vec_eqv(vector signed long long, vector bool long long)
vector unsigned long long vec_eqv(vector unsigned long long, vector unsigned long long)
vector unsigned long long vec_eqv(vector bool long long, vector unsigned long long)
vector unsigned long long vec_eqv(vector unsigned long long, vector bool long long)
vector float vec_eqv(vector float, vector float)
vector float vec_eqv(vector bool int, vector float)
vector float vec_eqv(vector float, vector bool int)
vector double vec_eqv(vector double, vector double)
vector double vec_eqv(vector bool long long, vector double)
vector double vec_eqv(vector double, vector bool long long)
vector bool long long vec_perm(vector bool long long, vector bool long long, vector unsigned char)
vector double vec_round(vector double)
vector double vec_splat(vector double, const int)
vector bool long long vec_splat(vector bool long long, const int)
vector signed long long vec_splat(vector signed long long, const int)
vector unsigned long long vec_splat(vector unsigned long long, const int)
vector bool int vec_sld(vector bool int, vector bool int, const int)
vector bool short vec_sld(vector bool short, vector bool short, const int)

Diff Detail

Repository: rL LLVM

Event Timeline

nemanjai updated this revision to Diff 29123.Jul 6 2015, 1:55 PM

nemanjai retitled this revision from to Add missing builtins to altivec.h for ABI compliance (vol. 3).

nemanjai updated this object.

nemanjai added reviewers: wschmidt, kbarton, hfinkel, echristo, seurer.

nemanjai set the repository for this revision to rL LLVM.

nemanjai added a subscriber: llvm-commits.

nemanjai added a subscriber: cfe-commits.Jul 6 2015, 2:00 PM

nemanjai added inline comments.Jul 6 2015, 2:03 PM

lib/Basic/Targets.cpp
1026	Oops, there was supposed to be a continue here. Added to the source tree.

Hi Nemanja,

Looks pretty good. I have a few comments to be dealt with before I can sign off. Thanks!

lib/Basic/Targets.cpp
1017	This way of handling the various -m arguments positionally is not quite right. If both -mvsx and -mno-vsx are present in the command line, the last one seen wins. That means that if the user specifies -mno-vsx -mpower8-vector -mvsx we should turn on both the VSX and the P8Vector features. The logic you are using will only turn on the VSX feature because the specification of -mpower8-vector happened to be in between -mno-vsx and -mvsx. Also, it is an error to specify -mpower8-vector or -mdirect-move if -mno-vsx is the switch value that wins due to occurring last. So I suggest that you track each feature separately during this loop, obtaining individual values for HasVSX, HasP8Vector, and HasDirectMove. Following the loop, if !HasVSX && (HasP8Vector || HasDirectMove), report an error and fail the compilation.
lib/Headers/altivec.h
6686–6687	Missing the & 0x0F here.
7013	Seems like too much casting above. It's ok to just use the original code here (and make "vector long long" into "vector unsigned long long"). The instruction will mask off all but the rightmost 6 bits of each element of b, so the signedness doesn't matter.
test/CodeGen/builtins-ppc-p8vector.c
1010	This will probably change back per my earlier comment.

nemanjai marked 3 inline comments as done.Jul 9 2015, 6:27 AM

nemanjai added inline comments.

lib/Basic/Targets.cpp
1017	Thank you for this comment. I think I know what we need to do and how (this matches the gcc behaviour): (1) all three are set by default for ppc64le/pwr8; (2) -mno-vsx disables all three defaults; (3) if an -mno-vsx wins (appears after any -mvsx) and the user explicitly specifies one of the other two, a diagnostic is emitted.
lib/Headers/altivec.h
6686–6687	Great catch, thank you.
7013	I am not sure if you are referring only to the vector long long overload of vec_sr or to all of them. In any case, the reason for the casts is that Clang will produce an `lshr` when the LHS is unsigned and an `ashr` when the LHS is signed. This is what was causing LLVM to emit `vsr[bhwd]` for the unsigned ones and `vsra[bhwd]` for the signed ones. So the casts are simply to ensure that the IR contains the `lshr` instructions rather than `ashr/lshr` depending on signedness. Of course, I could have just defined builtins and called the same one for both signed and unsigned overloads, but I assumed that since IR instructions exist for this, it is better to retain the information about what operation is actually being performed in case the optimizer can use it.
test/CodeGen/builtins-ppc-p8vector.c
1010	If we indeed want logical shifts for vec_sr, then this should not change back.

wschmidt added inline comments.Jul 9 2015, 6:39 AM

lib/Basic/Targets.cpp
1017	Agreed, that is more complete than what I wrote.
lib/Headers/altivec.h
7013	You have wrongly changed the instruction to be generated. The user has chosen vec_sr, which means the user wants vsr[bhwd]. If they wanted vsra[bhwd], they could have chosen vec_sra. See figures 4-120 and 4-121 of http://www.freescale.com/files/32bit/doc/ref_manual/ALTIVECPIM.pdf to see the required instruction mappings.

wschmidt added inline comments.Jul 9 2015, 6:40 AM

lib/Headers/altivec.h
7013	Note that in this case we are adding code for the vector long long operands, which is not described in the PIM. But we should be consistent with existing behavior for the other types.

Addressed the comments as follows:

Added the missing mask
Added handling for dependent feature options
No change to the vec_sr implementations, waiting for more clarification

What clarification are you waiting for?

wschmidt added inline comments.Jul 9 2015, 12:22 PM

lib/Headers/altivec.h
7013	OK, I take it back, I misread the code. We were already generating the wrong instruction here. Carry on... ;)

LGTM with additional commentary to explain what's going on. :) Thanks.

lib/Basic/Targets.cpp
1341	After chatting with you on IRC, the above logic is correct but it is still pretty hard to understand. Please add a few more comments to explain the various scenarios.

This revision is now accepted and ready to land.Jul 9 2015, 12:42 PM

I would also like to see a test case or two for the confusing -mno-vsx -mpower8-vector stuff...

nemanjai mentioned this in D10973: Add missing builtins to the PPC back end for ABI compliance (vol. 3).Jul 10 2015, 12:26 AM

Committed revision 241904.

Revision Contents

Path

Size

include/

clang/

Basic/

BuiltinsPPC.def

2 lines

DiagnosticCommonKinds.td

2 lines

lib/

Basic/

Targets.cpp

44 lines

Headers/

altivec.h

495 lines

test/

CodeGen/

builtins-ppc-altivec.c

14 lines

builtins-ppc-p8vector.c

338 lines

builtins-ppc-vsx.c

233 lines

Diff 29330

include/clang/Basic/BuiltinsPPC.def

	Show First 20 Lines • Show All 306 Lines • ▼ Show 20 Lines
	BUILTIN(__builtin_vsx_xvnmsubasp, "V4fV4fV4fV4f", "")			BUILTIN(__builtin_vsx_xvnmsubasp, "V4fV4fV4fV4f", "")

	BUILTIN(__builtin_vsx_xvrsqrtedp, "V2dV2d", "")			BUILTIN(__builtin_vsx_xvrsqrtedp, "V2dV2d", "")
	BUILTIN(__builtin_vsx_xvrsqrtesp, "V4fV4f", "")			BUILTIN(__builtin_vsx_xvrsqrtesp, "V4fV4f", "")

	BUILTIN(__builtin_vsx_xvsqrtdp, "V2dV2d", "")			BUILTIN(__builtin_vsx_xvsqrtdp, "V2dV2d", "")
	BUILTIN(__builtin_vsx_xvsqrtsp, "V4fV4f", "")			BUILTIN(__builtin_vsx_xvsqrtsp, "V4fV4f", "")

				BUILTIN(__builtin_vsx_xxleqv, "V4UiV4UiV4Ui", "")

	// HTM builtins			// HTM builtins
	BUILTIN(__builtin_tbegin, "UiUIi", "")			BUILTIN(__builtin_tbegin, "UiUIi", "")
	BUILTIN(__builtin_tend, "UiUIi", "")			BUILTIN(__builtin_tend, "UiUIi", "")

	BUILTIN(__builtin_tabort, "UiUi", "")			BUILTIN(__builtin_tabort, "UiUi", "")
	BUILTIN(__builtin_tabortdc, "UiUiUiUi", "")			BUILTIN(__builtin_tabortdc, "UiUiUiUi", "")
	BUILTIN(__builtin_tabortdci, "UiUiUii", "")			BUILTIN(__builtin_tabortdci, "UiUiUii", "")
	BUILTIN(__builtin_tabortwc, "UiUiUiUi", "")			BUILTIN(__builtin_tabortwc, "UiUiUiUi", "")
	Show All 33 Lines

include/clang/Basic/DiagnosticCommonKinds.td

Show First 20 Lines • Show All 173 Lines • ▼ Show 20 Lines	def err_target_unknown_triple : Error<
"unknown target triple '%0', please use -triple or -arch">;		"unknown target triple '%0', please use -triple or -arch">;
def err_target_unknown_cpu : Error<"unknown target CPU '%0'">;		def err_target_unknown_cpu : Error<"unknown target CPU '%0'">;
def err_target_unknown_abi : Error<"unknown target ABI '%0'">;		def err_target_unknown_abi : Error<"unknown target ABI '%0'">;
def err_target_unknown_fpmath : Error<"unknown FP unit '%0'">;		def err_target_unknown_fpmath : Error<"unknown FP unit '%0'">;
def err_target_unsupported_fpmath : Error<		def err_target_unsupported_fpmath : Error<
"the '%0' unit is not supported with this instruction set">;		"the '%0' unit is not supported with this instruction set">;
def err_target_unsupported_unaligned : Error<		def err_target_unsupported_unaligned : Error<
"the %0 sub-architecture does not support unaligned accesses">;		"the %0 sub-architecture does not support unaligned accesses">;
		def err_opt_not_valid_with_opt : Error<
		"option '%0' cannot be specified with '%1'">;

// Source manager		// Source manager
def err_cannot_open_file : Error<"cannot open file '%0': %1">, DefaultFatal;		def err_cannot_open_file : Error<"cannot open file '%0': %1">, DefaultFatal;
def err_file_modified : Error<		def err_file_modified : Error<
"file '%0' modified since it was first processed">, DefaultFatal;		"file '%0' modified since it was first processed">, DefaultFatal;
def err_unsupported_bom : Error<"%0 byte order mark detected in '%1', but "		def err_unsupported_bom : Error<"%0 byte order mark detected in '%1', but "
"encoding is not supported">, DefaultFatal;		"encoding is not supported">, DefaultFatal;
def err_unable_to_rename_temp : Error<		def err_unable_to_rename_temp : Error<
Show All 18 Lines

lib/Basic/Targets.cpp

Show First 20 Lines • Show All 857 Lines • ▼ Show 20 Lines	public:
void getTargetDefines(const LangOptions &Opts,		void getTargetDefines(const LangOptions &Opts,
MacroBuilder &Builder) const override;		MacroBuilder &Builder) const override;

void getDefaultFeatures(llvm::StringMap<bool> &Features) const override;		void getDefaultFeatures(llvm::StringMap<bool> &Features) const override;

bool handleTargetFeatures(std::vector<std::string> &Features,		bool handleTargetFeatures(std::vector<std::string> &Features,
DiagnosticsEngine &Diags) override;		DiagnosticsEngine &Diags) override;
bool hasFeature(StringRef Feature) const override;		bool hasFeature(StringRef Feature) const override;
		void setFeatureEnabled(llvm::StringMap<bool> &Features, StringRef Name,
		bool Enabled) const override;

void getGCCRegNames(const char * const *&Names,		void getGCCRegNames(const char * const *&Names,
unsigned &NumNames) const override;		unsigned &NumNames) const override;
void getGCCRegAliases(const GCCRegAlias *&Aliases,		void getGCCRegAliases(const GCCRegAlias *&Aliases,
unsigned &NumAliases) const override;		unsigned &NumAliases) const override;
bool validateAsmConstraint(const char *&Name,		bool validateAsmConstraint(const char *&Name,
TargetInfo::ConstraintInfo &Info) const override {		TargetInfo::ConstraintInfo &Info) const override {
switch (*Name) {		switch (*Name) {
▲ Show 20 Lines • Show All 133 Lines • ▼ Show 20 Lines	#define LIBBUILTIN(ID, TYPE, ATTRS, HEADER) { #ID, TYPE, ATTRS, HEADER,\
ALL_LANGUAGES },		ALL_LANGUAGES },
#include "clang/Basic/BuiltinsPPC.def"		#include "clang/Basic/BuiltinsPPC.def"
};		};

/// handleTargetFeatures - Perform initialization based on the user		/// handleTargetFeatures - Perform initialization based on the user
/// configured set of features.		/// configured set of features.
bool PPCTargetInfo::handleTargetFeatures(std::vector<std::string> &Features,		bool PPCTargetInfo::handleTargetFeatures(std::vector<std::string> &Features,
DiagnosticsEngine &Diags) {		DiagnosticsEngine &Diags) {
for (unsigned i = 0, e = Features.size(); i !=e; ++i) {		for (unsigned i = 0, e = Features.size(); i !=e; ++i) {
		wschmidtUnsubmitted Done Reply Inline Actions This way of handling the various -m arguments positionally is not quite right. If both -mvsx and -mno-vsx are present in the command line, the last one seen wins. That means that if the user specifies -mno-vsx -mpower8-vector -mvsx we should turn on both the VSX and the P8Vector features. The logic you are using will only turn on the VSX feature because the specification of -mpower8-vector happened to be in between -mno-vsx and -mvsx. Also, it is an error to specify -mpower8-vector or -mdirect-move if -mno-vsx is the switch value that wins due to occurring last. So I suggest that you track each feature separately during this loop, obtaining individual values for HasVSX, HasP8Vector, and HasDirectMove. Following the loop, if !HasVSX && (HasP8Vector || HasDirectMove), report an error and fail the compilation. wschmidt: This way of handling the various -m arguments positionally is not quite right. If both -mvsx…
		nemanjaiAuthorUnsubmitted Not Done Reply Inline Actions Thank you for this comment. I think I know what and how we need to do (this matches the gcc behaviour): all three are set by default for ppc64le/pwr8 -mno-vsx disables all three defaults if an -mno-vsx wins (appears after any -mvsx) and the user explicitly specifies one of the other two, a diagnostic is emitted nemanjai: Thank you for this comment. I think I know what and how we need to do (this matches the gcc…
		wschmidtUnsubmitted Not Done Reply Inline Actions Agreed, that is more complete than what I wrote. wschmidt: Agreed, that is more complete than what I wrote.
// Ignore disabled features.		// Ignore disabled features.
if (Features[i][0] == '-')		if (Features[i][0] == '-')
continue;		continue;

StringRef Feature = StringRef(Features[i]).substr(1);		StringRef Feature = StringRef(Features[i]).substr(1);

if (Feature == "vsx") {		if (Feature == "vsx") {
HasVSX = true;		HasVSX = true;
continue;		continue;
		nemanjaiAuthorUnsubmitted Done Reply Inline Actions Oops, there was supposed to be a continue here. Added to the source tree. nemanjai: Oops, there was supposed to be a continue here. Added to the source tree.
}		}

if (Feature == "bpermd") {		if (Feature == "bpermd") {
HasBPERMD = true;		HasBPERMD = true;
continue;		continue;
}		}

if (Feature == "extdiv") {		if (Feature == "extdiv") {
HasExtDiv = true;		HasExtDiv = true;
continue;		continue;
}		}

if (Feature == "power8-vector") {		if (Feature == "power8-vector") {
HasP8Vector = true;		HasP8Vector = true;
HasVSX = true;
continue;		continue;
}		}

if (Feature == "crypto") {		if (Feature == "crypto") {
HasP8Crypto = true;		HasP8Crypto = true;
continue;		continue;
}		}

if (Feature == "direct-move") {		if (Feature == "direct-move") {
HasDirectMove = true;		HasDirectMove = true;
HasVSX = true;
continue;		continue;
}		}

if (Feature == "qpx") {		if (Feature == "qpx") {
HasQPX = true;		HasQPX = true;
continue;		continue;
}		}

if (Feature == "htm") {		if (Feature == "htm") {
HasHTM = true;		HasHTM = true;
continue;		continue;
}		}

// TODO: Finish this list and add an assert that we've handled them		// TODO: Finish this list and add an assert that we've handled them
// all.		// all.
}		}
		if (!HasVSX && (HasP8Vector || HasDirectMove)) {
		if (HasP8Vector)
		Diags.Report(diag::err_opt_not_valid_with_opt) << "-mpower8-vector" <<
		"-mno-vsx";
		else if (HasDirectMove)
		Diags.Report(diag::err_opt_not_valid_with_opt) << "-mdirect-move" <<
		"-mno-vsx";
		return false;
		}

return true;		return true;
}		}

/// PPCTargetInfo::getTargetDefines - Return a set of the PowerPC-specific		/// PPCTargetInfo::getTargetDefines - Return a set of the PowerPC-specific
/// #defines that are not tied to a specific subtarget.		/// #defines that are not tied to a specific subtarget.
void PPCTargetInfo::getTargetDefines(const LangOptions &Opts,		void PPCTargetInfo::getTargetDefines(const LangOptions &Opts,
MacroBuilder &Builder) const {		MacroBuilder &Builder) const {
▲ Show 20 Lines • Show All 205 Lines • ▼ Show 20 Lines	Features["extdiv"] = llvm::StringSwitch<bool>(CPU)
.Case("ppc64le", true)		.Case("ppc64le", true)
.Case("pwr8", true)		.Case("pwr8", true)
.Case("pwr7", true)		.Case("pwr7", true)
.Default(false);		.Default(false);
Features["direct-move"] = llvm::StringSwitch<bool>(CPU)		Features["direct-move"] = llvm::StringSwitch<bool>(CPU)
.Case("ppc64le", true)		.Case("ppc64le", true)
.Case("pwr8", true)		.Case("pwr8", true)
.Default(false);		.Default(false);
		Features["vsx"] = llvm::StringSwitch<bool>(CPU)
		.Case("ppc64le", true)
		.Case("pwr8", true)
		.Case("pwr7", true)
		.Default(false);
}		}

bool PPCTargetInfo::hasFeature(StringRef Feature) const {		bool PPCTargetInfo::hasFeature(StringRef Feature) const {
return llvm::StringSwitch<bool>(Feature)		return llvm::StringSwitch<bool>(Feature)
.Case("powerpc", true)		.Case("powerpc", true)
.Case("vsx", HasVSX)		.Case("vsx", HasVSX)
.Case("power8-vector", HasP8Vector)		.Case("power8-vector", HasP8Vector)
.Case("crypto", HasP8Crypto)		.Case("crypto", HasP8Crypto)
.Case("direct-move", HasDirectMove)		.Case("direct-move", HasDirectMove)
.Case("qpx", HasQPX)		.Case("qpx", HasQPX)
.Case("htm", HasHTM)		.Case("htm", HasHTM)
.Case("bpermd", HasBPERMD)		.Case("bpermd", HasBPERMD)
.Case("extdiv", HasExtDiv)		.Case("extdiv", HasExtDiv)
.Default(false);		.Default(false);
}		}

		void PPCTargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features,
		StringRef Name, bool Enabled) const {
		/* We do not call this while populating default features. So at this
		point, all the default features are in the Features map. This information
		is useful as we can diagnose requests to enable features for which
		dependent features are disabled. Driver already handles the "last-wins"
		semantics so we will only be called with the last of the on/off options.
		*/
		static llvm::StringMap<bool> ExplicitFeatures;
		ExplicitFeatures[Name] = Enabled;

		// At this point, -mno-vsx turns off the dependent features but we respect
		// the user's requests.
		if (!Enabled && Name == "vsx") {
		Features["direct-move"] = ExplicitFeatures["direct-move"];
		Features["power8-vector"] = ExplicitFeatures["power8-vector"];
		}
		if ((Enabled && Name == "power8-vector") ||
		(Enabled && Name == "direct-move")) {
		if (ExplicitFeatures.find("vsx") == ExplicitFeatures.end()) {
		Features["vsx"] = true;
		}
		}
		Features[Name] = Enabled;
		wschmidtUnsubmitted Not Done Reply Inline Actions After chatting with you on IRC, the above logic is correct but it is still pretty hard to understand. Please add a few more comments to explain the various scenarios. wschmidt: After chatting with you on IRC, the above logic is correct but it is still pretty hard to…
		}

const char * const PPCTargetInfo::GCCRegNames[] = {		const char * const PPCTargetInfo::GCCRegNames[] = {
"r0", "r1", "r2", "r3", "r4", "r5", "r6", "r7",		"r0", "r1", "r2", "r3", "r4", "r5", "r6", "r7",
"r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15",		"r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15",
"r16", "r17", "r18", "r19", "r20", "r21", "r22", "r23",		"r16", "r17", "r18", "r19", "r20", "r21", "r22", "r23",
"r24", "r25", "r26", "r27", "r28", "r29", "r30", "r31",		"r24", "r25", "r26", "r27", "r28", "r29", "r30", "r31",
"f0", "f1", "f2", "f3", "f4", "f5", "f6", "f7",		"f0", "f1", "f2", "f3", "f4", "f5", "f6", "f7",
"f8", "f9", "f10", "f11", "f12", "f13", "f14", "f15",		"f8", "f9", "f10", "f11", "f12", "f13", "f14", "f15",
"f16", "f17", "f18", "f19", "f20", "f21", "f22", "f23",		"f16", "f17", "f18", "f19", "f20", "f21", "f22", "f23",
▲ Show 20 Lines • Show All 6,068 Lines • Show Last 20 Lines

lib/Headers/altivec.h

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 42 Lines • ▼ Show 20 Lines
static vector unsigned char __ATTRS_o_ai vec_perm(vector unsigned char __a,		static vector unsigned char __ATTRS_o_ai vec_perm(vector unsigned char __a,
vector unsigned char __b,		vector unsigned char __b,
vector unsigned char __c);		vector unsigned char __c);

static vector bool char __ATTRS_o_ai vec_perm(vector bool char __a,		static vector bool char __ATTRS_o_ai vec_perm(vector bool char __a,
vector bool char __b,		vector bool char __b,
vector unsigned char __c);		vector unsigned char __c);

static vector short __ATTRS_o_ai vec_perm(vector short __a, vector short __b,		static vector short __ATTRS_o_ai vec_perm(vector signed short __a,
		vector signed short __b,
vector unsigned char __c);		vector unsigned char __c);

static vector unsigned short __ATTRS_o_ai vec_perm(vector unsigned short __a,		static vector unsigned short __ATTRS_o_ai vec_perm(vector unsigned short __a,
vector unsigned short __b,		vector unsigned short __b,
vector unsigned char __c);		vector unsigned char __c);

static vector bool short __ATTRS_o_ai vec_perm(vector bool short __a,		static vector bool short __ATTRS_o_ai vec_perm(vector bool short __a,
vector bool short __b,		vector bool short __b,
vector unsigned char __c);		vector unsigned char __c);

static vector pixel __ATTRS_o_ai vec_perm(vector pixel __a, vector pixel __b,		static vector pixel __ATTRS_o_ai vec_perm(vector pixel __a, vector pixel __b,
vector unsigned char __c);		vector unsigned char __c);

static vector int __ATTRS_o_ai vec_perm(vector int __a, vector int __b,		static vector int __ATTRS_o_ai vec_perm(vector signed int __a,
		vector signed int __b,
vector unsigned char __c);		vector unsigned char __c);

static vector unsigned int __ATTRS_o_ai vec_perm(vector unsigned int __a,		static vector unsigned int __ATTRS_o_ai vec_perm(vector unsigned int __a,
vector unsigned int __b,		vector unsigned int __b,
vector unsigned char __c);		vector unsigned char __c);

static vector bool int __ATTRS_o_ai vec_perm(vector bool int __a,		static vector bool int __ATTRS_o_ai vec_perm(vector bool int __a,
vector bool int __b,		vector bool int __b,
vector unsigned char __c);		vector unsigned char __c);

static vector float __ATTRS_o_ai vec_perm(vector float __a, vector float __b,		static vector float __ATTRS_o_ai vec_perm(vector float __a, vector float __b,
vector unsigned char __c);		vector unsigned char __c);

#ifdef __VSX__		#ifdef __VSX__
static vector long long __ATTRS_o_ai vec_perm(vector long long __a,		static vector long long __ATTRS_o_ai vec_perm(vector signed long long __a,
vector long long __b,		vector signed long long __b,
vector unsigned char __c);		vector unsigned char __c);

static vector unsigned long long __ATTRS_o_ai		static vector unsigned long long __ATTRS_o_ai
vec_perm(vector unsigned long long __a, vector unsigned long long __b,		vec_perm(vector unsigned long long __a, vector unsigned long long __b,
vector unsigned char __c);		vector unsigned char __c);

		static vector bool long long __ATTRS_o_ai
		vec_perm(vector bool long long __a, vector bool long long __b,
		vector unsigned char __c);

static vector double __ATTRS_o_ai vec_perm(vector double __a, vector double __b,		static vector double __ATTRS_o_ai vec_perm(vector double __a, vector double __b,
vector unsigned char __c);		vector unsigned char __c);
#endif		#endif

static vector unsigned char __ATTRS_o_ai vec_xor(vector unsigned char __a,		static vector unsigned char __ATTRS_o_ai vec_xor(vector unsigned char __a,
vector unsigned char __b);		vector unsigned char __b);

/* vec_abs */		/* vec_abs */
▲ Show 20 Lines • Show All 1,740 Lines • ▼ Show 20 Lines

/* vec_dstt */		/* vec_dstt */

static void __attribute__((__always_inline__))		static void __attribute__((__always_inline__))
vec_dstt(const void *__a, int __b, int __c) {		vec_dstt(const void *__a, int __b, int __c) {
__builtin_altivec_dstt(__a, __b, __c);		__builtin_altivec_dstt(__a, __b, __c);
}		}

		/* vec_eqv */

		#ifdef __POWER8_VECTOR__
		static vector signed char __ATTRS_o_ai vec_eqv(vector signed char __a,
		vector signed char __b) {
		return (vector signed char)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector signed char __ATTRS_o_ai vec_eqv(vector bool char __a,
		vector signed char __b) {
		return (vector signed char)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector signed char __ATTRS_o_ai vec_eqv(vector signed char __a,
		vector bool char __b) {
		return (vector signed char)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector unsigned char __ATTRS_o_ai vec_eqv(vector unsigned char __a,
		vector unsigned char __b) {
		return (vector unsigned char)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector unsigned char __ATTRS_o_ai vec_eqv(vector bool char __a,
		vector unsigned char __b) {
		return (vector unsigned char)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector unsigned char __ATTRS_o_ai vec_eqv(vector unsigned char __a,
		vector bool char __b) {
		return (vector unsigned char)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector signed short __ATTRS_o_ai vec_eqv(vector signed short __a,
		vector signed short __b) {
		return (vector signed short)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector signed short __ATTRS_o_ai vec_eqv(vector bool short __a,
		vector signed short __b) {
		return (vector signed short)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector signed short __ATTRS_o_ai vec_eqv(vector signed short __a,
		vector bool short __b) {
		return (vector signed short)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector unsigned short __ATTRS_o_ai vec_eqv(vector unsigned short __a,
		vector unsigned short __b) {
		return (vector unsigned short)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector unsigned short __ATTRS_o_ai vec_eqv(vector bool short __a,
		vector unsigned short __b) {
		return (vector unsigned short)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector unsigned short __ATTRS_o_ai vec_eqv(vector unsigned short __a,
		vector bool short __b) {
		return (vector unsigned short)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector signed int __ATTRS_o_ai vec_eqv(vector signed int __a,
		vector signed int __b) {
		return (vector signed int)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector signed int __ATTRS_o_ai vec_eqv(vector bool int __a,
		vector signed int __b) {
		return (vector signed int)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector signed int __ATTRS_o_ai vec_eqv(vector signed int __a,
		vector bool int __b) {
		return (vector signed int)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector unsigned int __ATTRS_o_ai vec_eqv(vector unsigned int __a,
		vector unsigned int __b) {
		return __builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector unsigned int __ATTRS_o_ai vec_eqv(vector bool int __a,
		vector unsigned int __b) {
		return __builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector unsigned int __ATTRS_o_ai vec_eqv(vector unsigned int __a,
		vector bool int __b) {
		return __builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector signed long long __ATTRS_o_ai
		vec_eqv(vector signed long long __a, vector signed long long __b) {
		return (vector signed long long)
		__builtin_vsx_xxleqv((vector unsigned int)__a, (vector unsigned int)__b);
		}

		static vector signed long long __ATTRS_o_ai
		vec_eqv(vector bool long long __a, vector signed long long __b) {
		return (vector signed long long)
		__builtin_vsx_xxleqv((vector unsigned int)__a, (vector unsigned int)__b);
		}

		static vector signed long long __ATTRS_o_ai
		vec_eqv(vector signed long long __a, vector bool long long __b) {
		return (vector signed long long)
		__builtin_vsx_xxleqv((vector unsigned int)__a, (vector unsigned int)__b);
		}

		static vector unsigned long long __ATTRS_o_ai
		vec_eqv(vector unsigned long long __a, vector unsigned long long __b) {
		return (vector unsigned long long)
		__builtin_vsx_xxleqv((vector unsigned int)__a, (vector unsigned int)__b);
		}

		static vector unsigned long long __ATTRS_o_ai
		vec_eqv(vector bool long long __a, vector unsigned long long __b) {
		return (vector unsigned long long)
		__builtin_vsx_xxleqv((vector unsigned int)__a, (vector unsigned int)__b);
		}

		static vector unsigned long long __ATTRS_o_ai
		vec_eqv(vector unsigned long long __a, vector bool long long __b) {
		return (vector unsigned long long)
		__builtin_vsx_xxleqv((vector unsigned int)__a, (vector unsigned int)__b);
		}

		static vector float __ATTRS_o_ai vec_eqv(vector float __a, vector float __b) {
		return (vector float)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector float __ATTRS_o_ai vec_eqv(vector bool int __a,
		vector float __b) {
		return (vector float)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector float __ATTRS_o_ai vec_eqv(vector float __a,
		vector bool int __b) {
		return (vector float)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector double __ATTRS_o_ai vec_eqv(vector double __a,
		vector double __b) {
		return (vector double)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector double __ATTRS_o_ai vec_eqv(vector bool long long __a,
		vector double __b) {
		return (vector double)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}

		static vector double __ATTRS_o_ai vec_eqv(vector double __a,
		vector bool long long __b) {
		return (vector double)__builtin_vsx_xxleqv((vector unsigned int)__a,
		(vector unsigned int)__b);
		}
		#endif

/* vec_expte */		/* vec_expte */

static vector float __attribute__((__always_inline__))		static vector float __attribute__((__always_inline__))
vec_expte(vector float __a) {		vec_expte(vector float __a) {
return __builtin_altivec_vexptefp(__a);		return __builtin_altivec_vexptefp(__a);
}		}

/* vec_vexptefp */		/* vec_vexptefp */
▲ Show 20 Lines • Show All 3,125 Lines • ▼ Show 20 Lines	#ifdef __LITTLE_ENDIAN__
return (vector bool char)__builtin_altivec_vperm_4si((vector int)__b,		return (vector bool char)__builtin_altivec_vperm_4si((vector int)__b,
(vector int)__a, __d);		(vector int)__a, __d);
#else		#else
return (vector bool char)__builtin_altivec_vperm_4si((vector int)__a,		return (vector bool char)__builtin_altivec_vperm_4si((vector int)__a,
(vector int)__b, __c);		(vector int)__b, __c);
#endif		#endif
}		}

static vector short __ATTRS_o_ai vec_perm(vector short __a, vector short __b,		static vector short __ATTRS_o_ai vec_perm(vector signed short __a,
		vector signed short __b,
vector unsigned char __c) {		vector unsigned char __c) {
#ifdef __LITTLE_ENDIAN__		#ifdef __LITTLE_ENDIAN__
vector unsigned char __d = {255, 255, 255, 255, 255, 255, 255, 255,		vector unsigned char __d = {255, 255, 255, 255, 255, 255, 255, 255,
255, 255, 255, 255, 255, 255, 255, 255};		255, 255, 255, 255, 255, 255, 255, 255};
__d = vec_xor(__c, __d);		__d = vec_xor(__c, __d);
return (vector short)__builtin_altivec_vperm_4si((vector int)__b,		return (vector short)__builtin_altivec_vperm_4si((vector int)__b,
(vector int)__a, __d);		(vector int)__a, __d);
#else		#else
▲ Show 20 Lines • Show All 41 Lines • ▼ Show 20 Lines	#ifdef __LITTLE_ENDIAN__
return (vector pixel)__builtin_altivec_vperm_4si((vector int)__b,		return (vector pixel)__builtin_altivec_vperm_4si((vector int)__b,
(vector int)__a, __d);		(vector int)__a, __d);
#else		#else
return (vector pixel)__builtin_altivec_vperm_4si((vector int)__a,		return (vector pixel)__builtin_altivec_vperm_4si((vector int)__a,
(vector int)__b, __c);		(vector int)__b, __c);
#endif		#endif
}		}

static vector int __ATTRS_o_ai vec_perm(vector int __a, vector int __b,		static vector int __ATTRS_o_ai vec_perm(vector signed int __a,
		vector signed int __b,
vector unsigned char __c) {		vector unsigned char __c) {
#ifdef __LITTLE_ENDIAN__		#ifdef __LITTLE_ENDIAN__
vector unsigned char __d = {255, 255, 255, 255, 255, 255, 255, 255,		vector unsigned char __d = {255, 255, 255, 255, 255, 255, 255, 255,
255, 255, 255, 255, 255, 255, 255, 255};		255, 255, 255, 255, 255, 255, 255, 255};
__d = vec_xor(__c, __d);		__d = vec_xor(__c, __d);
return (vector int)__builtin_altivec_vperm_4si(__b, __a, __d);		return (vector int)__builtin_altivec_vperm_4si(__b, __a, __d);
#else		#else
return (vector int)__builtin_altivec_vperm_4si(__a, __b, __c);		return (vector int)__builtin_altivec_vperm_4si(__a, __b, __c);
Show All 40 Lines	return (vector float)__builtin_altivec_vperm_4si((vector int)__b,
(vector int)__a, __d);		(vector int)__a, __d);
#else		#else
return (vector float)__builtin_altivec_vperm_4si((vector int)__a,		return (vector float)__builtin_altivec_vperm_4si((vector int)__a,
(vector int)__b, __c);		(vector int)__b, __c);
#endif		#endif
}		}

#ifdef __VSX__		#ifdef __VSX__
static vector long long __ATTRS_o_ai vec_perm(vector long long __a,		static vector long long __ATTRS_o_ai vec_perm(vector signed long long __a,
vector long long __b,		vector signed long long __b,
vector unsigned char __c) {		vector unsigned char __c) {
#ifdef __LITTLE_ENDIAN__		#ifdef __LITTLE_ENDIAN__
vector unsigned char __d = {255, 255, 255, 255, 255, 255, 255, 255,		vector unsigned char __d = {255, 255, 255, 255, 255, 255, 255, 255,
255, 255, 255, 255, 255, 255, 255, 255};		255, 255, 255, 255, 255, 255, 255, 255};
__d = vec_xor(__c, __d);		__d = vec_xor(__c, __d);
return (vector long long)__builtin_altivec_vperm_4si(__b, __a, __d);		return (vector long long)__builtin_altivec_vperm_4si(__b, __a, __d);
#else		#else
return (vector long long)__builtin_altivec_vperm_4si(__a, __b, __c);		return (vector long long)__builtin_altivec_vperm_4si(__a, __b, __c);
Show All 10 Lines	#ifdef __LITTLE_ENDIAN__
return (vector unsigned long long)__builtin_altivec_vperm_4si(		return (vector unsigned long long)__builtin_altivec_vperm_4si(
(vector int)__b, (vector int)__a, __d);		(vector int)__b, (vector int)__a, __d);
#else		#else
return (vector unsigned long long)__builtin_altivec_vperm_4si(		return (vector unsigned long long)__builtin_altivec_vperm_4si(
(vector int)__a, (vector int)__b, __c);		(vector int)__a, (vector int)__b, __c);
#endif		#endif
}		}

		/* vec_perm overload for vector bool long long. Both data operands are cast
		   to vector int and handed to __builtin_altivec_vperm_4si together with a
		   byte control vector; the result is cast back to vector bool long long. */
		static vector bool long long __ATTRS_o_ai
		vec_perm(vector bool long long __a, vector bool long long __b,
		vector unsigned char __c) {
		#ifdef __LITTLE_ENDIAN__
		/* Little-endian path: XOR every control byte with 255 (a bytewise
		   complement of __c) and pass the data operands in swapped order
		   (__b first, then __a). */
		vector unsigned char __d = {255, 255, 255, 255, 255, 255, 255, 255,
		255, 255, 255, 255, 255, 255, 255, 255};
		__d = vec_xor(__c, __d);
		return (vector bool long long)__builtin_altivec_vperm_4si(
		(vector int)__b, (vector int)__a, __d);
		#else
		/* Otherwise the operands and the control vector __c are passed through
		   in their original order, unmodified. */
		return (vector bool long long)__builtin_altivec_vperm_4si(
		(vector int)__a, (vector int)__b, __c);
		#endif
		}

static vector double __ATTRS_o_ai vec_perm(vector double __a, vector double __b,		static vector double __ATTRS_o_ai vec_perm(vector double __a, vector double __b,
vector unsigned char __c) {		vector unsigned char __c) {
#ifdef __LITTLE_ENDIAN__		#ifdef __LITTLE_ENDIAN__
vector unsigned char __d = {255, 255, 255, 255, 255, 255, 255, 255,		vector unsigned char __d = {255, 255, 255, 255, 255, 255, 255, 255,
255, 255, 255, 255, 255, 255, 255, 255};		255, 255, 255, 255, 255, 255, 255, 255};
__d = vec_xor(__c, __d);		__d = vec_xor(__c, __d);
return (vector double)__builtin_altivec_vperm_4si((vector int)__b,		return (vector double)__builtin_altivec_vperm_4si((vector int)__b,
(vector int)__a, __d);		(vector int)__a, __d);
▲ Show 20 Lines • Show All 178 Lines • ▼ Show 20 Lines

static vector unsigned int __ATTRS_o_ai vec_vrlw(vector unsigned int __a,		static vector unsigned int __ATTRS_o_ai vec_vrlw(vector unsigned int __a,
vector unsigned int __b) {		vector unsigned int __b) {
return (vector unsigned int)__builtin_altivec_vrlw((vector int)__a, __b);		return (vector unsigned int)__builtin_altivec_vrlw((vector int)__a, __b);
}		}

/* vec_round */		/* vec_round */

static vector float __attribute__((__always_inline__))		static vector float __ATTRS_o_ai vec_round(vector float __a) {
vec_round(vector float __a) {		#ifdef __VSX__
		return __builtin_vsx_xvrspi(__a);
		#else
return __builtin_altivec_vrfin(__a);		return __builtin_altivec_vrfin(__a);
		#endif
}		}

#ifdef __VSX__		#ifdef __VSX__
		/* vec_round overload for vector double: returns the result of
		   __builtin_vsx_xvrdpi applied to __a. */
		static vector double __ATTRS_o_ai vec_round(vector double __a) {
		return __builtin_vsx_xvrdpi(__a);
		}

/* vec_rint */		/* vec_rint */

static vector float __ATTRS_o_ai		static vector float __ATTRS_o_ai
vec_rint(vector float __a) {		vec_rint(vector float __a) {
return __builtin_vsx_xvrspic(__a);		return __builtin_vsx_xvrspic(__a);
}		}

static vector double __ATTRS_o_ai		static vector double __ATTRS_o_ai
▲ Show 20 Lines • Show All 401 Lines • ▼ Show 20 Lines
}		}

/* vec_sld */		/* vec_sld */

#define __builtin_altivec_vsldoi_4si vec_sld		#define __builtin_altivec_vsldoi_4si vec_sld

static vector signed char __ATTRS_o_ai vec_sld(vector signed char __a,		static vector signed char __ATTRS_o_ai vec_sld(vector signed char __a,
vector signed char __b,		vector signed char __b,
unsigned char __c) {		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
return vec_perm(		return vec_perm(
__a, __b,		__a, __b,
(vector unsigned char)(__c, __c + 1, __c + 2, __c + 3, __c + 4, __c + 5,		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
__c + 6, __c + 7, __c + 8, __c + 9, __c + 10,		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
__c + 11, __c + 12, __c + 13, __c + 14, __c + 15));		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
}		}

static vector unsigned char __ATTRS_o_ai vec_sld(vector unsigned char __a,		static vector unsigned char __ATTRS_o_ai vec_sld(vector unsigned char __a,
vector unsigned char __b,		vector unsigned char __b,
unsigned char __c) {		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
return vec_perm(		return vec_perm(
__a, __b,		__a, __b,
(vector unsigned char)(__c, __c + 1, __c + 2, __c + 3, __c + 4, __c + 5,		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
__c + 6, __c + 7, __c + 8, __c + 9, __c + 10,		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
__c + 11, __c + 12, __c + 13, __c + 14, __c + 15));		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
}		}

static vector short __ATTRS_o_ai vec_sld(vector short __a, vector short __b,		static vector bool char __ATTRS_o_ai vec_sld(vector bool char __a,
unsigned char __c) {		vector bool char __b,
		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
return vec_perm(		return vec_perm(
__a, __b,		__a, __b,
(vector unsigned char)(__c, __c + 1, __c + 2, __c + 3, __c + 4, __c + 5,		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
__c + 6, __c + 7, __c + 8, __c + 9, __c + 10,		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
__c + 11, __c + 12, __c + 13, __c + 14, __c + 15));		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
		}

		static vector signed short __ATTRS_o_ai vec_sld(vector signed short __a,
		vector signed short __b,
		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
		return vec_perm(
		__a, __b,
		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
}		}

static vector unsigned short __ATTRS_o_ai vec_sld(vector unsigned short __a,		static vector unsigned short __ATTRS_o_ai vec_sld(vector unsigned short __a,
vector unsigned short __b,		vector unsigned short __b,
unsigned char __c) {		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
return vec_perm(		return vec_perm(
__a, __b,		__a, __b,
(vector unsigned char)(__c, __c + 1, __c + 2, __c + 3, __c + 4, __c + 5,		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
__c + 6, __c + 7, __c + 8, __c + 9, __c + 10,		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
__c + 11, __c + 12, __c + 13, __c + 14, __c + 15));		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
		}

		static vector bool short __ATTRS_o_ai vec_sld(vector bool short __a,
		vector bool short __b,
		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
		return vec_perm(
		__a, __b,
		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
}		}

static vector pixel __ATTRS_o_ai vec_sld(vector pixel __a, vector pixel __b,		static vector pixel __ATTRS_o_ai vec_sld(vector pixel __a, vector pixel __b,
unsigned char __c) {		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
return vec_perm(		return vec_perm(
__a, __b,		__a, __b,
(vector unsigned char)(__c, __c + 1, __c + 2, __c + 3, __c + 4, __c + 5,		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
__c + 6, __c + 7, __c + 8, __c + 9, __c + 10,		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
__c + 11, __c + 12, __c + 13, __c + 14, __c + 15));		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
}		}

static vector int __ATTRS_o_ai vec_sld(vector int __a, vector int __b,		static vector signed int __ATTRS_o_ai vec_sld(vector signed int __a,
unsigned char __c) {		vector signed int __b,
		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
return vec_perm(		return vec_perm(
__a, __b,		__a, __b,
(vector unsigned char)(__c, __c + 1, __c + 2, __c + 3, __c + 4, __c + 5,		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
__c + 6, __c + 7, __c + 8, __c + 9, __c + 10,		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
__c + 11, __c + 12, __c + 13, __c + 14, __c + 15));		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
}		}

static vector unsigned int __ATTRS_o_ai vec_sld(vector unsigned int __a,		static vector unsigned int __ATTRS_o_ai vec_sld(vector unsigned int __a,
vector unsigned int __b,		vector unsigned int __b,
unsigned char __c) {		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
return vec_perm(		return vec_perm(
__a, __b,		__a, __b,
(vector unsigned char)(__c, __c + 1, __c + 2, __c + 3, __c + 4, __c + 5,		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
__c + 6, __c + 7, __c + 8, __c + 9, __c + 10,		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
__c + 11, __c + 12, __c + 13, __c + 14, __c + 15));		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
		}

		static vector bool int __ATTRS_o_ai vec_sld(vector bool int __a,
		vector bool int __b,
		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
		return vec_perm(
		__a, __b,
		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
}		}

static vector float __ATTRS_o_ai vec_sld(vector float __a, vector float __b,		static vector float __ATTRS_o_ai vec_sld(vector float __a, vector float __b,
unsigned char __c) {		unsigned const int __c) {
		unsigned char __d = __c & 0x0F;
return vec_perm(		return vec_perm(
__a, __b,		__a, __b,
(vector unsigned char)(__c, __c + 1, __c + 2, __c + 3, __c + 4, __c + 5,		(vector unsigned char)(__d, __d + 1, __d + 2, __d + 3, __d + 4, __d + 5,
__c + 6, __c + 7, __c + 8, __c + 9, __c + 10,		__d + 6, __d + 7, __d + 8, __d + 9, __d + 10,
__c + 11, __c + 12, __c + 13, __c + 14, __c + 15));		__d + 11, __d + 12, __d + 13, __d + 14, __d + 15));
}		}

/* vec_vsldoi */		/* vec_vsldoi */

static vector signed char __ATTRS_o_ai vec_vsldoi(vector signed char __a,		static vector signed char __ATTRS_o_ai vec_vsldoi(vector signed char __a,
vector signed char __b,		vector signed char __b,
unsigned char __c) {		unsigned char __c) {
return vec_perm(		return vec_perm(
▲ Show 20 Lines • Show All 592 Lines • ▼ Show 20 Lines
static vector float __ATTRS_o_ai vec_vslo(vector float __a,		static vector float __ATTRS_o_ai vec_vslo(vector float __a,
vector unsigned char __b) {		vector unsigned char __b) {
return (vector float)__builtin_altivec_vslo((vector int)__a, (vector int)__b);		return (vector float)__builtin_altivec_vslo((vector int)__a, (vector int)__b);
}		}

/* vec_splat */		/* vec_splat */

static vector signed char __ATTRS_o_ai vec_splat(vector signed char __a,		static vector signed char __ATTRS_o_ai vec_splat(vector signed char __a,
unsigned char __b) {		unsigned const int __b) {
return vec_perm(__a, __a, (vector unsigned char)(__b));		return vec_perm(__a, __a, (vector unsigned char)(__b & 0x0F));
}		}

static vector unsigned char __ATTRS_o_ai vec_splat(vector unsigned char __a,		static vector unsigned char __ATTRS_o_ai vec_splat(vector unsigned char __a,
unsigned char __b) {		unsigned const int __b) {
return vec_perm(__a, __a, (vector unsigned char)(__b));		return vec_perm(__a, __a, (vector unsigned char)(__b & 0x0F));
		wschmidtUnsubmitted Done Reply Inline Actions Missing the & 0x0F here. wschmidt: Missing the & 0x0F here.
		nemanjaiAuthorUnsubmitted Not Done Reply Inline Actions Great catch, thank you. nemanjai: Great catch, thank you.
}		}

static vector bool char __ATTRS_o_ai vec_splat(vector bool char __a,		static vector bool char __ATTRS_o_ai vec_splat(vector bool char __a,
unsigned char __b) {		unsigned const int __b) {
return vec_perm(__a, __a, (vector unsigned char)(__b));		return vec_perm(__a, __a, (vector unsigned char)(__b & 0x0F));
}		}

static vector short __ATTRS_o_ai vec_splat(vector short __a,		static vector signed short __ATTRS_o_ai vec_splat(vector signed short __a,
unsigned char __b) {		unsigned const int __b) {
__b *= 2;		unsigned char b0 = (__b & 0x07) * 2;
unsigned char b1 = __b + 1;		unsigned char b1 = b0 + 1;
return vec_perm(__a, __a,		return vec_perm(__a, __a,
(vector unsigned char)(__b, b1, __b, b1, __b, b1, __b, b1,		(vector unsigned char)(b0, b1, b0, b1, b0, b1, b0, b1,
__b, b1, __b, b1, __b, b1, __b, b1));		b0, b1, b0, b1, b0, b1, b0, b1));
}		}

static vector unsigned short __ATTRS_o_ai vec_splat(vector unsigned short __a,		static vector unsigned short __ATTRS_o_ai vec_splat(vector unsigned short __a,
unsigned char __b) {		unsigned const int __b) {
__b *= 2;		unsigned char b0 = (__b & 0x07) * 2;
unsigned char b1 = __b + 1;		unsigned char b1 = b0 + 1;
return vec_perm(__a, __a,		return vec_perm(__a, __a,
(vector unsigned char)(__b, b1, __b, b1, __b, b1, __b, b1,		(vector unsigned char)(b0, b1, b0, b1, b0, b1, b0, b1,
__b, b1, __b, b1, __b, b1, __b, b1));		b0, b1, b0, b1, b0, b1, b0, b1));
}		}

static vector bool short __ATTRS_o_ai vec_splat(vector bool short __a,		static vector bool short __ATTRS_o_ai vec_splat(vector bool short __a,
unsigned char __b) {		unsigned const int __b) {
__b *= 2;		unsigned char b0 = (__b & 0x07) * 2;
unsigned char b1 = __b + 1;		unsigned char b1 = b0 + 1;
return vec_perm(__a, __a,		return vec_perm(__a, __a,
(vector unsigned char)(__b, b1, __b, b1, __b, b1, __b, b1,		(vector unsigned char)(b0, b1, b0, b1, b0, b1, b0, b1,
__b, b1, __b, b1, __b, b1, __b, b1));		b0, b1, b0, b1, b0, b1, b0, b1));
}		}

static vector pixel __ATTRS_o_ai vec_splat(vector pixel __a,		static vector pixel __ATTRS_o_ai vec_splat(vector pixel __a,
unsigned char __b) {		unsigned const int __b) {
__b *= 2;		unsigned char b0 = (__b & 0x07) * 2;
unsigned char b1 = __b + 1;		unsigned char b1 = b0 + 1;
return vec_perm(__a, __a,		return vec_perm(__a, __a,
(vector unsigned char)(__b, b1, __b, b1, __b, b1, __b, b1,		(vector unsigned char)(b0, b1, b0, b1, b0, b1, b0, b1,
__b, b1, __b, b1, __b, b1, __b, b1));		b0, b1, b0, b1, b0, b1, b0, b1));
}		}

static vector int __ATTRS_o_ai vec_splat(vector int __a, unsigned char __b) {		static vector signed int __ATTRS_o_ai vec_splat(vector signed int __a,
__b *= 4;		unsigned const int __b) {
unsigned char b1 = __b + 1, b2 = __b + 2, b3 = __b + 3;		unsigned char b0 = (__b & 0x03) * 4;
		unsigned char b1 = b0 + 1, b2 = b0 + 2, b3 = b0 + 3;
return vec_perm(__a, __a,		return vec_perm(__a, __a,
(vector unsigned char)(__b, b1, b2, b3, __b, b1, b2, b3, __b,		(vector unsigned char)(b0, b1, b2, b3, b0, b1, b2, b3, b0,
b1, b2, b3, __b, b1, b2, b3));		b1, b2, b3, b0, b1, b2, b3));
}		}

static vector unsigned int __ATTRS_o_ai vec_splat(vector unsigned int __a,		static vector unsigned int __ATTRS_o_ai vec_splat(vector unsigned int __a,
unsigned char __b) {		unsigned const int __b) {
__b *= 4;		unsigned char b0 = (__b & 0x03) * 4;
unsigned char b1 = __b + 1, b2 = __b + 2, b3 = __b + 3;		unsigned char b1 = b0 + 1, b2 = b0 + 2, b3 = b0 + 3;
return vec_perm(__a, __a,		return vec_perm(__a, __a,
(vector unsigned char)(__b, b1, b2, b3, __b, b1, b2, b3, __b,		(vector unsigned char)(b0, b1, b2, b3, b0, b1, b2, b3, b0,
b1, b2, b3, __b, b1, b2, b3));		b1, b2, b3, b0, b1, b2, b3));
}		}

static vector bool int __ATTRS_o_ai vec_splat(vector bool int __a,		static vector bool int __ATTRS_o_ai vec_splat(vector bool int __a,
unsigned char __b) {		unsigned const int __b) {
__b *= 4;		unsigned char b0 = (__b & 0x03) * 4;
unsigned char b1 = __b + 1, b2 = __b + 2, b3 = __b + 3;		unsigned char b1 = b0 + 1, b2 = b0 + 2, b3 = b0 + 3;
return vec_perm(__a, __a,		return vec_perm(__a, __a,
(vector unsigned char)(__b, b1, b2, b3, __b, b1, b2, b3, __b,		(vector unsigned char)(b0, b1, b2, b3, b0, b1, b2, b3, b0,
b1, b2, b3, __b, b1, b2, b3));		b1, b2, b3, b0, b1, b2, b3));
}		}

static vector float __ATTRS_o_ai vec_splat(vector float __a,		static vector float __ATTRS_o_ai vec_splat(vector float __a,
unsigned char __b) {		unsigned const int __b) {
__b *= 4;		unsigned char b0 = (__b & 0x03) * 4;
unsigned char b1 = __b + 1, b2 = __b + 2, b3 = __b + 3;		unsigned char b1 = b0 + 1, b2 = b0 + 2, b3 = b0 + 3;
return vec_perm(__a, __a,		return vec_perm(__a, __a,
(vector unsigned char)(__b, b1, b2, b3, __b, b1, b2, b3, __b,		(vector unsigned char)(b0, b1, b2, b3, b0, b1, b2, b3, b0,
b1, b2, b3, __b, b1, b2, b3));		b1, b2, b3, b0, b1, b2, b3));
}		}

		#ifdef __VSX__
		/* vec_splat overload for vector double. Builds a 16-byte control vector
		   that repeats the eight consecutive byte indices b0..b0+7 twice and
		   passes it to vec_perm(__a, __a, ...). */
		static vector double __ATTRS_o_ai vec_splat(vector double __a,
		unsigned const int __b) {
		/* Only bit 0 of __b is kept, so b0 is either 0 or 8. */
		unsigned char b0 = (__b & 0x01) * 8;
		unsigned char b1 = b0 + 1, b2 = b0 + 2, b3 = b0 + 3, b4 = b0 + 4,
		b5 = b0 + 5, b6 = b0 + 6, b7 = b0 + 7;
		return vec_perm(__a, __a,
		(vector unsigned char)(b0, b1, b2, b3, b4, b5, b6, b7,
		b0, b1, b2, b3, b4, b5, b6, b7));
		}
		/* vec_splat overload for vector bool long long. Builds a 16-byte control
		   vector that repeats the eight consecutive byte indices b0..b0+7 twice
		   and passes it to vec_perm(__a, __a, ...). */
		static vector bool long long __ATTRS_o_ai vec_splat(vector bool long long __a,
		unsigned const int __b) {
		/* Only bit 0 of __b is kept, so b0 is either 0 or 8. */
		unsigned char b0 = (__b & 0x01) * 8;
		unsigned char b1 = b0 + 1, b2 = b0 + 2, b3 = b0 + 3, b4 = b0 + 4,
		b5 = b0 + 5, b6 = b0 + 6, b7 = b0 + 7;
		return vec_perm(__a, __a,
		(vector unsigned char)(b0, b1, b2, b3, b4, b5, b6, b7,
		b0, b1, b2, b3, b4, b5, b6, b7));
		}
		/* vec_splat overload for vector signed long long. Builds a 16-byte control
		   vector that repeats the eight consecutive byte indices b0..b0+7 twice
		   and passes it to vec_perm(__a, __a, ...). */
		static vector signed long long __ATTRS_o_ai
		vec_splat(vector signed long long __a, unsigned const int __b) {
		/* Only bit 0 of __b is kept, so b0 is either 0 or 8. */
		unsigned char b0 = (__b & 0x01) * 8;
		unsigned char b1 = b0 + 1, b2 = b0 + 2, b3 = b0 + 3, b4 = b0 + 4,
		b5 = b0 + 5, b6 = b0 + 6, b7 = b0 + 7;
		return vec_perm(__a, __a,
		(vector unsigned char)(b0, b1, b2, b3, b4, b5, b6, b7,
		b0, b1, b2, b3, b4, b5, b6, b7));
		}
		/* vec_splat overload for vector unsigned long long. Builds a 16-byte
		   control vector that repeats the eight consecutive byte indices
		   b0..b0+7 twice and passes it to vec_perm(__a, __a, ...). */
		static vector unsigned long long __ATTRS_o_ai
		vec_splat(vector unsigned long long __a, unsigned const int __b) {
		/* Only bit 0 of __b is kept, so b0 is either 0 or 8. */
		unsigned char b0 = (__b & 0x01) * 8;
		unsigned char b1 = b0 + 1, b2 = b0 + 2, b3 = b0 + 3, b4 = b0 + 4,
		b5 = b0 + 5, b6 = b0 + 6, b7 = b0 + 7;
		return vec_perm(__a, __a,
		(vector unsigned char)(b0, b1, b2, b3, b4, b5, b6, b7,
		b0, b1, b2, b3, b4, b5, b6, b7));
		}
		#endif

/* vec_vspltb */		/* vec_vspltb */

#define __builtin_altivec_vspltb vec_vspltb		#define __builtin_altivec_vspltb vec_vspltb

static vector signed char __ATTRS_o_ai vec_vspltb(vector signed char __a,		static vector signed char __ATTRS_o_ai vec_vspltb(vector signed char __a,
unsigned char __b) {		unsigned char __b) {
return vec_perm(__a, __a, (vector unsigned char)(__b));		return vec_perm(__a, __a, (vector unsigned char)(__b));
}		}
▲ Show 20 Lines • Show All 155 Lines • ▼ Show 20 Lines
static vector unsigned int __ATTRS_o_ai vec_splat_u32(signed char __a) {		static vector unsigned int __ATTRS_o_ai vec_splat_u32(signed char __a) {
return (vector unsigned int)(__a);		return (vector unsigned int)(__a);
}		}

/* vec_sr */		/* vec_sr */

static vector signed char __ATTRS_o_ai vec_sr(vector signed char __a,		static vector signed char __ATTRS_o_ai vec_sr(vector signed char __a,
vector unsigned char __b) {		vector unsigned char __b) {
return __a >> (vector signed char)__b;		vector unsigned char __res = (vector unsigned char)__a >> __b;
		return (vector signed char)__res;
}		}

static vector unsigned char __ATTRS_o_ai vec_sr(vector unsigned char __a,		static vector unsigned char __ATTRS_o_ai vec_sr(vector unsigned char __a,
vector unsigned char __b) {		vector unsigned char __b) {
return __a >> __b;		return __a >> __b;
}		}

static vector short __ATTRS_o_ai vec_sr(vector short __a,		static vector signed short __ATTRS_o_ai vec_sr(vector signed short __a,
vector unsigned short __b) {		vector unsigned short __b) {
return __a >> (vector short)__b;		vector unsigned short __res = (vector unsigned short)__a >> __b;
		return (vector signed short)__res;
}		}

static vector unsigned short __ATTRS_o_ai vec_sr(vector unsigned short __a,		static vector unsigned short __ATTRS_o_ai vec_sr(vector unsigned short __a,
vector unsigned short __b) {		vector unsigned short __b) {
return __a >> __b;		return __a >> __b;
}		}

static vector int __ATTRS_o_ai vec_sr(vector int __a, vector unsigned int __b) {		static vector signed int __ATTRS_o_ai vec_sr(vector signed int __a,
return __a >> (vector int)__b;		vector unsigned int __b) {
		vector unsigned int __res = (vector unsigned int)__a >> __b;
		return (vector signed int)__res;
}		}

static vector unsigned int __ATTRS_o_ai vec_sr(vector unsigned int __a,		static vector unsigned int __ATTRS_o_ai vec_sr(vector unsigned int __a,
vector unsigned int __b) {		vector unsigned int __b) {
return __a >> __b;		return __a >> __b;
}		}

#ifdef __POWER8_VECTOR__		#ifdef __POWER8_VECTOR__
static vector signed long long __ATTRS_o_ai		static vector signed long long __ATTRS_o_ai
vec_sr(vector signed long long __a, vector unsigned long long __b) {		vec_sr(vector signed long long __a, vector unsigned long long __b) {
return __a >> (vector long long)__b;		vector unsigned long long __res = (vector unsigned long long)__a >> __b;
		return (vector signed long long)__res;
}		}
		wschmidtUnsubmitted Not Done Reply Inline Actions Seems like too much casting above. It's ok to just use the original code here (and make "vector long long" into "vector unsigned long long"). The instruction will mask off all but the rightmost 6 bits of each element of b, so the signedness doesn't matter. wschmidt: Seems like too much casting above. It's ok to just use the original code here (and make…
		nemanjaiAuthorUnsubmitted Not Done Reply Inline Actions I am not sure if you are referring only to the vector long long overload of vec_sr or to all of them. In any case, the reason for the casts is that Clang will produce an `lshr` when the LHS is unsigned and an `ashr` when the LHS is signed. This is what was causing LLVM to emit `vsr[bhwd]` for the unsigned ones and `vsra[bhwd]` for the signed ones. So the casts are simply to ensure that the IR contains the `lshr` instructions rather than `ashr/lshr` depending on signedness. Of course, I could have just defined builtins and called the same one for both signed and unsigned overloads, but I assumed that since IR instructions exist for this, it is better to retain the information about what operation is actually being performed in case the optimizer can use it. nemanjai: I am not sure if you are referring only to the vector long long overload of vec_sr or to all of…
		wschmidtUnsubmitted Not Done Reply Inline Actions You have wrongly changed the instruction to be generated. The user has chosen vec_sr, which means the user wants vsr[bhwd]. If they wanted vsra[bhwd], they could have chosen vec_sra. See figures 4-120 and 4-121 of http://www.freescale.com/files/32bit/doc/ref_manual/ALTIVECPIM.pdf to see the required instruction mappings. wschmidt: You have wrongly changed the instruction to be generated. The user has chosen vec_sr, which…
		wschmidtUnsubmitted Not Done Reply Inline Actions Note that in this case we are adding code for the vector long long operands, which is not described in the PIM. But we should be consistent with existing behavior for the other types. wschmidt: Note that in this case we are adding code for the vector long long operands, which is not…
		wschmidtUnsubmitted Not Done Reply Inline Actions OK, I take it back, I misread the code. We were already generating the wrong instruction here. Carry on... ;) wschmidt: OK, I take it back, I misread the code. We were already generating the wrong instruction here.

static vector unsigned long long __ATTRS_o_ai		static vector unsigned long long __ATTRS_o_ai
vec_sr(vector unsigned long long __a, vector unsigned long long __b) {		vec_sr(vector unsigned long long __a, vector unsigned long long __b) {
return __a >> __b;		return __a >> __b;
}		}
#endif		#endif

/* vec_vsrb */		/* vec_vsrb */
▲ Show 20 Lines • Show All 5,722 Lines • Show Last 20 Lines

test/CodeGen/builtins-ppc-altivec.c

Show First 20 Lines • Show All 3,266 Lines • ▼ Show 20 Lines	// CHECK-LE: @llvm.ppc.altivec.vperm
res_vs = vec_sld(vs, vs, 0);		res_vs = vec_sld(vs, vs, 0);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

res_vus = vec_sld(vus, vus, 0);		res_vus = vec_sld(vus, vus, 0);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

		res_vbs = vec_sld(vbs, vbs, 0);
		// CHECK: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>
		// CHECK-LE: xor <16 x i8>
		// CHECK-LE: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>

res_vp = vec_sld(vp, vp, 0);		res_vp = vec_sld(vp, vp, 0);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

res_vi = vec_sld(vi, vi, 0);		res_vi = vec_sld(vi, vi, 0);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

res_vui = vec_sld(vui, vui, 0);		res_vui = vec_sld(vui, vui, 0);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

		res_vbi = vec_sld(vbi, vbi, 0);
		// CHECK: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> {{.+}}, <4 x i32> {{.+}}, <16 x i8>
		// CHECK-LE: xor <16 x i8>
		// CHECK-LE: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> {{.+}}, <4 x i32> {{.+}}, <16 x i8>

res_vf = vec_sld(vf, vf, 0);		res_vf = vec_sld(vf, vf, 0);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

res_vsc = vec_vsldoi(vsc, vsc, 0);		res_vsc = vec_vsldoi(vsc, vsc, 0);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

▲ Show 20 Lines • Show All 5,405 Lines • Show Last 20 Lines

test/CodeGen/builtins-ppc-p8vector.c

// REQUIRES: powerpc-registered-target		// REQUIRES: powerpc-registered-target
// RUN: %clang_cc1 -faltivec -target-feature +power8-vector -triple powerpc64-unknown-unknown -emit-llvm %s -o - \| FileCheck %s		// RUN: %clang_cc1 -faltivec -target-feature +power8-vector -triple powerpc64-unknown-unknown -emit-llvm %s -o - \| FileCheck %s
// RUN: %clang_cc1 -faltivec -target-feature +power8-vector -triple powerpc64le-unknown-unknown -emit-llvm %s -o - \| FileCheck %s -check-prefix=CHECK-LE		// RUN: %clang_cc1 -faltivec -target-feature +power8-vector -triple powerpc64le-unknown-unknown -emit-llvm %s -o - \| FileCheck %s -check-prefix=CHECK-LE
// RUN: not %clang_cc1 -faltivec -target-feature +vsx -triple powerpc64-unknown-unknown -emit-llvm %s -o - 2>&1 \| FileCheck %s -check-prefix=CHECK-PPC		// RUN: not %clang_cc1 -faltivec -target-feature +vsx -triple powerpc64-unknown-unknown -emit-llvm %s -o - 2>&1 \| FileCheck %s -check-prefix=CHECK-PPC
// Added -target-feature +vsx above to avoid errors about "vector double" and to		// Added -target-feature +vsx above to avoid errors about "vector double" and to
// generate the correct errors for functions that are only overloaded with VSX		// generate the correct errors for functions that are only overloaded with VSX
// (vec_cmpge, vec_cmple). Without this option, there is only one overload so		// (vec_cmpge, vec_cmple). Without this option, there is only one overload so
// it is selected.		// it is selected.

vector signed char vsc = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 0, 1, 2, 3, 4, 5 };		vector signed char vsc = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 0, 1, 2, 3, 4, 5 };
vector unsigned char vuc = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 0, 1, 2, 3, 4, 5 };		vector unsigned char vuc = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 0, 1, 2, 3, 4, 5 };
vector int vi = { -1, 2, -3, 4 };		vector bool char vbc = { 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1 };

		vector signed short vss = { 0, 1, 2, 3, 4, 5, 6, 7 };
		vector unsigned short vus = { 0, 1, 2, 3, 4, 5, 6, 7 };
		vector bool short vbs = { 1, 1, 0, 0, 0, 0, 1, 1 };

		vector signed int vsi = { -1, 2, -3, 4 };
vector unsigned int vui = { 1, 2, 3, 4 };		vector unsigned int vui = { 1, 2, 3, 4 };
vector bool int vbi = {0, -1, -1, 0};		vector bool int vbi = {0, -1, -1, 0};
vector bool long long vbll = { 1, 0 };
vector signed long long vsll = { 1, 2 };		vector signed long long vsll = { 1, 2 };
vector unsigned long long vull = { 1, 2 };		vector unsigned long long vull = { 1, 2 };
		vector bool long long vbll = { 1, 0 };

		vector float vfa = { 1.e-4f, -132.23f, -22.1, 32.00f };
vector double vda = { 1.e-11, -132.23e10 };		vector double vda = { 1.e-11, -132.23e10 };

int res_i;		int res_i;
vector signed char res_vsc;		vector signed char res_vsc;
vector unsigned char res_vuc;		vector unsigned char res_vuc;
vector int res_vi;		vector bool char res_vbc;

		vector signed short res_vss;
		vector unsigned short res_vus;
		vector bool short res_vbs;

		vector int res_vsi;
vector unsigned int res_vui;		vector unsigned int res_vui;
vector bool int res_vbi;		vector bool int res_vbi;
vector bool long long res_vbll;
vector signed long long res_vsll;		vector signed long long res_vsll;
vector unsigned long long res_vull;		vector unsigned long long res_vull;
		vector bool long long res_vbll;

		vector double res_vf;
vector double res_vd;		vector double res_vd;

// CHECK-LABEL: define void @test1		// CHECK-LABEL: define void @test1
void test1() {		void test1() {

/* vec_abs */		/* vec_abs */
res_vsll = vec_abs(vsll);		res_vsll = vec_abs(vsll);
// CHECK: call <2 x i64> @llvm.ppc.altivec.vmaxsd(<2 x i64> %{{[0-9]*}}, <2 x i64>		// CHECK: call <2 x i64> @llvm.ppc.altivec.vmaxsd(<2 x i64> %{{[0-9]*}}, <2 x i64>
Show All 18 Lines
// CHECK-LE: add <2 x i64>		// CHECK-LE: add <2 x i64>
// CHECK-PPC: error: call to 'vec_add' is ambiguous		// CHECK-PPC: error: call to 'vec_add' is ambiguous

/* vec_mergee */		/* vec_mergee */
res_vbi = vec_mergee(vbi, vbi);		res_vbi = vec_mergee(vbi, vbi);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

res_vi = vec_mergee(vi, vi);		res_vsi = vec_mergee(vsi, vsi);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

res_vui = vec_mergee(vui, vui);		res_vui = vec_mergee(vui, vui);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm
// CHECK-PPC: warning: implicit declaration of function 'vec_mergee'		// CHECK-PPC: warning: implicit declaration of function 'vec_mergee'

/* vec_mergeo */		/* vec_mergeo */
res_vbi = vec_mergeo(vbi, vbi);		res_vbi = vec_mergeo(vbi, vbi);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

res_vi = vec_mergeo(vi, vi);		res_vsi = vec_mergeo(vsi, vsi);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm

res_vui = vec_mergeo(vui, vui);		res_vui = vec_mergeo(vui, vui);
// CHECK: @llvm.ppc.altivec.vperm		// CHECK: @llvm.ppc.altivec.vperm
// CHECK-LE: @llvm.ppc.altivec.vperm		// CHECK-LE: @llvm.ppc.altivec.vperm
// CHECK-PPC: warning: implicit declaration of function 'vec_mergeo'		// CHECK-PPC: warning: implicit declaration of function 'vec_mergeo'

▲ Show 20 Lines • Show All 47 Lines • ▼ Show 20 Lines
// CHECK-LE: call <2 x i64> @llvm.ppc.altivec.vcmpgtsd(<2 x i64> %{{[0-9]}}, <2 x i64> %{{[0-9]}})		// CHECK-LE: call <2 x i64> @llvm.ppc.altivec.vcmpgtsd(<2 x i64> %{{[0-9]}}, <2 x i64> %{{[0-9]}})
// CHECK-PPC: error: call to 'vec_cmplt' is ambiguous		// CHECK-PPC: error: call to 'vec_cmplt' is ambiguous

res_vbll = vec_cmplt(vull, vull);		res_vbll = vec_cmplt(vull, vull);
// CHECK: call <2 x i64> @llvm.ppc.altivec.vcmpgtud(<2 x i64> %{{[0-9]}}, <2 x i64> %{{[0-9]}})		// CHECK: call <2 x i64> @llvm.ppc.altivec.vcmpgtud(<2 x i64> %{{[0-9]}}, <2 x i64> %{{[0-9]}})
// CHECK-LE: call <2 x i64> @llvm.ppc.altivec.vcmpgtud(<2 x i64> %{{[0-9]}}, <2 x i64> %{{[0-9]}})		// CHECK-LE: call <2 x i64> @llvm.ppc.altivec.vcmpgtud(<2 x i64> %{{[0-9]}}, <2 x i64> %{{[0-9]}})
// CHECK-PPC: error: call to 'vec_cmplt' is ambiguous		// CHECK-PPC: error: call to 'vec_cmplt' is ambiguous

		/* vec_eqv */
		res_vsc = vec_eqv(vsc, vsc);
		// CHECK: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-LE: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-PPC: error: assigning to

		res_vsc = vec_eqv(vbc, vsc);
		// CHECK: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-LE: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-PPC: error: assigning to

		res_vsc = vec_eqv(vsc, vbc);
		// CHECK: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-LE: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-PPC: error: assigning to

		res_vuc = vec_eqv(vuc, vuc);
		// CHECK: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-LE: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-PPC: error: assigning to

		res_vuc = vec_eqv(vbc, vuc);
		// CHECK: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-LE: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-PPC: error: assigning to

		res_vuc = vec_eqv(vuc, vbc);
		// CHECK: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-LE: [[T1:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <16 x i8> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <16 x i8>
		// CHECK-PPC: error: assigning to

		res_vss = vec_eqv(vss, vss);
		// CHECK: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-LE: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-PPC: error: assigning to

		res_vss = vec_eqv(vbs, vss);
		// CHECK: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-LE: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-PPC: error: assigning to

		res_vss = vec_eqv(vss, vbs);
		// CHECK: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-LE: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-PPC: error: assigning to

		res_vus = vec_eqv(vus, vus);
		// CHECK: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-LE: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-PPC: error: assigning to

		res_vus = vec_eqv(vbs, vus);
		// CHECK: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-LE: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-PPC: error: assigning to

		res_vus = vec_eqv(vus, vbs);
		// CHECK: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-LE: [[T1:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <8 x i16> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <8 x i16>
		// CHECK-PPC: error: assigning to

		res_vsi = vec_eqv(vsi, vsi);
		// CHECK: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-PPC: error: assigning to

		res_vsi = vec_eqv(vbi, vsi);
		// CHECK: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-PPC: error: assigning to

		res_vsi = vec_eqv(vsi, vbi);
		// CHECK: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-PPC: error: assigning to

		res_vui = vec_eqv(vui, vui);
		// CHECK: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-PPC: error: assigning to

		res_vui = vec_eqv(vbi, vui);
		// CHECK: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-PPC: error: assigning to

		res_vui = vec_eqv(vui, vbi);
		// CHECK: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.*}}, <4 x i32> {{.+}})
		// CHECK-PPC: error: assigning to

		res_vsll = vec_eqv(vsll, vsll);
		// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-PPC: error: assigning to

		res_vsll = vec_eqv(vbll, vsll);
		// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-PPC: error: assigning to

		res_vsll = vec_eqv(vsll, vbll);
		// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-PPC: error: assigning to

		res_vull = vec_eqv(vull, vull);
		// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-PPC: error: assigning to

		res_vull = vec_eqv(vbll, vull);
		// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-PPC: error: assigning to

		res_vull = vec_eqv(vull, vbll);
		// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <2 x i64>
		// CHECK-PPC: error: assigning to

		res_vf = vec_eqv(vfa, vfa);
		// CHECK: [[T1:%.+]] = bitcast <4 x float> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <4 x float> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <4 x float>
		// CHECK-LE: [[T1:%.+]] = bitcast <4 x float> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <4 x float> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <4 x float>
		// CHECK-PPC: error: assigning to

		res_vf = vec_eqv(vbi, vfa);
		// CHECK: [[T2:%.+]] = bitcast <4 x float> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.+}}, <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <4 x float>
		// CHECK-LE: [[T2:%.+]] = bitcast <4 x float> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.+}}, <4 x i32> [[T2]])
		// CHECK-PPC: error: assigning to

		res_vf = vec_eqv(vfa, vbi);
		// CHECK: [[T1:%.+]] = bitcast <4 x float> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32>
		// CHECK: bitcast <4 x i32> [[T3]] to <4 x float>
		// CHECK-LE: [[T1:%.+]] = bitcast <4 x float> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32>
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <4 x float>
		// CHECK-PPC: error: assigning to

		res_vd = vec_eqv(vda, vda);
		// CHECK: [[T1:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
		// CHECK: [[T2:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <2 x double>
		// CHECK-LE: [[T1:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
		// CHECK-LE: [[T2:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <2 x double>
		// CHECK-PPC: error: assigning to

		res_vd = vec_eqv(vbll, vda);
		// CHECK: [[T2:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.+}}, <4 x i32> [[T2]])
		// CHECK: bitcast <4 x i32> [[T3]] to <2 x double>
		// CHECK-LE: [[T2:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> {{.+}}, <4 x i32> [[T2]])
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <2 x double>
		// CHECK-PPC: error: assigning to

		res_vd = vec_eqv(vda, vbll);
		// CHECK: [[T1:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
		// CHECK: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32>
		// CHECK: bitcast <4 x i32> [[T3]] to <2 x double>
		// CHECK-LE: [[T1:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
		// CHECK-LE: [[T3:%.+]] = call <4 x i32> @llvm.ppc.vsx.xxleqv(<4 x i32> [[T1]], <4 x i32>
		// CHECK-LE: bitcast <4 x i32> [[T3]] to <2 x double>
		// CHECK-PPC: error: assigning to

/* ----------------------- predicates --------------------------- */		/* ----------------------- predicates --------------------------- */
/* vec_all_eq */		/* vec_all_eq */
res_i = vec_all_eq(vsll, vsll);		res_i = vec_all_eq(vsll, vsll);
// CHECK: @llvm.ppc.altivec.vcmpequd.p		// CHECK: @llvm.ppc.altivec.vcmpequd.p
// CHECK-LE: @llvm.ppc.altivec.vcmpequd.p		// CHECK-LE: @llvm.ppc.altivec.vcmpequd.p
// CHECK-PPC: error: call to 'vec_all_eq' is ambiguous		// CHECK-PPC: error: call to 'vec_all_eq' is ambiguous

res_i = vec_all_eq(vsll, vbll);		res_i = vec_all_eq(vsll, vbll);
▲ Show 20 Lines • Show All 480 Lines • ▼ Show 20 Lines
// CHECK-PPC: error: call to 'vec_min' is ambiguous		// CHECK-PPC: error: call to 'vec_min' is ambiguous

res_vull = vec_min(vull, vbll);		res_vull = vec_min(vull, vbll);
// CHECK: @llvm.ppc.altivec.vminud		// CHECK: @llvm.ppc.altivec.vminud
// CHECK-LE: @llvm.ppc.altivec.vminud		// CHECK-LE: @llvm.ppc.altivec.vminud
// CHECK-PPC: error: call to 'vec_min' is ambiguous		// CHECK-PPC: error: call to 'vec_min' is ambiguous

/* vec_mule */		/* vec_mule */
res_vsll = vec_mule(vi, vi);		res_vsll = vec_mule(vsi, vsi);
// CHECK: @llvm.ppc.altivec.vmulesw		// CHECK: @llvm.ppc.altivec.vmulesw
// CHECK-LE: @llvm.ppc.altivec.vmulosw		// CHECK-LE: @llvm.ppc.altivec.vmulosw
// CHECK-PPC: error: call to 'vec_mule' is ambiguous		// CHECK-PPC: error: call to 'vec_mule' is ambiguous

res_vull = vec_mule(vui , vui);		res_vull = vec_mule(vui , vui);
// CHECK: @llvm.ppc.altivec.vmuleuw		// CHECK: @llvm.ppc.altivec.vmuleuw
// CHECK-LE: @llvm.ppc.altivec.vmulouw		// CHECK-LE: @llvm.ppc.altivec.vmulouw
// CHECK-PPC: error: call to 'vec_mule' is ambiguous		// CHECK-PPC: error: call to 'vec_mule' is ambiguous

/* vec_mulo */		/* vec_mulo */
res_vsll = vec_mulo(vi, vi);		res_vsll = vec_mulo(vsi, vsi);
// CHECK: @llvm.ppc.altivec.vmulosw		// CHECK: @llvm.ppc.altivec.vmulosw
// CHECK-LE: @llvm.ppc.altivec.vmulesw		// CHECK-LE: @llvm.ppc.altivec.vmulesw
// CHECK-PPC: error: call to 'vec_mulo' is ambiguous		// CHECK-PPC: error: call to 'vec_mulo' is ambiguous

res_vull = vec_mulo(vui, vui);		res_vull = vec_mulo(vui, vui);
// CHECK: @llvm.ppc.altivec.vmulouw		// CHECK: @llvm.ppc.altivec.vmulouw
// CHECK-LE: @llvm.ppc.altivec.vmuleuw		// CHECK-LE: @llvm.ppc.altivec.vmuleuw
// CHECK-PPC: error: call to 'vec_mulo' is ambiguous		// CHECK-PPC: error: call to 'vec_mulo' is ambiguous

/* vec_packs */		/* vec_packs */
res_vi = vec_packs(vsll, vsll);		res_vsi = vec_packs(vsll, vsll);
// CHECK: @llvm.ppc.altivec.vpksdss		// CHECK: @llvm.ppc.altivec.vpksdss
// CHECK-LE: @llvm.ppc.altivec.vpksdss		// CHECK-LE: @llvm.ppc.altivec.vpksdss
// CHECK-PPC: error: call to 'vec_packs' is ambiguous		// CHECK-PPC: error: call to 'vec_packs' is ambiguous

res_vui = vec_packs(vull, vull);		res_vui = vec_packs(vull, vull);
// CHECK: @llvm.ppc.altivec.vpkudus		// CHECK: @llvm.ppc.altivec.vpkudus
// CHECK-LE: @llvm.ppc.altivec.vpkudus		// CHECK-LE: @llvm.ppc.altivec.vpkudus
// CHECK-PPC: error: call to 'vec_packs' is ambiguous		// CHECK-PPC: error: call to 'vec_packs' is ambiguous
Show All 28 Lines	// CHECK-PPC: error: call to 'vec_sl' is ambiguous

res_vull = vec_sl(vull, vull);		res_vull = vec_sl(vull, vull);
// CHECK: shl <2 x i64>		// CHECK: shl <2 x i64>
// CHECK-LE: shl <2 x i64>		// CHECK-LE: shl <2 x i64>
// CHECK-PPC: error: call to 'vec_sl' is ambiguous		// CHECK-PPC: error: call to 'vec_sl' is ambiguous

/* vec_sr */		/* vec_sr */
res_vsll = vec_sr(vsll, vull);		res_vsll = vec_sr(vsll, vull);
// CHECK: ashr <2 x i64>		// CHECK: lshr <2 x i64>
// CHECK-LE: ashr <2 x i64>		// CHECK-LE: lshr <2 x i64>
// CHECK-PPC: error: call to 'vec_sr' is ambiguous		// CHECK-PPC: error: call to 'vec_sr' is ambiguous
		wschmidt (inline comment; unsubmitted, not done): This will probably change back per my earlier comment.
		nemanjai (author; inline comment; unsubmitted, not done): If we indeed want logical shifts for vec_sr, then this should not change back.

res_vull = vec_sr(vull, vull);		res_vull = vec_sr(vull, vull);
// CHECK: lshr <2 x i64>		// CHECK: lshr <2 x i64>
// CHECK-LE: lshr <2 x i64>		// CHECK-LE: lshr <2 x i64>
// CHECK-PPC: error: call to 'vec_sr' is ambiguous		// CHECK-PPC: error: call to 'vec_sr' is ambiguous

/* vec_sra */		/* vec_sra */
res_vsll = vec_sra(vsll, vull);		res_vsll = vec_sra(vsll, vull);
// CHECK: ashr <2 x i64>		// CHECK: ashr <2 x i64>
// CHECK-LE: ashr <2 x i64>		// CHECK-LE: ashr <2 x i64>
// CHECK-PPC: error: call to 'vec_sra' is ambiguous		// CHECK-PPC: error: call to 'vec_sra' is ambiguous

res_vull = vec_sra(vull, vull);		res_vull = vec_sra(vull, vull);
// CHECK: ashr <2 x i64>		// CHECK: ashr <2 x i64>
// CHECK-LE: ashr <2 x i64>		// CHECK-LE: ashr <2 x i64>
// CHECK-PPC: error: call to 'vec_sra' is ambiguous		// CHECK-PPC: error: call to 'vec_sra' is ambiguous

/* vec_unpackh */		/* vec_unpackh */
res_vsll = vec_unpackh(vi);		res_vsll = vec_unpackh(vsi);
// CHECK: llvm.ppc.altivec.vupkhsw		// CHECK: llvm.ppc.altivec.vupkhsw
// CHECK-LE: llvm.ppc.altivec.vupklsw		// CHECK-LE: llvm.ppc.altivec.vupklsw
// CHECK-PPC: error: call to 'vec_unpackh' is ambiguous		// CHECK-PPC: error: call to 'vec_unpackh' is ambiguous

res_vbll = vec_unpackh(vbi);		res_vbll = vec_unpackh(vbi);
// CHECK: llvm.ppc.altivec.vupkhsw		// CHECK: llvm.ppc.altivec.vupkhsw
// CHECK-LE: llvm.ppc.altivec.vupklsw		// CHECK-LE: llvm.ppc.altivec.vupklsw
// CHECK-PPC: error: call to 'vec_unpackh' is ambiguous		// CHECK-PPC: error: call to 'vec_unpackh' is ambiguous

/* vec_unpackl */		/* vec_unpackl */
res_vsll = vec_unpackl(vi);		res_vsll = vec_unpackl(vsi);
// CHECK: llvm.ppc.altivec.vupklsw		// CHECK: llvm.ppc.altivec.vupklsw
// CHECK-LE: llvm.ppc.altivec.vupkhsw		// CHECK-LE: llvm.ppc.altivec.vupkhsw
// CHECK-PPC: error: call to 'vec_unpackl' is ambiguous		// CHECK-PPC: error: call to 'vec_unpackl' is ambiguous

res_vbll = vec_unpackl(vbi);		res_vbll = vec_unpackl(vbi);
// CHECK: llvm.ppc.altivec.vupklsw		// CHECK: llvm.ppc.altivec.vupklsw
// CHECK-LE: llvm.ppc.altivec.vupkhsw		// CHECK-LE: llvm.ppc.altivec.vupkhsw
// CHECK-PPC: error: call to 'vec_unpackl' is ambiguous		// CHECK-PPC: error: call to 'vec_unpackl' is ambiguous

/* vec_vpksdss */		/* vec_vpksdss */
res_vi = vec_vpksdss(vsll, vsll);		res_vsi = vec_vpksdss(vsll, vsll);
// CHECK: llvm.ppc.altivec.vpksdss		// CHECK: llvm.ppc.altivec.vpksdss
// CHECK-LE: llvm.ppc.altivec.vpksdss		// CHECK-LE: llvm.ppc.altivec.vpksdss
// CHECK-PPC: warning: implicit declaration of function 'vec_vpksdss'		// CHECK-PPC: warning: implicit declaration of function 'vec_vpksdss'

/* vec_vpksdus */		/* vec_vpksdus */
res_vui = vec_vpksdus(vsll, vsll);		res_vui = vec_vpksdus(vsll, vsll);
// CHECK: llvm.ppc.altivec.vpksdus		// CHECK: llvm.ppc.altivec.vpksdus
// CHECK-LE: llvm.ppc.altivec.vpksdus		// CHECK-LE: llvm.ppc.altivec.vpksdus
// CHECK-PPC: warning: implicit declaration of function 'vec_vpksdus'		// CHECK-PPC: warning: implicit declaration of function 'vec_vpksdus'

/* vec_vpkudum */		/* vec_vpkudum */
res_vi = vec_vpkudum(vsll, vsll);		res_vsi = vec_vpkudum(vsll, vsll);
// CHECK: vperm		// CHECK: vperm
// CHECK-LE: vperm		// CHECK-LE: vperm
// CHECK-PPC: warning: implicit declaration of function 'vec_vpkudum'		// CHECK-PPC: warning: implicit declaration of function 'vec_vpkudum'

res_vui = vec_vpkudum(vull, vull);		res_vui = vec_vpkudum(vull, vull);
// CHECK: vperm		// CHECK: vperm
// CHECK-LE: vperm		// CHECK-LE: vperm

res_vui = vec_vpkudus(vull, vull);		res_vui = vec_vpkudus(vull, vull);
// CHECK: llvm.ppc.altivec.vpkudus		// CHECK: llvm.ppc.altivec.vpkudus
// CHECK-LE: llvm.ppc.altivec.vpkudus		// CHECK-LE: llvm.ppc.altivec.vpkudus
// CHECK-PPC: warning: implicit declaration of function 'vec_vpkudus'		// CHECK-PPC: warning: implicit declaration of function 'vec_vpkudus'

/* vec_vupkhsw */		/* vec_vupkhsw */
res_vsll = vec_vupkhsw(vi);		res_vsll = vec_vupkhsw(vsi);
// CHECK: llvm.ppc.altivec.vupkhsw		// CHECK: llvm.ppc.altivec.vupkhsw
// CHECK-LE: llvm.ppc.altivec.vupklsw		// CHECK-LE: llvm.ppc.altivec.vupklsw
// CHECK-PPC: warning: implicit declaration of function 'vec_vupkhsw'		// CHECK-PPC: warning: implicit declaration of function 'vec_vupkhsw'

res_vbll = vec_vupkhsw(vbi);		res_vbll = vec_vupkhsw(vbi);
// CHECK: llvm.ppc.altivec.vupkhsw		// CHECK: llvm.ppc.altivec.vupkhsw
// CHECK-LE: llvm.ppc.altivec.vupklsw		// CHECK-LE: llvm.ppc.altivec.vupklsw

/* vec_vupklsw */		/* vec_vupklsw */
res_vsll = vec_vupklsw(vi);		res_vsll = vec_vupklsw(vsi);
// CHECK: llvm.ppc.altivec.vupklsw		// CHECK: llvm.ppc.altivec.vupklsw
// CHECK-LE: llvm.ppc.altivec.vupkhsw		// CHECK-LE: llvm.ppc.altivec.vupkhsw
// CHECK-PPC: warning: implicit declaration of function 'vec_vupklsw'		// CHECK-PPC: warning: implicit declaration of function 'vec_vupklsw'

res_vbll = vec_vupklsw(vbi);		res_vbll = vec_vupklsw(vbi);
// CHECK: llvm.ppc.altivec.vupklsw		// CHECK: llvm.ppc.altivec.vupklsw
// CHECK-LE: llvm.ppc.altivec.vupkhsw		// CHECK-LE: llvm.ppc.altivec.vupkhsw

[62 lines of context collapsed by the diff viewer]

test/CodeGen/builtins-ppc-vsx.c

	// REQUIRES: powerpc-registered-target			// REQUIRES: powerpc-registered-target
	// RUN: %clang_cc1 -faltivec -target-feature +vsx -triple powerpc64-unknown-unknown -emit-llvm %s -o - | FileCheck %s			// RUN: %clang_cc1 -faltivec -target-feature +vsx -triple powerpc64-unknown-unknown -emit-llvm %s -o - | FileCheck %s
	// RUN: %clang_cc1 -faltivec -target-feature +vsx -triple powerpc64le-unknown-unknown -emit-llvm %s -o - | FileCheck %s			// RUN: %clang_cc1 -faltivec -target-feature +vsx -triple powerpc64le-unknown-unknown -emit-llvm %s -o - | FileCheck %s -check-prefix=CHECK-LE

	vector unsigned char vuc = { 8, 9, 10, 11, 12, 13, 14, 15,			vector unsigned char vuc = { 8, 9, 10, 11, 12, 13, 14, 15,
	0, 1, 2, 3, 4, 5, 6, 7};			0, 1, 2, 3, 4, 5, 6, 7};
	vector float vf = { -1.5, 2.5, -3.5, 4.5 };			vector float vf = { -1.5, 2.5, -3.5, 4.5 };
	vector double vd = { 3.5, -7.5 };			vector double vd = { 3.5, -7.5 };
	vector signed int vsi = { -1, 2, -3, 4 };			vector signed int vsi = { -1, 2, -3, 4 };
	vector unsigned int vui = { 0, 1, 2, 3 };			vector unsigned int vui = { 0, 1, 2, 3 };
	vector bool long long vbll = { 1, 0 };			vector bool long long vbll = { 1, 0 };
	[10 lines of context collapsed by the diff viewer]
	vector signed long long res_vsll;			vector signed long long res_vsll;
	vector unsigned long long res_vull;			vector unsigned long long res_vull;
	double res_d;			double res_d;

	void dummy() { }			void dummy() { }

	void test1() {			void test1() {
	// CHECK-LABEL: define void @test1			// CHECK-LABEL: define void @test1
				// CHECK-LE-LABEL: define void @test1

	res_vd = vec_add(vd, vd);			res_vd = vec_add(vd, vd);
	// CHECK: fadd <2 x double>			// CHECK: fadd <2 x double>
				// CHECK-LE: fadd <2 x double>

	res_vd = vec_and(vbll, vd);			res_vd = vec_and(vbll, vd);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
	// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>			// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>
				// CHECK-LE: and <2 x i64>
				// CHECK-LE: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>

	res_vd = vec_and(vd, vbll);			res_vd = vec_and(vd, vbll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
	// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>			// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>
				// CHECK-LE: and <2 x i64>
				// CHECK-LE: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>

	res_vd = vec_and(vd, vd);			res_vd = vec_and(vd, vd);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
	// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>			// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>
				// CHECK-LE: and <2 x i64>
				// CHECK-LE: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>

	dummy();			dummy();
	// CHECK: call void @dummy()			// CHECK: call void @dummy()
				// CHECK-LE: call void @dummy()

	res_vd = vec_andc(vbll, vd);			res_vd = vec_andc(vbll, vd);
	// CHECK: bitcast <2 x double> %{{[0-9]*}} to <2 x i64>			// CHECK: bitcast <2 x double> %{{[0-9]*}} to <2 x i64>
	// CHECK: xor <2 x i64> %{{[0-9]*}}, <i64 -1, i64 -1>			// CHECK: xor <2 x i64> %{{[0-9]*}}, <i64 -1, i64 -1>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
	// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>			// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>
				// CHECK-LE: bitcast <2 x double> %{{[0-9]*}} to <2 x i64>
				// CHECK-LE: xor <2 x i64> %{{[0-9]*}}, <i64 -1, i64 -1>
				// CHECK-LE: and <2 x i64>
				// CHECK-LE: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>

	dummy();			dummy();
	// CHECK: call void @dummy()			// CHECK: call void @dummy()
				// CHECK-LE: call void @dummy()

	res_vd = vec_andc(vd, vbll);			res_vd = vec_andc(vd, vbll);
	// CHECK: bitcast <2 x double> %{{[0-9]*}} to <2 x i64>			// CHECK: bitcast <2 x double> %{{[0-9]*}} to <2 x i64>
	// CHECK: xor <2 x i64> %{{[0-9]*}}, <i64 -1, i64 -1>			// CHECK: xor <2 x i64> %{{[0-9]*}}, <i64 -1, i64 -1>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
	// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>			// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>
				// CHECK-LE: bitcast <2 x double> %{{[0-9]*}} to <2 x i64>
				// CHECK-LE: xor <2 x i64> %{{[0-9]*}}, <i64 -1, i64 -1>
				// CHECK-LE: and <2 x i64>
				// CHECK-LE: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>

	dummy();			dummy();
	// CHECK: call void @dummy()			// CHECK: call void @dummy()

	res_vd = vec_andc(vd, vd);			res_vd = vec_andc(vd, vd);
	// CHECK: bitcast <2 x double> %{{[0-9]*}} to <2 x i64>			// CHECK: bitcast <2 x double> %{{[0-9]*}} to <2 x i64>
	// CHECK: xor <2 x i64> %{{[0-9]*}}, <i64 -1, i64 -1>			// CHECK: xor <2 x i64> %{{[0-9]*}}, <i64 -1, i64 -1>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
	// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>			// CHECK: bitcast <2 x i64> %{{[0-9]*}} to <2 x double>

	dummy();			dummy();
	// CHECK: call void @dummy()			// CHECK: call void @dummy()
				// CHECK-LE: call void @dummy()

	res_vd = vec_ceil(vd);			res_vd = vec_ceil(vd);
	// CHECK: call <2 x double> @llvm.ceil.v2f64(<2 x double> %{{[0-9]*}})			// CHECK: call <2 x double> @llvm.ceil.v2f64(<2 x double> %{{[0-9]*}})
				// CHECK-LE: call <2 x double> @llvm.ceil.v2f64(<2 x double> %{{[0-9]*}})

	res_vf = vec_ceil(vf);			res_vf = vec_ceil(vf);
	// CHECK: call <4 x float> @llvm.ceil.v4f32(<4 x float> %{{[0-9]*}})			// CHECK: call <4 x float> @llvm.ceil.v4f32(<4 x float> %{{[0-9]*}})
				// CHECK-LE: call <4 x float> @llvm.ceil.v4f32(<4 x float> %{{[0-9]*}})

	res_vbll = vec_cmpeq(vd, vd);			res_vbll = vec_cmpeq(vd, vd);
	// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpeqdp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})			// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpeqdp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})
				// CHECK-LE: call <2 x i64> @llvm.ppc.vsx.xvcmpeqdp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})

	res_vbi = vec_cmpeq(vf, vf);			res_vbi = vec_cmpeq(vf, vf);
	// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpeqsp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})			// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpeqsp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})
				// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xvcmpeqsp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})

	res_vbll = vec_cmpge(vd, vd);			res_vbll = vec_cmpge(vd, vd);
	// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpgedp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})			// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpgedp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})
				// CHECK-LE: call <2 x i64> @llvm.ppc.vsx.xvcmpgedp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})

	res_vbi = vec_cmpge(vf, vf);			res_vbi = vec_cmpge(vf, vf);
	// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpgesp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})			// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpgesp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})
				// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xvcmpgesp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})

	res_vbll = vec_cmpgt(vd, vd);			res_vbll = vec_cmpgt(vd, vd);
	// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpgtdp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})			// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpgtdp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})
				// CHECK-LE: call <2 x i64> @llvm.ppc.vsx.xvcmpgtdp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})

	res_vbi = vec_cmpgt(vf, vf);			res_vbi = vec_cmpgt(vf, vf);
	// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpgtsp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})			// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpgtsp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})
				// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xvcmpgtsp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})

	res_vbll = vec_cmple(vd, vd);			res_vbll = vec_cmple(vd, vd);
	// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpgedp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})			// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpgedp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})
				// CHECK-LE: call <2 x i64> @llvm.ppc.vsx.xvcmpgedp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})

	res_vbi = vec_cmple(vf, vf);			res_vbi = vec_cmple(vf, vf);
	// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpgesp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})			// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpgesp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})
				// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xvcmpgesp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})

	res_vbll = vec_cmplt(vd, vd);			res_vbll = vec_cmplt(vd, vd);
	// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpgtdp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})			// CHECK: call <2 x i64> @llvm.ppc.vsx.xvcmpgtdp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})
				// CHECK-LE: call <2 x i64> @llvm.ppc.vsx.xvcmpgtdp(<2 x double> %{{[0-9]}}, <2 x double> %{{[0-9]}})

	res_vbi = vec_cmplt(vf, vf);			res_vbi = vec_cmplt(vf, vf);
	// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpgtsp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})			// CHECK: call <4 x i32> @llvm.ppc.vsx.xvcmpgtsp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})
				// CHECK-LE: call <4 x i32> @llvm.ppc.vsx.xvcmpgtsp(<4 x float> %{{[0-9]}}, <4 x float> %{{[0-9]}})

	/* vec_div */			/* vec_div */
	res_vf = vec_div(vf, vf);			res_vf = vec_div(vf, vf);
	// CHECK: @llvm.ppc.vsx.xvdivsp			// CHECK: @llvm.ppc.vsx.xvdivsp
				// CHECK-LE: @llvm.ppc.vsx.xvdivsp

	res_vd = vec_div(vd, vd);			res_vd = vec_div(vd, vd);
	// CHECK: @llvm.ppc.vsx.xvdivdp			// CHECK: @llvm.ppc.vsx.xvdivdp
				// CHECK-LE: @llvm.ppc.vsx.xvdivdp

	/* vec_max */			/* vec_max */
	res_vf = vec_max(vf, vf);			res_vf = vec_max(vf, vf);
	// CHECK: @llvm.ppc.vsx.xvmaxsp			// CHECK: @llvm.ppc.vsx.xvmaxsp
				// CHECK-LE: @llvm.ppc.vsx.xvmaxsp

	res_vd = vec_max(vd, vd);			res_vd = vec_max(vd, vd);
	// CHECK: @llvm.ppc.vsx.xvmaxdp			// CHECK: @llvm.ppc.vsx.xvmaxdp
				// CHECK-LE: @llvm.ppc.vsx.xvmaxdp

	res_vf = vec_vmaxfp(vf, vf);			res_vf = vec_vmaxfp(vf, vf);
	// CHECK: @llvm.ppc.vsx.xvmaxsp			// CHECK: @llvm.ppc.vsx.xvmaxsp
				// CHECK-LE: @llvm.ppc.vsx.xvmaxsp

	/* vec_min */			/* vec_min */
	res_vf = vec_min(vf, vf);			res_vf = vec_min(vf, vf);
	// CHECK: @llvm.ppc.vsx.xvminsp			// CHECK: @llvm.ppc.vsx.xvminsp
				// CHECK-LE: @llvm.ppc.vsx.xvminsp

	res_vd = vec_min(vd, vd);			res_vd = vec_min(vd, vd);
	// CHECK: @llvm.ppc.vsx.xvmindp			// CHECK: @llvm.ppc.vsx.xvmindp
				// CHECK-LE: @llvm.ppc.vsx.xvmindp

	res_vf = vec_vminfp(vf, vf);			res_vf = vec_vminfp(vf, vf);
	// CHECK: @llvm.ppc.vsx.xvminsp			// CHECK: @llvm.ppc.vsx.xvminsp
				// CHECK-LE: @llvm.ppc.vsx.xvminsp

	res_d = __builtin_vsx_xsmaxdp(d, d);			res_d = __builtin_vsx_xsmaxdp(d, d);
	// CHECK: @llvm.ppc.vsx.xsmaxdp			// CHECK: @llvm.ppc.vsx.xsmaxdp
				// CHECK-LE: @llvm.ppc.vsx.xsmaxdp

	res_d = __builtin_vsx_xsmindp(d, d);			res_d = __builtin_vsx_xsmindp(d, d);
	// CHECK: @llvm.ppc.vsx.xsmindp			// CHECK: @llvm.ppc.vsx.xsmindp
				// CHECK-LE: @llvm.ppc.vsx.xsmindp

	/* vec_perm */			/* vec_perm */
	res_vsll = vec_perm(vsll, vsll, vuc);			res_vsll = vec_perm(vsll, vsll, vuc);
	// CHECK: @llvm.ppc.altivec.vperm			// CHECK: @llvm.ppc.altivec.vperm
				// CHECK-LE: @llvm.ppc.altivec.vperm

	res_vull = vec_perm(vull, vull, vuc);			res_vull = vec_perm(vull, vull, vuc);
	// CHECK: @llvm.ppc.altivec.vperm			// CHECK: @llvm.ppc.altivec.vperm
				// CHECK-LE: @llvm.ppc.altivec.vperm

				res_vbll = vec_perm(vbll, vbll, vuc);
				// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>
				// CHECK-LE: xor <16 x i8>
				// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK-LE: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>

				res_vf = vec_round(vf);
				// CHECK: call <4 x float> @llvm.round.v4f32(<4 x float>
				// CHECK-LE: call <4 x float> @llvm.round.v4f32(<4 x float>

				res_vd = vec_round(vd);
				// CHECK: call <2 x double> @llvm.round.v2f64(<2 x double>
				// CHECK-LE: call <2 x double> @llvm.round.v2f64(<2 x double>

	res_vd = vec_perm(vd, vd, vuc);			res_vd = vec_perm(vd, vd, vuc);
	// CHECK: @llvm.ppc.altivec.vperm			// CHECK: @llvm.ppc.altivec.vperm
				// CHECK-LE: @llvm.ppc.altivec.vperm

				res_vd = vec_splat(vd, 1);
				// CHECK: [[T1:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
				// CHECK: [[T2:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
				// CHECK: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>
				// CHECK-LE: xor <16 x i8>
				// CHECK-LE: [[T1:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
				// CHECK-LE: [[T2:%.+]] = bitcast <2 x double> {{.+}} to <4 x i32>
				// CHECK-LE: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>

				res_vbll = vec_splat(vbll, 1);
				// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>
				// CHECK-LE: xor <16 x i8>
				// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK-LE: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>

				res_vsll = vec_splat(vsll, 1);
				// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>
				// CHECK-LE: xor <16 x i8>
				// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK-LE: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>

				res_vull = vec_splat(vull, 1);
				// CHECK: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>
				// CHECK-LE: xor <16 x i8>
				// CHECK-LE: [[T1:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK-LE: [[T2:%.+]] = bitcast <2 x i64> {{.+}} to <4 x i32>
				// CHECK-LE: call <4 x i32> @llvm.ppc.altivec.vperm(<4 x i32> [[T1]], <4 x i32> [[T2]], <16 x i8>

	res_vsll = vec_vperm(vsll, vsll, vuc);			res_vsll = vec_vperm(vsll, vsll, vuc);
	// CHECK: @llvm.ppc.altivec.vperm			// CHECK: @llvm.ppc.altivec.vperm
				// CHECK-LE: @llvm.ppc.altivec.vperm

	res_vull = vec_vperm(vull, vull, vuc);			res_vull = vec_vperm(vull, vull, vuc);
	// CHECK: @llvm.ppc.altivec.vperm			// CHECK: @llvm.ppc.altivec.vperm
				// CHECK-LE: @llvm.ppc.altivec.vperm

	res_vd = vec_vperm(vd, vd, vuc);			res_vd = vec_vperm(vd, vd, vuc);
	// CHECK: @llvm.ppc.altivec.vperm			// CHECK: @llvm.ppc.altivec.vperm
				// CHECK-LE: @llvm.ppc.altivec.vperm

	/* vec_vsx_ld */			/* vec_vsx_ld */

	res_vsi = vec_vsx_ld(0, &vsi);			res_vsi = vec_vsx_ld(0, &vsi);
	// CHECK: @llvm.ppc.vsx.lxvw4x			// CHECK: @llvm.ppc.vsx.lxvw4x
				// CHECK-LE: @llvm.ppc.vsx.lxvw4x

	res_vui = vec_vsx_ld(0, &vui);			res_vui = vec_vsx_ld(0, &vui);
	// CHECK: @llvm.ppc.vsx.lxvw4x			// CHECK: @llvm.ppc.vsx.lxvw4x
				// CHECK-LE: @llvm.ppc.vsx.lxvw4x

	res_vf = vec_vsx_ld (0, &vf);			res_vf = vec_vsx_ld (0, &vf);
	// CHECK: @llvm.ppc.vsx.lxvw4x			// CHECK: @llvm.ppc.vsx.lxvw4x
				// CHECK-LE: @llvm.ppc.vsx.lxvw4x

	res_vsll = vec_vsx_ld(0, &vsll);			res_vsll = vec_vsx_ld(0, &vsll);
	// CHECK: @llvm.ppc.vsx.lxvd2x			// CHECK: @llvm.ppc.vsx.lxvd2x
				// CHECK-LE: @llvm.ppc.vsx.lxvd2x

	res_vull = vec_vsx_ld(0, &vull);			res_vull = vec_vsx_ld(0, &vull);
	// CHECK: @llvm.ppc.vsx.lxvd2x			// CHECK: @llvm.ppc.vsx.lxvd2x
				// CHECK-LE: @llvm.ppc.vsx.lxvd2x

	res_vd = vec_vsx_ld(0, &vd);			res_vd = vec_vsx_ld(0, &vd);
	// CHECK: @llvm.ppc.vsx.lxvd2x			// CHECK: @llvm.ppc.vsx.lxvd2x
				// CHECK-LE: @llvm.ppc.vsx.lxvd2x

	/* vec_vsx_st */			/* vec_vsx_st */

	vec_vsx_st(vsi, 0, &res_vsi);			vec_vsx_st(vsi, 0, &res_vsi);
	// CHECK: @llvm.ppc.vsx.stxvw4x			// CHECK: @llvm.ppc.vsx.stxvw4x
				// CHECK-LE: @llvm.ppc.vsx.stxvw4x

	vec_vsx_st(vui, 0, &res_vui);			vec_vsx_st(vui, 0, &res_vui);
	// CHECK: @llvm.ppc.vsx.stxvw4x			// CHECK: @llvm.ppc.vsx.stxvw4x
				// CHECK-LE: @llvm.ppc.vsx.stxvw4x

	vec_vsx_st(vf, 0, &res_vf);			vec_vsx_st(vf, 0, &res_vf);
	// CHECK: @llvm.ppc.vsx.stxvw4x			// CHECK: @llvm.ppc.vsx.stxvw4x
				// CHECK-LE: @llvm.ppc.vsx.stxvw4x

	vec_vsx_st(vsll, 0, &res_vsll);			vec_vsx_st(vsll, 0, &res_vsll);
	// CHECK: @llvm.ppc.vsx.stxvd2x			// CHECK: @llvm.ppc.vsx.stxvd2x
				// CHECK-LE: @llvm.ppc.vsx.stxvd2x

	vec_vsx_st(vull, 0, &res_vull);			vec_vsx_st(vull, 0, &res_vull);
	// CHECK: @llvm.ppc.vsx.stxvd2x			// CHECK: @llvm.ppc.vsx.stxvd2x
				// CHECK-LE: @llvm.ppc.vsx.stxvd2x

	vec_vsx_st(vd, 0, &res_vd);			vec_vsx_st(vd, 0, &res_vd);
	// CHECK: @llvm.ppc.vsx.stxvd2x			// CHECK: @llvm.ppc.vsx.stxvd2x
				// CHECK-LE: @llvm.ppc.vsx.stxvd2x

	/* vec_and */			/* vec_and */
	res_vsll = vec_and(vsll, vsll);			res_vsll = vec_and(vsll, vsll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vsll = vec_and(vbll, vsll);			res_vsll = vec_and(vbll, vsll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vsll = vec_and(vsll, vbll);			res_vsll = vec_and(vsll, vbll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vull = vec_and(vull, vull);			res_vull = vec_and(vull, vull);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vull = vec_and(vbll, vull);			res_vull = vec_and(vbll, vull);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vull = vec_and(vull, vbll);			res_vull = vec_and(vull, vbll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vbll = vec_and(vbll, vbll);			res_vbll = vec_and(vbll, vbll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	/* vec_vand */			/* vec_vand */
	res_vsll = vec_vand(vsll, vsll);			res_vsll = vec_vand(vsll, vsll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vsll = vec_vand(vbll, vsll);			res_vsll = vec_vand(vbll, vsll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vsll = vec_vand(vsll, vbll);			res_vsll = vec_vand(vsll, vbll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vull = vec_vand(vull, vull);			res_vull = vec_vand(vull, vull);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vull = vec_vand(vbll, vull);			res_vull = vec_vand(vbll, vull);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vull = vec_vand(vull, vbll);			res_vull = vec_vand(vull, vbll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vbll = vec_vand(vbll, vbll);			res_vbll = vec_vand(vbll, vbll);
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: and <2 x i64>

	/* vec_andc */			/* vec_andc */
	res_vsll = vec_andc(vsll, vsll);			res_vsll = vec_andc(vsll, vsll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: xor <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vsll = vec_andc(vbll, vsll);			res_vsll = vec_andc(vbll, vsll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: xor <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vsll = vec_andc(vsll, vbll);			res_vsll = vec_andc(vsll, vbll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: xor <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vull = vec_andc(vull, vull);			res_vull = vec_andc(vull, vull);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: xor <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vull = vec_andc(vbll, vull);			res_vull = vec_andc(vbll, vull);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: xor <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vull = vec_andc(vull, vbll);			res_vull = vec_andc(vull, vbll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: xor <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vbll = vec_andc(vbll, vbll);			res_vbll = vec_andc(vbll, vbll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
	// CHECK: and <2 x i64>			// CHECK: and <2 x i64>
				// CHECK-LE: xor <2 x i64>
				// CHECK-LE: and <2 x i64>

	res_vf = vec_floor(vf);			res_vf = vec_floor(vf);
	// CHECK: call <4 x float> @llvm.floor.v4f32(<4 x float> %{{[0-9]+}})			// CHECK: call <4 x float> @llvm.floor.v4f32(<4 x float> %{{[0-9]+}})
				// CHECK-LE: call <4 x float> @llvm.floor.v4f32(<4 x float> %{{[0-9]+}})

	res_vd = vec_floor(vd);			res_vd = vec_floor(vd);
	// CHECK: call <2 x double> @llvm.floor.v2f64(<2 x double> %{{[0-9]+}})			// CHECK: call <2 x double> @llvm.floor.v2f64(<2 x double> %{{[0-9]+}})
				// CHECK-LE: call <2 x double> @llvm.floor.v2f64(<2 x double> %{{[0-9]+}})

	res_vf = vec_madd(vf, vf, vf);			res_vf = vec_madd(vf, vf, vf);
	// CHECK: call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}})			// CHECK: call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}})
				// CHECK-LE: call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}})

	res_vd = vec_madd(vd, vd, vd);			res_vd = vec_madd(vd, vd, vd);
	// CHECK: call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}})			// CHECK: call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}})
				// CHECK-LE: call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}})

	res_vf = vec_msub(vf, vf, vf);			res_vf = vec_msub(vf, vf, vf);
	// CHECK: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %{{[0-9]+}}			// CHECK: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %{{[0-9]+}}
	// CHECK-NEXT: call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float>			// CHECK-NEXT: call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float>
				// CHECK-LE: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %{{[0-9]+}}
				// CHECK-LE-NEXT: call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float>

	res_vd = vec_msub(vd, vd, vd);			res_vd = vec_msub(vd, vd, vd);
	// CHECK: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %{{[0-9]+}}			// CHECK: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %{{[0-9]+}}
	// CHECK-NEXT: call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double>			// CHECK-NEXT: call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double>
				// CHECK-LE: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %{{[0-9]+}}
				// CHECK-LE-NEXT: call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double>

	res_vf = vec_mul(vf, vf);			res_vf = vec_mul(vf, vf);
	// CHECK: fmul <4 x float> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: fmul <4 x float> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE: fmul <4 x float> %{{[0-9]+}}, %{{[0-9]+}}

	res_vd = vec_mul(vd, vd);			res_vd = vec_mul(vd, vd);
	// CHECK: fmul <2 x double> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: fmul <2 x double> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE: fmul <2 x double> %{{[0-9]+}}, %{{[0-9]+}}

	res_vf = vec_nearbyint(vf);			res_vf = vec_nearbyint(vf);
	// CHECK: call <4 x float> @llvm.round.v4f32(<4 x float> %{{[0-9]+}})			// CHECK: call <4 x float> @llvm.round.v4f32(<4 x float> %{{[0-9]+}})
				// CHECK-LE: call <4 x float> @llvm.round.v4f32(<4 x float> %{{[0-9]+}})

	res_vd = vec_nearbyint(vd);			res_vd = vec_nearbyint(vd);
	// CHECK: call <2 x double> @llvm.round.v2f64(<2 x double> %{{[0-9]+}})			// CHECK: call <2 x double> @llvm.round.v2f64(<2 x double> %{{[0-9]+}})
				// CHECK-LE: call <2 x double> @llvm.round.v2f64(<2 x double> %{{[0-9]+}})

	res_vf = vec_nmadd(vf, vf, vf);			res_vf = vec_nmadd(vf, vf, vf);
	// CHECK: [[FM:[0-9]+]] = call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}})			// CHECK: [[FM:[0-9]+]] = call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}})
	// CHECK-NEXT: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %[[FM]]			// CHECK-NEXT: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %[[FM]]
				// CHECK-LE: [[FM:[0-9]+]] = call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}})
				// CHECK-LE-NEXT: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %[[FM]]

	res_vd = vec_nmadd(vd, vd, vd);			res_vd = vec_nmadd(vd, vd, vd);
	// CHECK: [[FM:[0-9]+]] = call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}})			// CHECK: [[FM:[0-9]+]] = call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}})
	// CHECK-NEXT: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %[[FM]]			// CHECK-NEXT: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %[[FM]]
				// CHECK-LE: [[FM:[0-9]+]] = call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}})
				// CHECK-LE-NEXT: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %[[FM]]

	res_vf = vec_nmsub(vf, vf, vf);			res_vf = vec_nmsub(vf, vf, vf);
	// CHECK: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %{{[0-9]+}}			// CHECK: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %{{[0-9]+}}
	// CHECK-NEXT: call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float>			// CHECK-NEXT: call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float>
	// CHECK: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %{{[0-9]+}}			// CHECK: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %{{[0-9]+}}
				// CHECK-LE: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %{{[0-9]+}}
				// CHECK-LE-NEXT: call <4 x float> @llvm.fma.v4f32(<4 x float> %{{[0-9]+}}, <4 x float> %{{[0-9]+}}, <4 x float>
				// CHECK-LE: fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %{{[0-9]+}}

	res_vd = vec_nmsub(vd, vd, vd);			res_vd = vec_nmsub(vd, vd, vd);
	// CHECK: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %{{[0-9]+}}			// CHECK: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %{{[0-9]+}}
	// CHECK-NEXT: [[FM:[0-9]+]] = call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double>			// CHECK-NEXT: [[FM:[0-9]+]] = call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double>
	// CHECK-NEXT: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %[[FM]]			// CHECK-NEXT: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %[[FM]]
				// CHECK-LE: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %{{[0-9]+}}
				// CHECK-LE-NEXT: [[FM:[0-9]+]] = call <2 x double> @llvm.fma.v2f64(<2 x double> %{{[0-9]+}}, <2 x double> %{{[0-9]+}}, <2 x double>
				// CHECK-LE-NEXT: fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %[[FM]]

	/* vec_nor */			/* vec_nor */
	res_vsll = vec_nor(vsll, vsll);			res_vsll = vec_nor(vsll, vsll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: or <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vull = vec_nor(vull, vull);			res_vull = vec_nor(vull, vull);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: or <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vull = vec_nor(vbll, vbll);			res_vull = vec_nor(vbll, vbll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: or <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vd = vec_nor(vd, vd);			res_vd = vec_nor(vd, vd);
	// CHECK: bitcast <2 x double> %{{[0-9]+}} to <2 x i64>			// CHECK: bitcast <2 x double> %{{[0-9]+}} to <2 x i64>
	// CHECK: [[OR:%.+]] = or <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: [[OR:%.+]] = or <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
	// CHECK-NEXT: xor <2 x i64> [[OR]], <i64 -1, i64 -1>			// CHECK-NEXT: xor <2 x i64> [[OR]], <i64 -1, i64 -1>
				// CHECK-LE: bitcast <2 x double> %{{[0-9]+}} to <2 x i64>
				// CHECK-LE: [[OR:%.+]] = or <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE-NEXT: xor <2 x i64> [[OR]], <i64 -1, i64 -1>

	/* vec_or */			/* vec_or */
	res_vsll = vec_or(vsll, vsll);			res_vsll = vec_or(vsll, vsll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vsll = vec_or(vbll, vsll);			res_vsll = vec_or(vbll, vsll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vsll = vec_or(vsll, vbll);			res_vsll = vec_or(vsll, vbll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vull = vec_or(vull, vull);			res_vull = vec_or(vull, vull);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vull = vec_or(vbll, vull);			res_vull = vec_or(vbll, vull);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vull = vec_or(vull, vbll);			res_vull = vec_or(vull, vbll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vbll = vec_or(vbll, vbll);			res_vbll = vec_or(vbll, vbll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vd = vec_or(vd, vd);			res_vd = vec_or(vd, vd);
	// CHECK: bitcast <2 x double> %{{[0-9]+}} to <2 x i64>			// CHECK: bitcast <2 x double> %{{[0-9]+}} to <2 x i64>
	// CHECK: or <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: or <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE: bitcast <2 x double> %{{[0-9]+}} to <2 x i64>
				// CHECK-LE: or <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}

	res_vf = vec_rint(vf);			res_vf = vec_rint(vf);
	// CHECK: call <4 x float> @llvm.nearbyint.v4f32(<4 x float> %{{[0-9]+}})			// CHECK: call <4 x float> @llvm.nearbyint.v4f32(<4 x float> %{{[0-9]+}})
				// CHECK-LE: call <4 x float> @llvm.nearbyint.v4f32(<4 x float> %{{[0-9]+}})

	res_vd = vec_rint(vd);			res_vd = vec_rint(vd);
	// CHECK: call <2 x double> @llvm.nearbyint.v2f64(<2 x double> %{{[0-9]+}})			// CHECK: call <2 x double> @llvm.nearbyint.v2f64(<2 x double> %{{[0-9]+}})
				// CHECK-LE: call <2 x double> @llvm.nearbyint.v2f64(<2 x double> %{{[0-9]+}})

	res_vf = vec_rsqrte(vf);			res_vf = vec_rsqrte(vf);
	// CHECK: call <4 x float> @llvm.ppc.vsx.xvrsqrtesp(<4 x float> %{{[0-9]+}})			// CHECK: call <4 x float> @llvm.ppc.vsx.xvrsqrtesp(<4 x float> %{{[0-9]+}})
				// CHECK-LE: call <4 x float> @llvm.ppc.vsx.xvrsqrtesp(<4 x float> %{{[0-9]+}})

	res_vd = vec_rsqrte(vd);			res_vd = vec_rsqrte(vd);
	// CHECK: call <2 x double> @llvm.ppc.vsx.xvrsqrtedp(<2 x double> %{{[0-9]+}})			// CHECK: call <2 x double> @llvm.ppc.vsx.xvrsqrtedp(<2 x double> %{{[0-9]+}})
				// CHECK-LE: call <2 x double> @llvm.ppc.vsx.xvrsqrtedp(<2 x double> %{{[0-9]+}})

	dummy();			dummy();
	// CHECK: call void @dummy()			// CHECK: call void @dummy()
				// CHECK-LE: call void @dummy()

	res_vf = vec_sel(vd, vd, vbll);			res_vf = vec_sel(vd, vd, vbll);
	// CHECK: xor <2 x i64> %{{[0-9]+}}, <i64 -1, i64 -1>			// CHECK: xor <2 x i64> %{{[0-9]+}}, <i64 -1, i64 -1>
	// CHECK: and <2 x i64> %{{[0-9]+}},			// CHECK: and <2 x i64> %{{[0-9]+}},
	// CHECK: and <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: and <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
	// CHECK: bitcast <2 x i64> %{{[0-9]+}} to <2 x double>			// CHECK: bitcast <2 x i64> %{{[0-9]+}} to <2 x double>
				// CHECK-LE: xor <2 x i64> %{{[0-9]+}}, <i64 -1, i64 -1>
				// CHECK-LE: and <2 x i64> %{{[0-9]+}},
				// CHECK-LE: and <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE: or <2 x i64>
				// CHECK-LE: bitcast <2 x i64> %{{[0-9]+}} to <2 x double>

	dummy();			dummy();
	// CHECK: call void @dummy()			// CHECK: call void @dummy()
				// CHECK-LE: call void @dummy()

	res_vd = vec_sel(vd, vd, vull);			res_vd = vec_sel(vd, vd, vull);
	// CHECK: xor <2 x i64> %{{[0-9]+}}, <i64 -1, i64 -1>			// CHECK: xor <2 x i64> %{{[0-9]+}}, <i64 -1, i64 -1>
	// CHECK: and <2 x i64> %{{[0-9]+}},			// CHECK: and <2 x i64> %{{[0-9]+}},
	// CHECK: and <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: and <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
	// CHECK: bitcast <2 x i64> %{{[0-9]+}} to <2 x double>			// CHECK: bitcast <2 x i64> %{{[0-9]+}} to <2 x double>
				// CHECK-LE: xor <2 x i64> %{{[0-9]+}}, <i64 -1, i64 -1>
				// CHECK-LE: and <2 x i64> %{{[0-9]+}},
				// CHECK-LE: and <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE: or <2 x i64>
				// CHECK-LE: bitcast <2 x i64> %{{[0-9]+}} to <2 x double>

	res_vf = vec_sqrt(vf);			res_vf = vec_sqrt(vf);
	// CHECK: call <4 x float> @llvm.sqrt.v4f32(<4 x float> %{{[0-9]+}})			// CHECK: call <4 x float> @llvm.sqrt.v4f32(<4 x float> %{{[0-9]+}})
				// CHECK-LE: call <4 x float> @llvm.sqrt.v4f32(<4 x float> %{{[0-9]+}})

	res_vd = vec_sqrt(vd);			res_vd = vec_sqrt(vd);
	// CHECK: call <2 x double> @llvm.sqrt.v2f64(<2 x double> %{{[0-9]+}})			// CHECK: call <2 x double> @llvm.sqrt.v2f64(<2 x double> %{{[0-9]+}})
				// CHECK-LE: call <2 x double> @llvm.sqrt.v2f64(<2 x double> %{{[0-9]+}})

	res_vd = vec_sub(vd, vd);			res_vd = vec_sub(vd, vd);
	// CHECK: fsub <2 x double> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: fsub <2 x double> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE: fsub <2 x double> %{{[0-9]+}}, %{{[0-9]+}}

	res_vf = vec_trunc(vf);			res_vf = vec_trunc(vf);
	// CHECK: call <4 x float> @llvm.trunc.v4f32(<4 x float> %{{[0-9]+}})			// CHECK: call <4 x float> @llvm.trunc.v4f32(<4 x float> %{{[0-9]+}})
				// CHECK-LE: call <4 x float> @llvm.trunc.v4f32(<4 x float> %{{[0-9]+}})

	res_vd = vec_trunc(vd);			res_vd = vec_trunc(vd);
	// CHECK: call <2 x double> @llvm.trunc.v2f64(<2 x double> %{{[0-9]+}})			// CHECK: call <2 x double> @llvm.trunc.v2f64(<2 x double> %{{[0-9]+}})
				// CHECK-LE: call <2 x double> @llvm.trunc.v2f64(<2 x double> %{{[0-9]+}})

	/* vec_vor */			/* vec_vor */
	res_vsll = vec_vor(vsll, vsll);			res_vsll = vec_vor(vsll, vsll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vsll = vec_vor(vbll, vsll);			res_vsll = vec_vor(vbll, vsll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vsll = vec_vor(vsll, vbll);			res_vsll = vec_vor(vsll, vbll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vull = vec_vor(vull, vull);			res_vull = vec_vor(vull, vull);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vull = vec_vor(vbll, vull);			res_vull = vec_vor(vbll, vull);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vull = vec_vor(vull, vbll);			res_vull = vec_vor(vull, vbll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	res_vbll = vec_vor(vbll, vbll);			res_vbll = vec_vor(vbll, vbll);
	// CHECK: or <2 x i64>			// CHECK: or <2 x i64>
				// CHECK-LE: or <2 x i64>

	/* vec_xor */			/* vec_xor */
	res_vsll = vec_xor(vsll, vsll);			res_vsll = vec_xor(vsll, vsll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vsll = vec_xor(vbll, vsll);			res_vsll = vec_xor(vbll, vsll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vsll = vec_xor(vsll, vbll);			res_vsll = vec_xor(vsll, vbll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vull = vec_xor(vull, vull);			res_vull = vec_xor(vull, vull);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vull = vec_xor(vbll, vull);			res_vull = vec_xor(vbll, vull);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vull = vec_xor(vull, vbll);			res_vull = vec_xor(vull, vbll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vbll = vec_xor(vbll, vbll);			res_vbll = vec_xor(vbll, vbll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	dummy();			dummy();
	// CHECK: call void @dummy()			// CHECK: call void @dummy()
				// CHECK-LE: call void @dummy()

	res_vd = vec_xor(vd, vd);			res_vd = vec_xor(vd, vd);
	// CHECK: [[X1:%.+]] = xor <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: [[X1:%.+]] = xor <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
	// CHECK: bitcast <2 x i64> [[X1]] to <2 x double>			// CHECK: bitcast <2 x i64> [[X1]] to <2 x double>
				// CHECK-LE: [[X1:%.+]] = xor <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE: bitcast <2 x i64> [[X1]] to <2 x double>

	dummy();			dummy();
	// CHECK: call void @dummy()			// CHECK: call void @dummy()
				// CHECK-LE: call void @dummy()

	res_vd = vec_xor(vd, vbll);			res_vd = vec_xor(vd, vbll);
	// CHECK: [[X1:%.+]] = xor <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: [[X1:%.+]] = xor <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
	// CHECK: bitcast <2 x i64> [[X1]] to <2 x double>			// CHECK: bitcast <2 x i64> [[X1]] to <2 x double>
				// CHECK-LE: [[X1:%.+]] = xor <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE: bitcast <2 x i64> [[X1]] to <2 x double>

	dummy();			dummy();
	// CHECK: call void @dummy()			// CHECK: call void @dummy()
				// CHECK-LE: call void @dummy()

	res_vd = vec_xor(vbll, vd);			res_vd = vec_xor(vbll, vd);
	// CHECK: [[X1:%.+]] = xor <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}			// CHECK: [[X1:%.+]] = xor <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
	// CHECK: bitcast <2 x i64> [[X1]] to <2 x double>			// CHECK: bitcast <2 x i64> [[X1]] to <2 x double>
				// CHECK-LE: [[X1:%.+]] = xor <2 x i64> %{{[0-9]+}}, %{{[0-9]+}}
				// CHECK-LE: bitcast <2 x i64> [[X1]] to <2 x double>

	/* vec_vxor */			/* vec_vxor */
	res_vsll = vec_vxor(vsll, vsll);			res_vsll = vec_vxor(vsll, vsll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vsll = vec_vxor(vbll, vsll);			res_vsll = vec_vxor(vbll, vsll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vsll = vec_vxor(vsll, vbll);			res_vsll = vec_vxor(vsll, vbll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vull = vec_vxor(vull, vull);			res_vull = vec_vxor(vull, vull);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vull = vec_vxor(vbll, vull);			res_vull = vec_vxor(vbll, vull);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vull = vec_vxor(vull, vbll);			res_vull = vec_vxor(vull, vbll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	res_vbll = vec_vxor(vbll, vbll);			res_vbll = vec_vxor(vbll, vbll);
	// CHECK: xor <2 x i64>			// CHECK: xor <2 x i64>
				// CHECK-LE: xor <2 x i64>

	}			}