This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
lib/builtins/
-
builtins/
2
divdc3.c
1
divsc3.c
-
divtc3.c
-
divxc3.c
-
test/builtins/Unit/
-
builtins/
-
Unit/
1
divdc3_test.c
-
divsc3_test.c
-
divtc3_test.c
-
divxc3_test.c

Differential D63061

[builtins] Fix overflow issue for complex division with big numbers
Needs Revision · Public

Authored by zsrkmyn on Jun 9 2019, 9:58 AM.

Download Raw Diff

Details

Reviewers

howard.hinnant
nsz
phosek
• ddunbar
craig.topper
andrew.w.kaylor
scanon

Summary

The __div*c3 functions overflow for large inputs, e.g. (DBL_MAX + DBL_MAX*i) / (0.5*DBL_MAX + 0.5*DBL_MAX*i) for __divdc3.
This patch tries to fix that.

Diff Detail

Event Timeline

zsrkmyn created this revision. · Jun 9 2019, 9:58 AM

Herald added projects: Restricted Project, Restricted Project. · View Herald Transcript · Jun 9 2019, 9:58 AM

Herald added subscribers: Restricted Project, llvm-commits. · View Herald Transcript

MaskRay added a subscriber: MaskRay. · Jul 9 2019, 7:16 PM

zsrkmyn added reviewers: nsz, phosek. · Jul 9 2019, 10:01 PM

ping

erichkeane added a reviewer: craig.topper. · Sep 3 2019, 6:17 AM

craig.topper added a reviewer: andrew.w.kaylor. · Sep 3 2019, 9:57 AM

craig.topper added a reviewer: scanon. · Sep 3 2019, 10:20 AM

fzou1 added a subscriber: fzou1. · Sep 19 2019, 10:33 PM

@scanon, is this something you can help with?

scanon requested changes to this revision. · Nov 20 2019, 6:11 AM

scanon added inline comments.

lib/builtins/divdc3.c
34	We don't have a clear definition of the required semantics for these builtins, but should FMA formation be allowed here? As written, it looks like we're at the mercy of the fp-contract flags passed while building compiler-rt, which means that the exact cancellation assumed by the tests won't pass if the default is ever "on". I would suggest either relaxing the tests or adding an explicit `#pragma STDC FP_CONTRACT OFF` in these functions. The latter is the simpler option, and doesn't have any real downside; we can discuss relaxing it later if we want.
test/builtins/Unit/divdc3_test.c
368	It would be good to build up these tests a bit more. In particular for double, we should include the test cases from Baudin & Smith's "A Robust Complex Division in Scilab" (https://arxiv.org/abs/1210.4539) for double; there are only 10, but they cover most of the hardest-to-get-right finite-result cases for complex division. They are trying to implement a division with a componentwise error-bound. That's a non-goal for compiler-rt, so we shouldn't expect to get them exactly right, but we should be able to get them with small relative error.

This revision now requires changes to proceed. · Nov 20 2019, 6:11 AM

scanon added inline comments. · Nov 20 2019, 6:39 AM

lib/builtins/divdc3.c
33	This rescaling strategy is still prone to overflow. Consider `a = b = DBL_MAX`, `c = d = 1`. The rescaled `ac + bd` will still overflow, because `max(c,d)` is 1, but the result should be finite. In general, I don't think that you can implement a rescaled division like this without considering the scaling of both (a,b) and (c,d); it doesn't suffice to only use the scaling of (c,d) alone.
lib/builtins/divsc3.c
21	On targets where we have hardware double-precision, it would be a huge win for float to simply promote to double and skip rescaling entirely. We still need the inf/nan checks, but for finite results this always gives the right answer. This can be a follow-on patch, however.

Revision Contents

Path

Size

lib/

builtins/

7 lines

7 lines

7 lines

7 lines

test/

builtins/

Unit/

39 lines

39 lines

43 lines

39 lines

Diff 203746

lib/builtins/divdc3.c

	Show All 17 Lines
	// Returns: the quotient of (a + ib) / (c + id)			// Returns: the quotient of (a + ib) / (c + id)

	COMPILER_RT_ABI Dcomplex __divdc3(double __a, double __b, double __c,			COMPILER_RT_ABI Dcomplex __divdc3(double __a, double __b, double __c,
	double __d) {			double __d) {
	int __ilogbw = 0;			int __ilogbw = 0;
	double __logbw = __compiler_rt_logb(crt_fmax(crt_fabs(__c), crt_fabs(__d)));			double __logbw = __compiler_rt_logb(crt_fmax(crt_fabs(__c), crt_fabs(__d)));
	if (crt_isfinite(__logbw)) {			if (crt_isfinite(__logbw)) {
	__ilogbw = (int)__logbw;			__ilogbw = (int)__logbw;
				__a = crt_scalbn(__a, -__ilogbw);
				__b = crt_scalbn(__b, -__ilogbw);
	__c = crt_scalbn(__c, -__ilogbw);			__c = crt_scalbn(__c, -__ilogbw);
	__d = crt_scalbn(__d, -__ilogbw);			__d = crt_scalbn(__d, -__ilogbw);
	}			}
	double __denom = __c * __c + __d * __d;			double __denom = __c * __c + __d * __d;
	Dcomplex z;			Dcomplex z;
	COMPLEX_REAL(z) = crt_scalbn((__a * __c + __b * __d) / __denom, -__ilogbw);			COMPLEX_REAL(z) = (__a * __c + __b * __d) / __denom;
				scanonUnsubmitted Not Done Reply Inline Actions This rescaling strategy is still prone to overflow. Consider `a = b = DBL_MAX`, `c = d = 1`. The rescaled `ac + bd` will still overflow, because `max(c,d)` is 1, but the result should be finite. In general, I don't think that you can implement a rescaled division like this without considering the scaling of both (a,b) and (c,d); it doesn't suffice to only use the scaling of (c,d) alone. scanon: This rescaling strategy is still prone to overflow. Consider `a = b = DBL_MAX`, `c = d = 1`.
	COMPLEX_IMAGINARY(z) =			COMPLEX_IMAGINARY(z) = (__b * __c - __a * __d) / __denom;
				scanonUnsubmitted Not Done Reply Inline Actions We don't have a clear definition of the required semantics for these builtins, but should FMA formation be allowed here? As written, it looks like we're at the mercy of the fp-contract flags passed while building compiler-rt, which means that the exact cancellation assumed by the tests won't pass if the default is ever "on". I would suggest either relaxing the tests or adding an explicit `#pragma STDC FP_CONTRACT OFF` in these functions. The latter is the simpler option, and doesn't have any real downside; we can discuss relaxing it later if we want. scanon: We don't have a clear definition of the required semantics for these builtins, but should FMA…
	crt_scalbn((__b * __c - __a * __d) / __denom, -__ilogbw);
	if (crt_isnan(COMPLEX_REAL(z)) && crt_isnan(COMPLEX_IMAGINARY(z))) {			if (crt_isnan(COMPLEX_REAL(z)) && crt_isnan(COMPLEX_IMAGINARY(z))) {
	if ((__denom == 0.0) && (!crt_isnan(__a) \|\| !crt_isnan(__b))) {			if ((__denom == 0.0) && (!crt_isnan(__a) \|\| !crt_isnan(__b))) {
	COMPLEX_REAL(z) = crt_copysign(CRT_INFINITY, __c) * __a;			COMPLEX_REAL(z) = crt_copysign(CRT_INFINITY, __c) * __a;
	COMPLEX_IMAGINARY(z) = crt_copysign(CRT_INFINITY, __c) * __b;			COMPLEX_IMAGINARY(z) = crt_copysign(CRT_INFINITY, __c) * __b;
	} else if ((crt_isinf(__a) \|\| crt_isinf(__b)) && crt_isfinite(__c) &&			} else if ((crt_isinf(__a) \|\| crt_isinf(__b)) && crt_isfinite(__c) &&
	crt_isfinite(__d)) {			crt_isfinite(__d)) {
	__a = crt_copysign(crt_isinf(__a) ? 1.0 : 0.0, __a);			__a = crt_copysign(crt_isinf(__a) ? 1.0 : 0.0, __a);
	__b = crt_copysign(crt_isinf(__b) ? 1.0 : 0.0, __b);			__b = crt_copysign(crt_isinf(__b) ? 1.0 : 0.0, __b);
	Show All 12 Lines

lib/builtins/divsc3.c

	Show All 12 Lines
	#define SINGLE_PRECISION			#define SINGLE_PRECISION
	#include "fp_lib.h"			#include "fp_lib.h"
	#include "int_lib.h"			#include "int_lib.h"
	#include "int_math.h"			#include "int_math.h"

	// Returns: the quotient of (a + ib) / (c + id)			// Returns: the quotient of (a + ib) / (c + id)

	COMPILER_RT_ABI Fcomplex __divsc3(float __a, float __b, float __c, float __d) {			COMPILER_RT_ABI Fcomplex __divsc3(float __a, float __b, float __c, float __d) {
	int __ilogbw = 0;			int __ilogbw = 0;
				scanonUnsubmitted Not Done Reply Inline Actions On targets where we have hardware double-precision, it would be a huge win for float to simply promote to double and skip rescaling entirely. We still need the inf/nan checks, but for finite results this always gives the right answer. This can be a follow-on patch, however. scanon: On targets where we have hardware double-precision, it would be a huge win for float to simply…
	float __logbw =			float __logbw =
	__compiler_rt_logbf(crt_fmaxf(crt_fabsf(__c), crt_fabsf(__d)));			__compiler_rt_logbf(crt_fmaxf(crt_fabsf(__c), crt_fabsf(__d)));
	if (crt_isfinite(__logbw)) {			if (crt_isfinite(__logbw)) {
	__ilogbw = (int)__logbw;			__ilogbw = (int)__logbw;
				__a = crt_scalbnf(__a, -__ilogbw);
				__b = crt_scalbnf(__b, -__ilogbw);
	__c = crt_scalbnf(__c, -__ilogbw);			__c = crt_scalbnf(__c, -__ilogbw);
	__d = crt_scalbnf(__d, -__ilogbw);			__d = crt_scalbnf(__d, -__ilogbw);
	}			}
	float __denom = __c * __c + __d * __d;			float __denom = __c * __c + __d * __d;
	Fcomplex z;			Fcomplex z;
	COMPLEX_REAL(z) = crt_scalbnf((__a * __c + __b * __d) / __denom, -__ilogbw);			COMPLEX_REAL(z) = (__a * __c + __b * __d) / __denom;
	COMPLEX_IMAGINARY(z) =			COMPLEX_IMAGINARY(z) = (__b * __c - __a * __d) / __denom;
	crt_scalbnf((__b * __c - __a * __d) / __denom, -__ilogbw);
	if (crt_isnan(COMPLEX_REAL(z)) && crt_isnan(COMPLEX_IMAGINARY(z))) {			if (crt_isnan(COMPLEX_REAL(z)) && crt_isnan(COMPLEX_IMAGINARY(z))) {
	if ((__denom == 0) && (!crt_isnan(__a) \|\| !crt_isnan(__b))) {			if ((__denom == 0) && (!crt_isnan(__a) \|\| !crt_isnan(__b))) {
	COMPLEX_REAL(z) = crt_copysignf(CRT_INFINITY, __c) * __a;			COMPLEX_REAL(z) = crt_copysignf(CRT_INFINITY, __c) * __a;
	COMPLEX_IMAGINARY(z) = crt_copysignf(CRT_INFINITY, __c) * __b;			COMPLEX_IMAGINARY(z) = crt_copysignf(CRT_INFINITY, __c) * __b;
	} else if ((crt_isinf(__a) \|\| crt_isinf(__b)) && crt_isfinite(__c) &&			} else if ((crt_isinf(__a) \|\| crt_isinf(__b)) && crt_isfinite(__c) &&
	crt_isfinite(__d)) {			crt_isfinite(__d)) {
	__a = crt_copysignf(crt_isinf(__a) ? 1 : 0, __a);			__a = crt_copysignf(crt_isinf(__a) ? 1 : 0, __a);
	__b = crt_copysignf(crt_isinf(__b) ? 1 : 0, __b);			__b = crt_copysignf(crt_isinf(__b) ? 1 : 0, __b);
	Show All 12 Lines

lib/builtins/divtc3.c

	Show All 18 Lines

	COMPILER_RT_ABI Lcomplex __divtc3(long double __a, long double __b,			COMPILER_RT_ABI Lcomplex __divtc3(long double __a, long double __b,
	long double __c, long double __d) {			long double __c, long double __d) {
	int __ilogbw = 0;			int __ilogbw = 0;
	long double __logbw =			long double __logbw =
	__compiler_rt_logbl(crt_fmaxl(crt_fabsl(__c), crt_fabsl(__d)));			__compiler_rt_logbl(crt_fmaxl(crt_fabsl(__c), crt_fabsl(__d)));
	if (crt_isfinite(__logbw)) {			if (crt_isfinite(__logbw)) {
	__ilogbw = (int)__logbw;			__ilogbw = (int)__logbw;
				__a = crt_scalbnl(__a, -__ilogbw);
				__b = crt_scalbnl(__b, -__ilogbw);
	__c = crt_scalbnl(__c, -__ilogbw);			__c = crt_scalbnl(__c, -__ilogbw);
	__d = crt_scalbnl(__d, -__ilogbw);			__d = crt_scalbnl(__d, -__ilogbw);
	}			}
	long double __denom = __c * __c + __d * __d;			long double __denom = __c * __c + __d * __d;
	Lcomplex z;			Lcomplex z;
	COMPLEX_REAL(z) = crt_scalbnl((__a * __c + __b * __d) / __denom, -__ilogbw);			COMPLEX_REAL(z) = (__a * __c + __b * __d) / __denom;
	COMPLEX_IMAGINARY(z) =			COMPLEX_IMAGINARY(z) = (__b * __c - __a * __d) / __denom;
	crt_scalbnl((__b * __c - __a * __d) / __denom, -__ilogbw);
	if (crt_isnan(COMPLEX_REAL(z)) && crt_isnan(COMPLEX_IMAGINARY(z))) {			if (crt_isnan(COMPLEX_REAL(z)) && crt_isnan(COMPLEX_IMAGINARY(z))) {
	if ((__denom == 0.0) && (!crt_isnan(__a) \|\| !crt_isnan(__b))) {			if ((__denom == 0.0) && (!crt_isnan(__a) \|\| !crt_isnan(__b))) {
	COMPLEX_REAL(z) = crt_copysignl(CRT_INFINITY, __c) * __a;			COMPLEX_REAL(z) = crt_copysignl(CRT_INFINITY, __c) * __a;
	COMPLEX_IMAGINARY(z) = crt_copysignl(CRT_INFINITY, __c) * __b;			COMPLEX_IMAGINARY(z) = crt_copysignl(CRT_INFINITY, __c) * __b;
	} else if ((crt_isinf(__a) \|\| crt_isinf(__b)) && crt_isfinite(__c) &&			} else if ((crt_isinf(__a) \|\| crt_isinf(__b)) && crt_isfinite(__c) &&
	crt_isfinite(__d)) {			crt_isfinite(__d)) {
	__a = crt_copysignl(crt_isinf(__a) ? 1.0 : 0.0, __a);			__a = crt_copysignl(crt_isinf(__a) ? 1.0 : 0.0, __a);
	__b = crt_copysignl(crt_isinf(__b) ? 1.0 : 0.0, __b);			__b = crt_copysignl(crt_isinf(__b) ? 1.0 : 0.0, __b);
	Show All 12 Lines

lib/builtins/divxc3.c

	Show All 17 Lines
	// Returns: the quotient of (a + ib) / (c + id)			// Returns: the quotient of (a + ib) / (c + id)

	COMPILER_RT_ABI Lcomplex __divxc3(long double __a, long double __b,			COMPILER_RT_ABI Lcomplex __divxc3(long double __a, long double __b,
	long double __c, long double __d) {			long double __c, long double __d) {
	int __ilogbw = 0;			int __ilogbw = 0;
	long double __logbw = crt_logbl(crt_fmaxl(crt_fabsl(__c), crt_fabsl(__d)));			long double __logbw = crt_logbl(crt_fmaxl(crt_fabsl(__c), crt_fabsl(__d)));
	if (crt_isfinite(__logbw)) {			if (crt_isfinite(__logbw)) {
	__ilogbw = (int)__logbw;			__ilogbw = (int)__logbw;
				__a = crt_scalbnl(__a, -__ilogbw);
				__b = crt_scalbnl(__b, -__ilogbw);
	__c = crt_scalbnl(__c, -__ilogbw);			__c = crt_scalbnl(__c, -__ilogbw);
	__d = crt_scalbnl(__d, -__ilogbw);			__d = crt_scalbnl(__d, -__ilogbw);
	}			}
	long double __denom = __c * __c + __d * __d;			long double __denom = __c * __c + __d * __d;
	Lcomplex z;			Lcomplex z;
	COMPLEX_REAL(z) = crt_scalbnl((__a * __c + __b * __d) / __denom, -__ilogbw);			COMPLEX_REAL(z) = (__a * __c + __b * __d) / __denom;
	COMPLEX_IMAGINARY(z) =			COMPLEX_IMAGINARY(z) = (__b * __c - __a * __d) / __denom;
	crt_scalbnl((__b * __c - __a * __d) / __denom, -__ilogbw);
	if (crt_isnan(COMPLEX_REAL(z)) && crt_isnan(COMPLEX_IMAGINARY(z))) {			if (crt_isnan(COMPLEX_REAL(z)) && crt_isnan(COMPLEX_IMAGINARY(z))) {
	if ((__denom == 0) && (!crt_isnan(__a) \|\| !crt_isnan(__b))) {			if ((__denom == 0) && (!crt_isnan(__a) \|\| !crt_isnan(__b))) {
	COMPLEX_REAL(z) = crt_copysignl(CRT_INFINITY, __c) * __a;			COMPLEX_REAL(z) = crt_copysignl(CRT_INFINITY, __c) * __a;
	COMPLEX_IMAGINARY(z) = crt_copysignl(CRT_INFINITY, __c) * __b;			COMPLEX_IMAGINARY(z) = crt_copysignl(CRT_INFINITY, __c) * __b;
	} else if ((crt_isinf(__a) \|\| crt_isinf(__b)) && crt_isfinite(__c) &&			} else if ((crt_isinf(__a) \|\| crt_isinf(__b)) && crt_isfinite(__c) &&
	crt_isfinite(__d)) {			crt_isfinite(__d)) {
	__a = crt_copysignl(crt_isinf(__a) ? 1 : 0, __a);			__a = crt_copysignl(crt_isinf(__a) ? 1 : 0, __a);
	__b = crt_copysignl(crt_isinf(__b) ? 1 : 0, __b);			__b = crt_copysignl(crt_isinf(__b) ? 1 : 0, __b);
	Show All 14 Lines

test/builtins/Unit/divdc3_test.c

Show First 20 Lines • Show All 48 Lines • ▼ Show 20 Lines	classify(double _Complex x)
return non_zero;		return non_zero;
}		}

int test__divdc3(double a, double b, double c, double d)		int test__divdc3(double a, double b, double c, double d)
{		{
double _Complex r = __divdc3(a, b, c, d);		double _Complex r = __divdc3(a, b, c, d);
// printf("test__divdc3(%f, %f, %f, %f) = %f + I%f\n",		// printf("test__divdc3(%f, %f, %f, %f) = %f + I%f\n",
// a, b, c, d, creal(r), cimag(r));		// a, b, c, d, creal(r), cimag(r));
double _Complex dividend;		double _Complex dividend;
double _Complex divisor;		double _Complex divisor;

__real__ dividend = a;		__real__ dividend = a;
__imag__ dividend = b;		__imag__ dividend = b;
__real__ divisor = c;		__real__ divisor = c;
__imag__ divisor = d;		__imag__ divisor = d;

switch (classify(dividend))		switch (classify(dividend))
{		{
case zero:		case zero:
switch (classify(divisor))		switch (classify(divisor))
{		{
case zero:		case zero:
if (classify(r) != NaN)		if (classify(r) != NaN)
return 1;		return 1;
▲ Show 20 Lines • Show All 118 Lines • ▼ Show 20 Lines	case non_zero_nan:
break;		break;
case non_zero_nan:		case non_zero_nan:
if (classify(r) != NaN)		if (classify(r) != NaN)
return 1;		return 1;
break;		break;
}		}
break;		break;
}		}

return 0;		return 0;
}		}

double x[][2] =		double x[][2] =
{		{
{ 1.e-6, 1.e-6},		{ 1.e-6, 1.e-6},
{-1.e-6, 1.e-6},		{-1.e-6, 1.e-6},
{-1.e-6, -1.e-6},		{-1.e-6, -1.e-6},
▲ Show 20 Lines • Show All 143 Lines • ▼ Show 20 Lines	double x[][2] =
{+0., INFINITY},		{+0., INFINITY},
{0.5, INFINITY},		{0.5, INFINITY},
{1, INFINITY},		{1, INFINITY},
{2, INFINITY},		{2, INFINITY},
{INFINITY, INFINITY}		{INFINITY, INFINITY}

};		};

		int test_bignum__divdc3(double a, double b, double c, double d, double _Complex r)
		{
		return __divdc3(a, b, c, d) != r;
		}

		double x_bignum[][5] =
		{
		{__DBL_MAX__, __DBL_MAX__, __DBL_MAX__/2, __DBL_MAX__/2, 2.},
		{-__DBL_MAX__, -__DBL_MAX__, __DBL_MAX__/2, __DBL_MAX__/2, -2.},
		};
		scanonUnsubmitted Not Done Reply Inline Actions It would be good to build up these tests a bit more. In particular for double, we should include the test cases from Baudin & Smith's "A Robust Complex Division in Scilab" (https://arxiv.org/abs/1210.4539) for double; there are only 10, but they cover most of the hardest-to-get-right finite-result cases for complex division. They are trying to implement a division with a componentwise error-bound. That's a non-goal for compiler-rt, so we shouldn't expect to get them exactly right, but we should be able to get them with small relative error. scanon: It would be good to build up these tests a bit more. In particular for double, we should…

int main()		int main()
{		{
const unsigned N = sizeof(x) / sizeof(x[0]);		unsigned N = sizeof(x) / sizeof(x[0]);
unsigned i, j;		unsigned i, j;
for (i = 0; i < N; ++i)		for (i = 0; i < N; ++i)
{		{
for (j = 0; j < N; ++j)		for (j = 0; j < N; ++j)
{		{
if (test__divdc3(x[i][0], x[i][1], x[j][0], x[j][1]))		if (test__divdc3(x[i][0], x[i][1], x[j][0], x[j][1]))
return 1;		return 1;
}		}
}		}

		N = sizeof(x_bignum) / sizeof(x_bignum[0]);
		for (i = 0; i < N; ++i)
		{
		double *t = x_bignum[i];
		if (test_bignum__divdc3(t[0], t[1], t[2], t[3], t[4]))
		return 1;
		}

return 0;		return 0;
}		}

test/builtins/Unit/divsc3_test.c

Show First 20 Lines • Show All 48 Lines • ▼ Show 20 Lines	classify(float _Complex x)
return non_zero;		return non_zero;
}		}

int test__divsc3(float a, float b, float c, float d)		int test__divsc3(float a, float b, float c, float d)
{		{
float _Complex r = __divsc3(a, b, c, d);		float _Complex r = __divsc3(a, b, c, d);
// printf("test__divsc3(%f, %f, %f, %f) = %f + I%f\n",		// printf("test__divsc3(%f, %f, %f, %f) = %f + I%f\n",
// a, b, c, d, crealf(r), cimagf(r));		// a, b, c, d, crealf(r), cimagf(r));
float _Complex dividend;		float _Complex dividend;
float _Complex divisor;		float _Complex divisor;

__real__ dividend = a;		__real__ dividend = a;
__imag__ dividend = b;		__imag__ dividend = b;
__real__ divisor = c;		__real__ divisor = c;
__imag__ divisor = d;		__imag__ divisor = d;

switch (classify(dividend))		switch (classify(dividend))
{		{
case zero:		case zero:
switch (classify(divisor))		switch (classify(divisor))
{		{
case zero:		case zero:
if (classify(r) != NaN)		if (classify(r) != NaN)
return 1;		return 1;
▲ Show 20 Lines • Show All 118 Lines • ▼ Show 20 Lines	case non_zero_nan:
break;		break;
case non_zero_nan:		case non_zero_nan:
if (classify(r) != NaN)		if (classify(r) != NaN)
return 1;		return 1;
break;		break;
}		}
break;		break;
}		}

return 0;		return 0;
}		}

float x[][2] =		float x[][2] =
{		{
{ 1.e-6, 1.e-6},		{ 1.e-6, 1.e-6},
{-1.e-6, 1.e-6},		{-1.e-6, 1.e-6},
{-1.e-6, -1.e-6},		{-1.e-6, -1.e-6},
▲ Show 20 Lines • Show All 143 Lines • ▼ Show 20 Lines	float x[][2] =
{+0., INFINITY},		{+0., INFINITY},
{0.5, INFINITY},		{0.5, INFINITY},
{1, INFINITY},		{1, INFINITY},
{2, INFINITY},		{2, INFINITY},
{INFINITY, INFINITY}		{INFINITY, INFINITY}

};		};

		int test_bignum__divsc3(float a, float b, float c, float d, float _Complex r)
		{
		return __divsc3(a, b, c, d) != r;
		}

		float x_bignum[][5] =
		{
		{__FLT_MAX__, __FLT_MAX__, __FLT_MAX__/2, __FLT_MAX__/2, 2.},
		{-__FLT_MAX__, -__FLT_MAX__, __FLT_MAX__/2, __FLT_MAX__/2, -2.},
		};

int main()		int main()
{		{
const unsigned N = sizeof(x) / sizeof(x[0]);		unsigned N = sizeof(x) / sizeof(x[0]);
unsigned i, j;		unsigned i, j;
for (i = 0; i < N; ++i)		for (i = 0; i < N; ++i)
{		{
for (j = 0; j < N; ++j)		for (j = 0; j < N; ++j)
{		{
if (test__divsc3(x[i][0], x[i][1], x[j][0], x[j][1]))		if (test__divsc3(x[i][0], x[i][1], x[j][0], x[j][1]))
return 1;		return 1;
}		}
}		}

		N = sizeof(x_bignum) / sizeof(x_bignum[0]);
		for (i = 0; i < N; ++i)
		{
		float *t = x_bignum[i];
		if (test_bignum__divsc3(t[0], t[1], t[2], t[3], t[4]))
		return 1;
		}

return 0;		return 0;
}		}

test/builtins/Unit/divtc3_test.c

Show First 20 Lines • Show All 49 Lines • ▼ Show 20 Lines	classify(long double _Complex x)
return non_zero;		return non_zero;
}		}

int test__divtc3(long double a, long double b, long double c, long double d)		int test__divtc3(long double a, long double b, long double c, long double d)
{		{
long double _Complex r = __divtc3(a, b, c, d);		long double _Complex r = __divtc3(a, b, c, d);
// printf("test__divtc3(%Lf, %Lf, %Lf, %Lf) = %Lf + I%Lf\n",		// printf("test__divtc3(%Lf, %Lf, %Lf, %Lf) = %Lf + I%Lf\n",
// a, b, c, d, creall(r), cimagl(r));		// a, b, c, d, creall(r), cimagl(r));

long double _Complex dividend;		long double _Complex dividend;
long double _Complex divisor;		long double _Complex divisor;

__real__ dividend = a;		__real__ dividend = a;
__imag__ dividend = b;		__imag__ dividend = b;
__real__ divisor = c;		__real__ divisor = c;
__imag__ divisor = d;		__imag__ divisor = d;

switch (classify(dividend))		switch (classify(dividend))
{		{
case zero:		case zero:
switch (classify(divisor))		switch (classify(divisor))
{		{
case zero:		case zero:
if (classify(r) != NaN)		if (classify(r) != NaN)
return 1;		return 1;
▲ Show 20 Lines • Show All 118 Lines • ▼ Show 20 Lines	case non_zero_nan:
break;		break;
case non_zero_nan:		case non_zero_nan:
if (classify(r) != NaN)		if (classify(r) != NaN)
return 1;		return 1;
break;		break;
}		}
break;		break;
}		}

return 0;		return 0;
}		}

long double x[][2] =		long double x[][2] =
{		{
{ 1.e-6, 1.e-6},		{ 1.e-6, 1.e-6},
{-1.e-6, 1.e-6},		{-1.e-6, 1.e-6},
{-1.e-6, -1.e-6},		{-1.e-6, -1.e-6},
▲ Show 20 Lines • Show All 143 Lines • ▼ Show 20 Lines	long double x[][2] =
{+0., INFINITY},		{+0., INFINITY},
{0.5, INFINITY},		{0.5, INFINITY},
{1, INFINITY},		{1, INFINITY},
{2, INFINITY},		{2, INFINITY},
{INFINITY, INFINITY}		{INFINITY, INFINITY}

};		};

		int test_bignum__divtc3(long double a, long double b, long double c, long double d, long double _Complex r)
		{
		return __divtc3(a, b, c, d) != r;
		}

		long double x_bignum[][5] =
		{
		{__LDBL_MAX__, __LDBL_MAX__, __LDBL_MAX__/2, __LDBL_MAX__/2, 2.},
		{-__LDBL_MAX__, -__LDBL_MAX__, __LDBL_MAX__/2, __LDBL_MAX__/2, -2.},
		};

int main()		int main()
{		{
const unsigned N = sizeof(x) / sizeof(x[0]);		unsigned N = sizeof(x) / sizeof(x[0]);
unsigned i, j;		unsigned i, j;
for (i = 0; i < N; ++i)		for (i = 0; i < N; ++i)
{		{
for (j = 0; j < N; ++j)		for (j = 0; j < N; ++j)
{		{
if (test__divtc3(x[i][0], x[i][1], x[j][0], x[j][1]))		if (test__divtc3(x[i][0], x[i][1], x[j][0], x[j][1]))
return 1;		return 1;
}		}
}		}

		N = sizeof(x_bignum) / sizeof(x_bignum[0]);
		for (i = 0; i < N; ++i)
		{
		long double *t = x_bignum[i];
		if (test_bignum__divtc3(t[0], t[1], t[2], t[3], t[4]))
		return 1;
		}

// printf("No errors found.\n");		// printf("No errors found.\n");
return 0;		return 0;
}		}

test/builtins/Unit/divxc3_test.c

Show First 20 Lines • Show All 53 Lines • ▼ Show 20 Lines	classify(long double _Complex x)
return non_zero;		return non_zero;
}		}

int test__divxc3(long double a, long double b, long double c, long double d)		int test__divxc3(long double a, long double b, long double c, long double d)
{		{
long double _Complex r = __divxc3(a, b, c, d);		long double _Complex r = __divxc3(a, b, c, d);
// printf("test__divxc3(%Lf, %Lf, %Lf, %Lf) = %Lf + I%Lf\n",		// printf("test__divxc3(%Lf, %Lf, %Lf, %Lf) = %Lf + I%Lf\n",
// a, b, c, d, creall(r), cimagl(r));		// a, b, c, d, creall(r), cimagl(r));
long double _Complex dividend;		long double _Complex dividend;
long double _Complex divisor;		long double _Complex divisor;

__real__ dividend = a;		__real__ dividend = a;
__imag__ dividend = b;		__imag__ dividend = b;
__real__ divisor = c;		__real__ divisor = c;
__imag__ divisor = d;		__imag__ divisor = d;

switch (classify(dividend))		switch (classify(dividend))
{		{
case zero:		case zero:
switch (classify(divisor))		switch (classify(divisor))
{		{
case zero:		case zero:
if (classify(r) != NaN)		if (classify(r) != NaN)
return 1;		return 1;
▲ Show 20 Lines • Show All 118 Lines • ▼ Show 20 Lines	case non_zero_nan:
break;		break;
case non_zero_nan:		case non_zero_nan:
if (classify(r) != NaN)		if (classify(r) != NaN)
return 1;		return 1;
break;		break;
}		}
break;		break;
}		}

return 0;		return 0;
}		}

long double x[][2] =		long double x[][2] =
{		{
{ 1.e-6, 1.e-6},		{ 1.e-6, 1.e-6},
{-1.e-6, 1.e-6},		{-1.e-6, 1.e-6},
{-1.e-6, -1.e-6},		{-1.e-6, -1.e-6},
▲ Show 20 Lines • Show All 143 Lines • ▼ Show 20 Lines	long double x[][2] =
{+0., INFINITY},		{+0., INFINITY},
{0.5, INFINITY},		{0.5, INFINITY},
{1, INFINITY},		{1, INFINITY},
{2, INFINITY},		{2, INFINITY},
{INFINITY, INFINITY}		{INFINITY, INFINITY}

};		};

		int test_bignum__divxc3(long double a, long double b, long double c, long double d, long double _Complex r)
		{
		return __divxc3(a, b, c, d) != r;
		}

		long double x_bignum[][5] =
		{
		{__LDBL_MAX__, __LDBL_MAX__, __LDBL_MAX__/2, __LDBL_MAX__/2, 2.},
		{-__LDBL_MAX__, -__LDBL_MAX__, __LDBL_MAX__/2, __LDBL_MAX__/2, -2.},
		};

#endif		#endif

int main()		int main()
{		{
#if !_ARCH_PPC		#if !_ARCH_PPC
const unsigned N = sizeof(x) / sizeof(x[0]);		unsigned N = sizeof(x) / sizeof(x[0]);
unsigned i, j;		unsigned i, j;
for (i = 0; i < N; ++i)		for (i = 0; i < N; ++i)
{		{
for (j = 0; j < N; ++j)		for (j = 0; j < N; ++j)
{		{
if (test__divxc3(x[i][0], x[i][1], x[j][0], x[j][1]))		if (test__divxc3(x[i][0], x[i][1], x[j][0], x[j][1]))
return 1;		return 1;
}		}
}		}

		N = sizeof(x_bignum) / sizeof(x_bignum[0]);
		for (i = 0; i < N; ++i)
		{
		long double *t = x_bignum[i];
		if (test_bignum__divxc3(t[0], t[1], t[2], t[3], t[4]))
		return 1;
		}

#else		#else
printf("skipped\n");		printf("skipped\n");
#endif		#endif
return 0;		return 0;
}		}

This is an archive of the discontinued LLVM Phabricator instance.

[builtins] Fix overflow issue for complex division with big numbers · Needs Revision · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 203746

lib/builtins/divdc3.c

lib/builtins/divsc3.c

lib/builtins/divtc3.c

lib/builtins/divxc3.c

test/builtins/Unit/divdc3_test.c

test/builtins/Unit/divsc3_test.c

test/builtins/Unit/divtc3_test.c

test/builtins/Unit/divxc3_test.c

[builtins] Fix overflow issue for complex division with big numbers
Needs Revision · Public