// test_conformance/math_brute_force/Utility.cpp - external/github.com/KhronosGroup/OpenCL-CTS - Git at Google

 //
 // Copyright (c) 2017 The Khronos Group Inc.
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //    http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.
 //
 #include "Utility.h"
 #include "FunctionList.h"

 #if defined(__PPC__)
 // Thread-local global variable used to hold the FPU control register state. The FPSCR
 // register cannot be used because not all Power implementations retain or observe the
 // NI (non-IEEE mode) bit.
 __thread fpu_control_t fpu_control = 0;
 #endif

 // Multiplies u by v and hands the result back as a pair of doubles:
 //   *rhi - the ordinarily rounded product u*v
 //   *rlo - a correction term assembled from the split halves of u and v
 // Both output pointers must be valid; they are written unconditionally.
 void MulD(double *rhi, double *rlo, double u, double v)
 {
     // 1 + 2^27; scaling by this value is what separates each operand into
     // an upper and a lower half below.
     const double splitter = 134217729.0;

     // u == uHead + uTail
     const double uScaled = u * splitter;
     const double uHead = (u - uScaled) + uScaled;
     const double uTail = u - uHead;

     // v == vHead + vTail
     const double vScaled = v * splitter;
     const double vHead = (v - vScaled) + vScaled;
     const double vTail = v - vHead;

     const double product = u * v;

     // The partial products are accumulated strictly in this order; the
     // parenthesisation is part of the algorithm and must not be rearranged.
     const double correction =
         (((uHead * vHead - product) + (uHead * vTail)) + (uTail * vHead)) + (uTail * vTail);

     *rhi = product;
     *rlo = correction;
 }

 // Adds a and b and returns the sum as a pair of doubles:
 //   *rhi - the ordinarily rounded sum a + b
 //   *rlo - what is left of the smaller-magnitude operand after removing the
 //          part of it that made it into *rhi
 void AddD(double *rhi, double *rlo, double a, double b)
 {
     const double sum = a + b;

     // Decide which operand has the larger magnitude. When the comparison is
     // false (equal magnitudes included) b is treated as the larger one.
     const int aIsLarger = fabs(a) > fabs(b);
     const double larger = aIsLarger ? a : b;
     const double smaller = aIsLarger ? b : a;

     *rhi = sum;
     *rlo = smaller - (sum - larger);
 }

 // Multiplies the pair (xh, xl) by the pair (yh, yl) and returns the product
 // as a pair (*rhi, *rlo). The head product xh*yh is formed with the same
 // operand-splitting scheme as MulD; the cross terms xh*yl and xl*yh are then
 // folded into the tail, and the pair is renormalised before being stored.
 // The xl*yl term is not included.
 void MulDD(double *rhi, double *rlo, double xh, double xl, double yh, double yl)
 {
     // 1 + 2^27, the operand-splitting constant.
     const double splitter = 134217729.0;

     // xh == xHead + xTail
     const double xScaled = xh * splitter;
     const double xHead = (xh - xScaled) + xScaled;
     const double xTail = xh - xHead;

     // yh == yHead + yTail
     const double yScaled = yh * splitter;
     const double yHead = (yh - yScaled) + yScaled;
     const double yTail = yh - yHead;

     const double head = xh * yh;

     // Accumulation order is significant; keep the parentheses as they are.
     double tail = (((xHead * yHead - head) + (xHead * yTail)) + (xTail * yHead)) + (xTail * yTail);
     tail += xh * yl + xl * yh;

     // Renormalise so that the stored head carries the rounded total.
     const double total = head + tail;
     *rhi = total;
     *rlo = (head - total) + tail;
 }

 // Adds the pair (xh, xl) to the pair (yh, yl) and returns the sum as a pair
 // (*rhi, *rlo). The heads are added first; the tail is then rebuilt starting
 // from whichever head has the larger magnitude, and the pair is renormalised.
 void AddDD(double *rhi, double *rlo, double xh, double xl, double yh, double yl)
 {
     const double headSum = xh + yh;

     // Each branch is evaluated strictly left to right; the operand order
     // differs between the branches on purpose.
     double tail;
     if (fabs(xh) > fabs(yh))
     {
         tail = xh - headSum + yh + yl + xl;
     }
     else
     {
         tail = yh - headSum + xh + xl + yl;
     }

     const double total = headSum + tail;
     *rhi = total;
     *rlo = (headSum - total) + tail;
 }

 // Divides a by b and returns the quotient as a pair of doubles:
 //   *chi - the ordinarily rounded quotient a / b
 //   *clo - a correction obtained by multiplying *chi back by b (MulD),
 //          subtracting that from a (AddDD) and dividing the head of the
 //          remainder by b
 void DivideDD(double *chi, double *clo, double a, double b)
 {
     const double quotient = a / b;
     *chi = quotient;

     // quotient * b as a head/tail pair.
     double prodHi, prodLo;
     MulD(&prodHi, &prodLo, quotient, b);

     // remainder = a - quotient * b; only its head is used below.
     double remHi, remLo;
     AddDD(&remHi, &remLo, -prodHi, -prodLo, a, 0.0);

     *clo = remHi / b;
 }

 // These functions compare two floats/doubles. Since some platforms may choose to
 // flush denormals to zero before comparison, a comparison like a < b may give the wrong
 // result in "certain cases" where we do need the correct comparison result when operands
 // are denormals, so these functions compare floats/doubles using their signed integer/long int
 // representation. In other cases, when flushing to zero is fine, these should not be used.
 // Also, these functions don't check for NaNs and assume NaNs are handled separately as a
 // special edge case by the caller which calls these functions.
 // They return 0 if both are equal, 1 if x > y and -1 if x < y.

 inline
 int compareFloats(float x, float y)
 {
     int32f_t a, b;

     a.f = x;
     b.f = y;

     if( a.i & 0x80000000 )
         a.i = 0x80000000 - a.i;
     if( b.i & 0x80000000 )
         b.i = 0x80000000 - b.i;

     if( a.i == b.i )
         return 0;

     return a.i < b.i ? -1 : 1;
 }

 inline
 int compareDoubles(double x, double y)
 {
     int64d_t a, b;

     a.d = x;
     b.d = y;

     if( a.l & 0x8000000000000000LL )
         a.l = 0x8000000000000000LL - a.l;
     if( b.l & 0x8000000000000000LL )
         b.l = 0x8000000000000000LL - b.l;

     if( a.l == b.l )
         return 0;

     return a.l < b.l ? -1 : 1;
 }

 // Logs one header line for the function under test through vlog():
 // the function name, a precision tag chosen from float_size
 // ("fp64"/"fp32"/"fp16" for sizeof(cl_double)/sizeof(cl_float)/sizeof(cl_half))
 // and "rlx" when isFastRelaxed is non-zero (empty string otherwise).
 //
 // Any other float_size is logged as "unk". Previously the tag stayed NULL in
 // that case and the NULL pointer was handed to the %4s conversion.
 void logFunctionInfo(const char *fname, unsigned int float_size, unsigned int isFastRelaxed)
 {
     char const *fpSizeStr = "unk";
     char const *fpFastRelaxedStr = "";
     switch (float_size) {
     case sizeof(cl_double):
         fpSizeStr = "fp64";
         break;
     case sizeof(cl_float):
         fpSizeStr = "fp32";
         break;
     case sizeof(cl_half):
         fpSizeStr = "fp16";
         break;
     default:
         // Keep the "unk" fallback assigned above.
         break;
     }
     if (isFastRelaxed) {
         fpFastRelaxedStr = "rlx";
     }
     vlog("%15s %4s %4s",fname, fpSizeStr, fpFastRelaxedStr);
 }

 // Returns the error bound stored in f for the current configuration.
 // The field is chosen by two switches: the relaxed argument and the global
 // gIsEmbedded flag.
 //   relaxed,  embedded -> f->relaxed_embedded_error
 //   relaxed,  other    -> f->relaxed_error
 //   !relaxed, embedded -> f->float_embedded_ulps
 //   !relaxed, other    -> f->float_ulps
 float getAllowedUlpError(const Func *f, const bool relaxed)
 {
     if (relaxed && gIsEmbedded)
     {
         return f->relaxed_embedded_error;
     }
     if (relaxed)
     {
         return f->relaxed_error;
     }
     if (gIsEmbedded)
     {
         return f->float_embedded_ulps;
     }
     return f->float_ulps;
 }
	//
	// Copyright (c) 2017 The Khronos Group Inc.
	//
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.
	//
	#include "Utility.h"
	#include "FunctionList.h"

	#if defined(__PPC__)
	// Thread-local global variable used to hold the FPU control register state. The FPSCR
	// register cannot be used because not all Power implementations retain or observe the
	// NI (non-IEEE mode) bit.
	__thread fpu_control_t fpu_control = 0;
	#endif

	// Multiplies u by v and returns the result as a pair of doubles:
	//   *rhi - the ordinarily rounded product u*v
	//   *rlo - a correction term built from the split halves of u and v
	// The '*' tokens (pointer declarators and multiplications) had been lost
	// from this definition and are restored here.
	void MulD(double *rhi, double *rlo, double u, double v)
	{
	    const double c = 134217729.0; // 1+2^27
	    double up, u1, u2, vp, v1, v2;

	    // Split u into u1 + u2.
	    up = u*c;
	    u1 = (u - up) + up;
	    u2 = u - u1;

	    // Split v into v1 + v2.
	    vp = v*c;
	    v1 = (v - vp) + vp;
	    v2 = v - v1;

	    double rh = u*v;
	    // The accumulation order of the partial products is significant.
	    double rl = (((u1*v1 - rh) + (u1*v2)) + (u2*v1)) + (u2*v2);

	    *rhi = rh;
	    *rlo = rl;
	}

	// Adds a and b and returns the sum as a pair of doubles:
	//   *rhi - the ordinarily rounded sum a + b
	//   *rlo - the part of the smaller-magnitude operand that did not make it
	//          into *rhi
	// The pointer declarators on rhi/rlo had been lost from this definition
	// and are restored here.
	void AddD(double *rhi, double *rlo, double a, double b)
	{
	    double zhi, zlo;
	    zhi = a + b;
	    // Recover the tail starting from the operand with the larger magnitude.
	    if(fabs(a) > fabs(b)) {
	        zlo = zhi - a;
	        zlo = b - zlo;
	    }
	    else {
	        zlo = zhi - b;
	        zlo = a - zlo;
	    }

	    *rhi = zhi;
	    *rlo = zlo;
	}

	// Multiplies the pair (xh, xl) by the pair (yh, yl) and returns the product
	// as a pair (*rhi, *rlo). The head product xh*yh is formed by splitting both
	// heads with the constant 2^27+1; the cross terms xh*yl and xl*yh are folded
	// into the tail, and the pair is renormalised before being stored. The
	// xl*yl term is not included.
	// The '*' tokens (pointer declarators, dereferences and multiplications)
	// had been lost from this definition and are restored here.
	void MulDD(double *rhi, double *rlo, double xh, double xl, double yh, double yl)
	{
	    double mh, ml;
	    double c = 134217729.0; // 1+2^27
	    double up, u1, u2, vp, v1, v2;

	    // Split xh into u1 + u2.
	    up = xh*c;
	    u1 = (xh - up) + up;
	    u2 = xh - u1;

	    // Split yh into v1 + v2.
	    vp = yh*c;
	    v1 = (yh - vp) + vp;
	    v2 = yh - v1;

	    mh = xh*yh;
	    // The accumulation order of the partial products is significant.
	    ml = (((u1*v1 - mh) + (u1*v2)) + (u2*v1)) + (u2*v2);
	    ml += xh*yl + xl*yh;

	    // Renormalise the (mh, ml) pair.
	    *rhi = mh + ml;
	    *rlo = (mh - (*rhi)) + ml;
	}

	// Adds the pair (xh, xl) to the pair (yh, yl) and returns the sum as a pair
	// (*rhi, *rlo). The heads are added first; the tail is rebuilt starting from
	// whichever head has the larger magnitude, then the pair is renormalised.
	// The pointer declarators and dereferences on rhi/rlo had been lost from
	// this definition and are restored here.
	void AddDD(double *rhi, double *rlo, double xh, double xl, double yh, double yl)
	{
	    double r, s;
	    r = xh + yh;
	    // Both alternatives are evaluated left to right; the operand order matters.
	    s = (fabs(xh) > fabs(yh)) ? (xh - r + yh + yl + xl) : (yh - r + xh + xl + yl);
	    *rhi = r + s;
	    *rlo = (r - (*rhi)) + s;
	}

	// Divides a by b and returns the quotient as a pair of doubles:
	//   *chi - the ordinarily rounded quotient a / b
	//   *clo - a correction obtained by multiplying *chi back by b (MulD),
	//          subtracting that from a (AddDD) and dividing the head of the
	//          remainder by b
	// The pointer declarators on chi/clo had been lost from this definition
	// and are restored here.
	void DivideDD(double *chi, double *clo, double a, double b)
	{
	    *chi = a / b;
	    double rhi, rlo;
	    // (rhi, rlo) = *chi * b
	    MulD(&rhi, &rlo, *chi, b);
	    // (rhi, rlo) = a - *chi * b
	    AddDD(&rhi, &rlo, -rhi, -rlo, a, 0.0);
	    *clo = rhi / b;
	}

	// These functions compare two floats/doubles. Since some platforms may choose to
	// flush denormals to zero before comparison, a comparison like a < b may give the wrong
	// result in "certain cases" where we do need the correct comparison result when operands
	// are denormals, so these functions compare floats/doubles using their signed integer/long int
	// representation. In other cases, when flushing to zero is fine, these should not be used.
	// Also, these functions don't check for NaNs and assume NaNs are handled separately as a
	// special edge case by the caller which calls these functions.
	// They return 0 if both are equal, 1 if x > y and -1 if x < y.

	inline
	int compareFloats(float x, float y)
	{
	int32f_t a, b;

	a.f = x;
	b.f = y;

	if( a.i & 0x80000000 )
	a.i = 0x80000000 - a.i;
	if( b.i & 0x80000000 )
	b.i = 0x80000000 - b.i;

	if( a.i == b.i )
	return 0;

	return a.i < b.i ? -1 : 1;
	}

	inline
	int compareDoubles(double x, double y)
	{
	int64d_t a, b;

	a.d = x;
	b.d = y;

	if( a.l & 0x8000000000000000LL )
	a.l = 0x8000000000000000LL - a.l;
	if( b.l & 0x8000000000000000LL )
	b.l = 0x8000000000000000LL - b.l;

	if( a.l == b.l )
	return 0;

	return a.l < b.l ? -1 : 1;
	}

	// Logs one header line for the function under test through vlog():
	// the function name, a precision tag chosen from float_size
	// ("fp64"/"fp32"/"fp16" for sizeof(cl_double)/sizeof(cl_float)/sizeof(cl_half))
	// and "rlx" when isFastRelaxed is non-zero (empty string otherwise).
	//
	// Any other float_size is logged as "unk". Previously the tag stayed NULL in
	// that case and the NULL pointer was handed to the %4s conversion.
	void logFunctionInfo(const char *fname, unsigned int float_size, unsigned int isFastRelaxed)
	{
	    char const *fpSizeStr = "unk";
	    char const *fpFastRelaxedStr = "";
	    switch (float_size) {
	    case sizeof(cl_double):
	        fpSizeStr = "fp64";
	        break;
	    case sizeof(cl_float):
	        fpSizeStr = "fp32";
	        break;
	    case sizeof(cl_half):
	        fpSizeStr = "fp16";
	        break;
	    default:
	        // Keep the "unk" fallback assigned above.
	        break;
	    }
	    if (isFastRelaxed) {
	        fpFastRelaxedStr = "rlx";
	    }
	    vlog("%15s %4s %4s",fname, fpSizeStr, fpFastRelaxedStr);
	}

	// Picks the error bound recorded in f that applies to the current run.
	// Two switches select the field: the relaxed argument and the global
	// gIsEmbedded flag.
	//   relaxed  -> relaxed_embedded_error (embedded) or relaxed_error
	//   !relaxed -> float_embedded_ulps    (embedded) or float_ulps
	float getAllowedUlpError(const Func *f, const bool relaxed)
	{
	    if (!relaxed)
	    {
	        if (gIsEmbedded)
	        {
	            return f->float_embedded_ulps;
	        }
	        return f->float_ulps;
	    }

	    if (gIsEmbedded)
	    {
	        return f->relaxed_embedded_error;
	    }
	    return f->relaxed_error;
	}