cpp/ja/fast__math_8hpp_source.html

/*M///////////////////////////////////////////////////////////////////////////////////////


//


//  IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.


//


//  By downloading, copying, installing or using the software you agree to this license.


//  If you do not agree to this license, do not download, install,


//  copy or use the software.


//


//


//                          License Agreement


//                For Open Source Computer Vision Library


//


// Copyright (C) 2000-2008, Intel Corporation, all rights reserved.


// Copyright (C) 2009, Willow Garage Inc., all rights reserved.


// Copyright (C) 2013, OpenCV Foundation, all rights reserved.


// Copyright (C) 2015, Itseez Inc., all rights reserved.


// Third party copyrights are property of their respective owners.


//


// Redistribution and use in source and binary forms, with or without modification,


// are permitted provided that the following conditions are met:


//


//   * Redistribution's of source code must retain the above copyright notice,


//     this list of conditions and the following disclaimer.


//


//   * Redistribution's in binary form must reproduce the above copyright notice,


//     this list of conditions and the following disclaimer in the documentation


//     and/or other materials provided with the distribution.


//


//   * The name of the copyright holders may not be used to endorse or promote products


//     derived from this software without specific prior written permission.


//


// This software is provided by the copyright holders and contributors "as is" and


// any express or implied warranties, including, but not limited to, the implied


// warranties of merchantability and fitness for a particular purpose are disclaimed.


// In no event shall the Intel Corporation or contributors be liable for any direct,


// indirect, incidental, special, exemplary, or consequential damages


// (including, but not limited to, procurement of substitute goods or services;


// loss of use, data, or profits; or business interruption) however caused


// and on any theory of liability, whether in contract, strict liability,


// or tort (including negligence or otherwise) arising in any way out of


// the use of this software, even if advised of the possibility of such damage.


//


//M*/


#ifndef OPENCV_CORE_FAST_MATH_HPP


#define OPENCV_CORE_FAST_MATH_HPP


#include "opencv2/core/cvdef.h"


/****************************************************************************************\


*                                      fast math                                         *


\****************************************************************************************/


#ifdef __cplusplus


#  include <cmath>


#else


#  ifdef __BORLANDC__


#    include <fastmath.h>


#  else


#    include <math.h>


#  endif


#endif


#if defined(__CUDACC__)


// nothing, intrinsics/asm code is not supported


#else


#if ((defined _MSC_VER && defined _M_X64) \


|| (defined __GNUC__ && defined __x86_64__ && defined __SSE2__)) \


&& !defined(OPENCV_SKIP_INCLUDE_EMMINTRIN_H)


#include <emmintrin.h>


#endif


#if defined __PPC64__ && defined __GNUC__ && defined _ARCH_PWR8 \


&& !defined(OPENCV_SKIP_INCLUDE_ALTIVEC_H)


#include <altivec.h>


#undef vector


#undef bool


#undef pixel


#endif


#if defined(CV_INLINE_ROUND_FLT)


// user-specified version


// CV_INLINE_ROUND_DBL should be defined too


#elif defined __GNUC__ && defined __arm__ && (defined __ARM_PCS_VFP || defined __ARM_VFPV3__ || defined __ARM_NEON__) && !defined __SOFTFP__


// 1. general scheme


#define ARM_ROUND(_value, _asm_string) \


int res; \


float temp; \


CV_UNUSED(temp); \


__asm__(_asm_string : [res] "=r"
(res), [temp] "=w" (temp) : [value] "w" (_value)); \


return res


// 2. version for double


#ifdef __clang__


#define CV_INLINE_ROUND_DBL(value) ARM_ROUND(value, "vcvtr.s32.f64 %[temp], %[value] \n vmov %[res], %[temp]")


#else


#define CV_INLINE_ROUND_DBL(value) ARM_ROUND(value, "vcvtr.s32.f64 %[temp], %P[value] \n vmov %[res], %[temp]")


#endif


// 3. version for float


#define CV_INLINE_ROUND_FLT(value) ARM_ROUND(value, "vcvtr.s32.f32 %[temp], %[value]\n vmov %[res], %[temp]")


#elif defined __PPC64__ && defined __GNUC__ && defined _ARCH_PWR8


// P8 and newer machines can convert fp32/64 to int quickly.


#define CV_INLINE_ROUND_DBL(value) \


int out; \


double temp; \


__asm__( "fctiw %[temp],%[in]\n\tmfvsrwz %[out],%[temp]\n\t"
: [out] "=r" (out), [temp] "=d" (temp) : [in] "d" ((double)(value)) : ); \


return out;


// FP32 also works with FP64 routine above


#define CV_INLINE_ROUND_FLT(value) CV_INLINE_ROUND_DBL(value)


#endif


#ifdef CV_INLINE_ISINF_FLT


// user-specified version


// CV_INLINE_ISINF_DBL should be defined too


#elif defined __PPC64__ && defined _ARCH_PWR9 && defined(scalar_test_data_class)


#define CV_INLINE_ISINF_DBL(value) return scalar_test_data_class(value, 0x30);


#define CV_INLINE_ISINF_FLT(value) CV_INLINE_ISINF_DBL(value)


#endif


#ifdef CV_INLINE_ISNAN_FLT


// user-specified version


// CV_INLINE_ISNAN_DBL should be defined too


#elif defined __PPC64__ && defined _ARCH_PWR9 && defined(scalar_test_data_class)


#define CV_INLINE_ISNAN_DBL(value) return scalar_test_data_class(value, 0x40);


#define CV_INLINE_ISNAN_FLT(value) CV_INLINE_ISNAN_DBL(value)


#endif


#if !defined(OPENCV_USE_FASTMATH_BUILTINS) \


&& ( \


defined(__x86_64__) || defined(__i686__) \


|| defined(__arm__) \


|| defined(__PPC64__) \


)


/* Let builtin C math functions when available. Dedicated hardware is available to


round and convert FP values. */


#define OPENCV_USE_FASTMATH_BUILTINS 1


#endif


/* Enable builtin math functions if possible, desired, and available.


Note, not all math functions inline equally. E.g lrint will not inline


without the -fno-math-errno option. */


#if defined(CV_ICC)


// nothing


#elif defined(OPENCV_USE_FASTMATH_BUILTINS) && OPENCV_USE_FASTMATH_BUILTINS


#if defined(__clang__)


#define CV__FASTMATH_ENABLE_CLANG_MATH_BUILTINS


#if !defined(CV_INLINE_ISNAN_DBL) && __has_builtin(__builtin_isnan)


#define CV_INLINE_ISNAN_DBL(value) return __builtin_isnan(value);


#endif


#if !defined(CV_INLINE_ISNAN_FLT) && __has_builtin(__builtin_isnan)


#define CV_INLINE_ISNAN_FLT(value) return __builtin_isnan(value);


#endif


#if !defined(CV_INLINE_ISINF_DBL) && __has_builtin(__builtin_isinf)


#define CV_INLINE_ISINF_DBL(value) return __builtin_isinf(value);


#endif


#if !defined(CV_INLINE_ISINF_FLT) && __has_builtin(__builtin_isinf)


#define CV_INLINE_ISINF_FLT(value) return __builtin_isinf(value);


#endif


#elif defined(__GNUC__)


#define CV__FASTMATH_ENABLE_GCC_MATH_BUILTINS


#if !defined(CV_INLINE_ISNAN_DBL)


#define CV_INLINE_ISNAN_DBL(value) return __builtin_isnan(value);


#endif


#if !defined(CV_INLINE_ISNAN_FLT)


#define CV_INLINE_ISNAN_FLT(value) return __builtin_isnanf(value);


#endif


#if !defined(CV_INLINE_ISINF_DBL)


#define CV_INLINE_ISINF_DBL(value) return __builtin_isinf(value);


#endif


#if !defined(CV_INLINE_ISINF_FLT)


#define CV_INLINE_ISINF_FLT(value) return __builtin_isinff(value);


#endif


#elif defined(_MSC_VER)


#if !defined(CV_INLINE_ISNAN_DBL)


#define CV_INLINE_ISNAN_DBL(value) return isnan(value);


#endif


#if !defined(CV_INLINE_ISNAN_FLT)


#define CV_INLINE_ISNAN_FLT(value) return isnan(value);


#endif


#if !defined(CV_INLINE_ISINF_DBL)


#define CV_INLINE_ISINF_DBL(value) return isinf(value);


#endif


#if !defined(CV_INLINE_ISINF_FLT)


#define CV_INLINE_ISINF_FLT(value) return isinf(value);


#endif


#endif


#endif


#endif

// defined(__CUDACC__)


CV_INLINE
int


cvRound(
double
value )


{


#if defined CV_INLINE_ROUND_DBL


CV_INLINE_ROUND_DBL(value);


#elif ((defined _MSC_VER && defined _M_X64) || (defined __GNUC__ && defined __x86_64__ \


&& defined __SSE2__ && !defined __APPLE__) || CV_SSE2) \


&& !defined(__CUDACC__)


__m128d t = _mm_set_sd( value );


return
_mm_cvtsd_si32(t);


#elif defined _MSC_VER && defined _M_IX86


int
t;


__asm


{


fld value;


fistp t;


}


return
t;


#elif defined CV_ICC || defined __GNUC__


return
(int)(lrint(value));


#else


/* it's ok if round does not comply with IEEE754 standard;


the tests should allow +/-1 difference when the tested functions use round */


return
(int)(value + (value >= 0 ? 0.5 : -0.5));


#endif


}


CV_INLINE
int
cvFloor(
double
value )


{


#if (defined CV__FASTMATH_ENABLE_GCC_MATH_BUILTINS || defined CV__FASTMATH_ENABLE_CLANG_MATH_BUILTINS) \


&& ( \


defined(__PPC64__) \


)


return
__builtin_floor(value);


#else


int
i = (int)value;


return
i - (i > value);


#endif


}


CV_INLINE
int
cvCeil(
double
value )


{


#if (defined CV__FASTMATH_ENABLE_GCC_MATH_BUILTINS || defined CV__FASTMATH_ENABLE_CLANG_MATH_BUILTINS) \


&& ( \


defined(__PPC64__) \


)


return
__builtin_ceil(value);


#else


int
i = (int)value;


return
i + (i < value);


#endif


}


CV_INLINE
int
cvIsNaN(
double
value )


{


#if defined CV_INLINE_ISNAN_DBL


CV_INLINE_ISNAN_DBL(value);


#else


Cv64suf
ieee754;


ieee754.f = value;


return
((unsigned)(ieee754.u >> 32) & 0x7fffffff) +


((unsigned)ieee754.u != 0) > 0x7ff00000;


#endif


}


CV_INLINE
int
cvIsInf(
double
value )


{


#if defined CV_INLINE_ISINF_DBL


CV_INLINE_ISINF_DBL(value);


#elif defined(__x86_64__) || defined(_M_X64) || defined(__aarch64__) || defined(_M_ARM64) || defined(__PPC64__)


Cv64suf
ieee754;


ieee754.f = value;


return
(ieee754.u & 0x7fffffff00000000) ==


0x7ff0000000000000;


#else


Cv64suf
ieee754;


ieee754.f = value;


return
((unsigned)(ieee754.u >> 32) & 0x7fffffff) == 0x7ff00000 &&


(unsigned)ieee754.u == 0;


#endif


}


#ifdef __cplusplus


CV_INLINE
int
cvRound(float
value)


{


#if defined CV_INLINE_ROUND_FLT


CV_INLINE_ROUND_FLT(value);


#elif ((defined _MSC_VER && defined _M_X64) || (defined __GNUC__ && defined __x86_64__ \


&& defined __SSE2__ && !defined __APPLE__) || CV_SSE2) \


&& !defined(__CUDACC__)


__m128 t = _mm_set_ss( value );


return
_mm_cvtss_si32(t);


#elif defined _MSC_VER && defined _M_IX86


int
t;


__asm


{


fld value;


fistp t;


}


return
t;


#elif defined CV_ICC || defined __GNUC__


return
(int)(lrintf(value));


#else


/* it's ok if round does not comply with IEEE754 standard;


the tests should allow +/-1 difference when the tested functions use round */


return
(int)(value + (value >= 0 ? 0.5f : -0.5f));


#endif


}


CV_INLINE
int
cvRound(
int
value )


{


return
value;


}


CV_INLINE
int
cvFloor(
float
value )


{


#if (defined CV__FASTMATH_ENABLE_GCC_MATH_BUILTINS || defined CV__FASTMATH_ENABLE_CLANG_MATH_BUILTINS) \


&& ( \


defined(__PPC64__) \


)


return
__builtin_floorf(value);


#else


int
i = (int)value;


return
i - (i > value);


#endif


}


CV_INLINE
int
cvFloor(
int
value )


{


return
value;


}


CV_INLINE
int
cvCeil(
float
value )


{


#if (defined CV__FASTMATH_ENABLE_GCC_MATH_BUILTINS || defined CV__FASTMATH_ENABLE_CLANG_MATH_BUILTINS) \


&& ( \


defined(__PPC64__) \


)


return
__builtin_ceilf(value);


#else


int
i = (int)value;


return
i + (i < value);


#endif


}


CV_INLINE
int
cvCeil(
int
value )


{


return
value;


}


CV_INLINE
int
cvIsNaN(
float
value )


{


#if defined CV_INLINE_ISNAN_FLT


CV_INLINE_ISNAN_FLT(value);


#else


Cv32suf
ieee754;


ieee754.f = value;


return
(ieee754.u & 0x7fffffff) > 0x7f800000;


#endif


}


CV_INLINE
int
cvIsInf(
float
value )


{


#if defined CV_INLINE_ISINF_FLT


CV_INLINE_ISINF_FLT(value);


#else


Cv32suf
ieee754;


ieee754.f = value;


return
(ieee754.u & 0x7fffffff) == 0x7f800000;


#endif


}


#endif

// __cplusplus


#endif


cvIsNaN

CV_INLINE int cvIsNaN(double value)

Determines if the argument is Not A Number.


Definition:
fast_math.hpp:273


cvIsInf

CV_INLINE int cvIsInf(double value)

Determines if the argument is Infinity.


Definition:
fast_math.hpp:291


cvRound

CV_INLINE int cvRound(double value)

Rounds floating-point number to the nearest integer


Definition:
fast_math.hpp:200


cvCeil

CV_INLINE int cvCeil(double value)

Rounds floating-point number to the nearest integer not smaller than the original.


Definition:
fast_math.hpp:254


cvFloor

CV_INLINE int cvFloor(double value)

Rounds floating-point number to the nearest integer not larger than the original.


Definition:
fast_math.hpp:234


Cv32suf


Definition:
cvdef.h:382


Cv64suf


Definition:
cvdef.h:390