include/core/SkMath.h - skia - Git at Google


 /*
  * Copyright 2006 The Android Open Source Project
  *
  * Use of this source code is governed by a BSD-style license that can be
  * found in the LICENSE file.
  */


 #ifndef SkMath_DEFINED
 #define SkMath_DEFINED

 #include "SkTypes.h"

 // 64bit -> 32bit utilities

 /**
  *  Reports whether a 64bit value is exactly representable as a signed 32bit
  *  integer, i.e. whether it survives a round trip through int32_t unchanged.
  */
 static inline bool sk_64_isS32(int64_t value) {
     const int32_t narrowed = (int32_t)value;
     return value == narrowed;
 }

 /**
  *  Narrows a 64bit value to signed 32bits. Debug builds assert that the
  *  argument fits exactly; release builds perform no check, and the result
  *  for an argument that does not fit is undefined.
  */
 static inline int32_t sk_64_asS32(int64_t value) {
     SkASSERT(sk_64_isS32(value));
     const int32_t narrowed = (int32_t)value;
     return narrowed;
 }

 // Multiplies two values as 64bit integers. Because the parameters are
 // int64_t, 32bit arguments are widened at the call site, so callers do not
 // have to write the (int64_t)a * b cast themselves.
 static inline int64_t sk_64_mul(int64_t a, int64_t b) {
     int64_t product = a;
     product *= b;
     return product;
 }

 ///////////////////////////////////////////////////////////////////////////////

 /**
  *  Returns (numer1 * numer2) / denom, carrying the intermediate product in
  *  64 bits. Passing denom == 0 is an error. A result that does not fit in
  *  32 bits gets no special handling.
  */
 static inline int32_t SkMulDiv(int32_t numer1, int32_t numer2, int32_t denom) {
     SkASSERT(denom);

     const int64_t product = sk_64_mul(numer1, numer2);
     const int64_t quotient = product / denom;
     return sk_64_asS32(quotient);
 }

 /**
  *  Computes (numer << shift) / denom in full 64 intermediate precision.
  *  It is an error for denom to be 0. There is no special handling if
  *  the result overflows 32bits.
  *
  *  Only declared here.
  */
 int32_t SkDivBits(int32_t numer, int32_t denom, int shift);

 /**
  *  Return the integer square root of value, with a bias of bitBias.
  *
  *  Only declared here.
  *  NOTE(review): the exact meaning of bitBias is not visible from this
  *  header -- confirm against the implementation.
  */
 int32_t SkSqrtBits(int32_t value, int bitBias);

 /** Return the integer square root of n, treated as a SkFixed (16.16).
  *  Expands to a call to SkSqrtBits with a bitBias of 15.
  */
 #define SkSqrt32(n)         SkSqrtBits(n, 15)

 //! Returns the number of leading zero bits (0...32).
 //! Only declared here. SkCLZ maps to this function when neither the MSVC
 //! nor the GCC/Clang intrinsic path is selected.
 int SkCLZ_portable(uint32_t);

 /*
  *  SkCLZ(mask) returns the number of leading zero bits in a 32bit value,
  *  and 32 when mask is 0. A definition of SkCLZ made before this point takes
  *  precedence; otherwise a compiler intrinsic is used when one is available
  *  and SkCLZ_portable is the fallback.
  */
 #ifndef SkCLZ
     #if defined(_MSC_VER) && _MSC_VER >= 1400
         #include <intrin.h>

         static inline int SkCLZ(uint32_t mask) {
             if (mask) {
                 // _BitScanReverse takes an unsigned long*. Spelling the type
                 // out avoids depending on DWORD, which <intrin.h> does not
                 // define.
                 unsigned long index = 0;
                 _BitScanReverse(&index, mask);
                 // index is the position of the highest set bit (0...31);
                 // XOR with 31 converts it into the leading-zero count.
                 return (int)(index ^ 0x1F);
             } else {
                 return 32;
             }
         }
     #elif defined(SK_CPU_ARM32) || defined(__GNUC__) || defined(__clang__)
         static inline int SkCLZ(uint32_t mask) {
             // __builtin_clz(0) is undefined, so we have to detect that case.
             return mask ? __builtin_clz(mask) : 32;
         }
     #else
         #define SkCLZ(x)    SkCLZ_portable(x)
     #endif
 #endif

 /**
  *  Clamps negative values to zero without compares or branches: yields
  *  value when it is non-negative and 0 otherwise.
  */
 static inline int SkClampPos(int value) {
     // value >> 31 is all ones for a negative value and zero otherwise
     // (assuming a 32bit int and an arithmetic right shift), so masking with
     // its complement keeps non-negative inputs and clears negative ones.
     const int signMask = value >> 31;
     return ~signMask & value;
 }

 /** Pins an integer into the inclusive range [0...max].
  *  @param value    The value to pin
  *  @param max      The upper bound; must not be negative
  *  @return 0 if value < 0, max if value > max, else value
  */
 static inline int SkClampMax(int value, int max) {
     // the upper bound must not be negative
     SkASSERT(max >= 0);
     const int nonNegative = (value < 0) ? 0 : value;
     return (nonNegative > max) ? max : nonNegative;
 }

 /**
  *  Rounds value up to a power of 2: returns the smallest power-of-2 that is
  *  >= value, so a value that is already a power of 2 comes back unchanged.
  *  The result is undefined if value is <= 0.
  */
 static inline int SkNextPow2(int value) {
     SkASSERT(value > 0);
     // Number of bits needed to represent value - 1.
     const int bitsNeeded = 32 - SkCLZ(value - 1);
     return 1 << bitsNeeded;
 }

 /**
  *  Returns log2 of value after rounding value up to the next power of 2.
  *  Passing 0 is undefined. Examples:
  *  SkNextLog2(1) -> 0
  *  SkNextLog2(2) -> 1
  *  SkNextLog2(3) -> 2
  *  SkNextLog2(4) -> 2
  *  SkNextLog2(5) -> 3
  */
 static inline int SkNextLog2(uint32_t value) {
     SkASSERT(value != 0);
     const int leadingZeros = SkCLZ(value - 1);
     return 32 - leadingZeros;
 }

 /**
  *  Reports whether value is a power of 2. There is no explicit check for
  *  value <= 0.
  */
 static inline bool SkIsPow2(int value) {
     // Clearing the lowest set bit leaves zero exactly when at most one bit
     // was set.
     const int withoutLowestBit = value & (value - 1);
     return 0 == withoutLowestBit;
 }

 ///////////////////////////////////////////////////////////////////////////////

 /**
  *  SkMulS16(a, b) yields a * b under the precondition that both operands fit
  *  in int16_t. That precondition allows a faster multiply instruction on
  *  some architectures.
  */
 #if defined(SK_ARM_HAS_EDSP)
     // ARM with EDSP: issue a single smulbb instruction.
     static inline int32_t SkMulS16(S16CPU x, S16CPU y) {
         SkASSERT((int16_t)x == x);
         SkASSERT((int16_t)y == y);
         int32_t result;
         asm("smulbb %0, %1, %2 \n"
             : "=r"(result)
             : "r"(x), "r"(y)
             );
         return result;
     }
 #elif defined(SK_DEBUG)
     // Debug builds: a real function so the int16_t range can be asserted.
     static inline int32_t SkMulS16(S16CPU x, S16CPU y) {
         SkASSERT((int16_t)x == x);
         SkASSERT((int16_t)y == y);
         const int32_t result = x * y;
         return result;
     }
 #else
     // Everything else: a plain multiply with no range checking.
     #define SkMulS16(x, y)  ((x) * (y))
 #endif

 /**
  *  Returns a*b/((1 << shift) - 1), rounding any fractional bits.
  *  Preconditions: a and b are unsigned and <= 32767, and 0 < shift <= 8.
  */
 static inline unsigned SkMul16ShiftRound(U16CPU a, U16CPU b, int shift) {
     SkASSERT(a <= 32767);
     SkASSERT(b <= 32767);
     SkASSERT(shift > 0 && shift <= 8);
     // Half of (1 << shift), added so the final shift rounds.
     const int roundingBias = 1 << (shift - 1);
     unsigned prod = SkMulS16(a, b) + roundingBias;
     prod += prod >> shift;
     return prod >> shift;
 }

 /**
  *  Returns a*b/255, rounding any fractional bits.
  *  Preconditions: a and b are unsigned and <= 32767.
  */
 static inline U8CPU SkMulDiv255Round(U16CPU a, U16CPU b) {
     SkASSERT(a <= 32767);
     SkASSERT(b <= 32767);
     // 128 is half of 256, added so the final shift by 8 rounds.
     unsigned prod = SkMulS16(a, b) + 128;
     prod += prod >> 8;
     return prod >> 8;
 }

 /**
  *  Divides numer by denom, writing the quotient to *div and the remainder
  *  to *mod, each converted to Out.
  */
 template <typename In, typename Out>
 inline void SkTDivMod(In numer, In denom, Out* div, Out* mod) {
 #if defined(SK_CPU_ARM32)
     // Deriving the remainder from the quotient, instead of using % as the
     // generic path does, keeps GCC from emitting a div call followed by a
     // separate divmod call. This is as fast as calling __aeabi_[u]idivmod
     // by hand and benches at around 2x the speed of the generic path.
     const In quotient = numer / denom;
     *div = static_cast<Out>(quotient);
     *mod = static_cast<Out>(numer - quotient * denom);
 #else
     // On x86 the / and % pair becomes a single idiv.
     *div = static_cast<Out>(numer / denom);
     *mod = static_cast<Out>(numer % denom);
 #endif
 }

 #endif

	/*
	* Copyright 2006 The Android Open Source Project
	*
	* Use of this source code is governed by a BSD-style license that can be
	* found in the LICENSE file.
	*/


	#ifndef SkMath_DEFINED
	#define SkMath_DEFINED

	#include "SkTypes.h"

	// 64bit -> 32bit utilities

	/**
	* Reports whether a 64bit value is exactly representable as a signed 32bit
	* integer, i.e. whether it survives a round trip through int32_t unchanged.
	*/
	static inline bool sk_64_isS32(int64_t value) {
	    const int32_t narrowed = (int32_t)value;
	    return value == narrowed;
	}

	/**
	* Narrows a 64bit value to signed 32bits. Debug builds assert that the
	* argument fits exactly; release builds perform no check, and the result
	* for an argument that does not fit is undefined.
	*/
	static inline int32_t sk_64_asS32(int64_t value) {
	    SkASSERT(sk_64_isS32(value));
	    const int32_t narrowed = (int32_t)value;
	    return narrowed;
	}

	// Multiplies two values as 64bit integers. Because the parameters are
	// int64_t, 32bit arguments are widened at the call site, so callers do not
	// have to write the (int64_t)a * b cast themselves.
	static inline int64_t sk_64_mul(int64_t a, int64_t b) {
	    int64_t product = a;
	    product *= b;
	    return product;
	}

	///////////////////////////////////////////////////////////////////////////////

	/**
	* Returns (numer1 * numer2) / denom, carrying the intermediate product in
	* 64 bits. Passing denom == 0 is an error. A result that does not fit in
	* 32 bits gets no special handling.
	*/
	static inline int32_t SkMulDiv(int32_t numer1, int32_t numer2, int32_t denom) {
	    SkASSERT(denom);

	    const int64_t product = sk_64_mul(numer1, numer2);
	    const int64_t quotient = product / denom;
	    return sk_64_asS32(quotient);
	}

	/**
	* Computes (numer << shift) / denom in full 64 intermediate precision.
	* It is an error for denom to be 0. There is no special handling if
	* the result overflows 32bits.
	*
	* Only declared here.
	*/
	int32_t SkDivBits(int32_t numer, int32_t denom, int shift);

	/**
	* Return the integer square root of value, with a bias of bitBias.
	*
	* Only declared here.
	* NOTE(review): the exact meaning of bitBias is not visible from this
	* header -- confirm against the implementation.
	*/
	int32_t SkSqrtBits(int32_t value, int bitBias);

	/** Return the integer square root of n, treated as a SkFixed (16.16).
	* Expands to a call to SkSqrtBits with a bitBias of 15.
	*/
	#define SkSqrt32(n) SkSqrtBits(n, 15)

	//! Returns the number of leading zero bits (0...32).
	//! Only declared here. SkCLZ maps to this function when neither the MSVC
	//! nor the GCC/Clang intrinsic path is selected.
	int SkCLZ_portable(uint32_t);

	/*
	* SkCLZ(mask) returns the number of leading zero bits in a 32bit value,
	* and 32 when mask is 0. A definition of SkCLZ made before this point takes
	* precedence; otherwise a compiler intrinsic is used when one is available
	* and SkCLZ_portable is the fallback.
	*/
	#ifndef SkCLZ
	    #if defined(_MSC_VER) && _MSC_VER >= 1400
	        #include <intrin.h>

	        static inline int SkCLZ(uint32_t mask) {
	            if (mask) {
	                // _BitScanReverse takes an unsigned long*. Spelling the
	                // type out avoids depending on DWORD, which <intrin.h>
	                // does not define.
	                unsigned long index = 0;
	                _BitScanReverse(&index, mask);
	                // index is the position of the highest set bit (0...31);
	                // XOR with 31 converts it into the leading-zero count.
	                return (int)(index ^ 0x1F);
	            } else {
	                return 32;
	            }
	        }
	    #elif defined(SK_CPU_ARM32) || defined(__GNUC__) || defined(__clang__)
	        static inline int SkCLZ(uint32_t mask) {
	            // __builtin_clz(0) is undefined, so we have to detect that case.
	            return mask ? __builtin_clz(mask) : 32;
	        }
	    #else
	        #define SkCLZ(x) SkCLZ_portable(x)
	    #endif
	#endif

	/**
	* Clamps negative values to zero without compares or branches: yields
	* value when it is non-negative and 0 otherwise.
	*/
	static inline int SkClampPos(int value) {
	    // value >> 31 is all ones for a negative value and zero otherwise
	    // (assuming a 32bit int and an arithmetic right shift), so masking with
	    // its complement keeps non-negative inputs and clears negative ones.
	    const int signMask = value >> 31;
	    return ~signMask & value;
	}

	/** Pins an integer into the inclusive range [0...max].
	* @param value The value to pin
	* @param max The upper bound; must not be negative
	* @return 0 if value < 0, max if value > max, else value
	*/
	static inline int SkClampMax(int value, int max) {
	    // the upper bound must not be negative
	    SkASSERT(max >= 0);
	    const int nonNegative = (value < 0) ? 0 : value;
	    return (nonNegative > max) ? max : nonNegative;
	}

	/**
	* Rounds value up to a power of 2: returns the smallest power-of-2 that is
	* >= value, so a value that is already a power of 2 comes back unchanged.
	* The result is undefined if value is <= 0.
	*/
	static inline int SkNextPow2(int value) {
	    SkASSERT(value > 0);
	    // Number of bits needed to represent value - 1.
	    const int bitsNeeded = 32 - SkCLZ(value - 1);
	    return 1 << bitsNeeded;
	}

	/**
	* Returns log2 of value after rounding value up to the next power of 2.
	* Passing 0 is undefined. Examples:
	* SkNextLog2(1) -> 0
	* SkNextLog2(2) -> 1
	* SkNextLog2(3) -> 2
	* SkNextLog2(4) -> 2
	* SkNextLog2(5) -> 3
	*/
	static inline int SkNextLog2(uint32_t value) {
	    SkASSERT(value != 0);
	    const int leadingZeros = SkCLZ(value - 1);
	    return 32 - leadingZeros;
	}

	/**
	* Reports whether value is a power of 2. There is no explicit check for
	* value <= 0.
	*/
	static inline bool SkIsPow2(int value) {
	    // Clearing the lowest set bit leaves zero exactly when at most one bit
	    // was set.
	    const int withoutLowestBit = value & (value - 1);
	    return 0 == withoutLowestBit;
	}

	///////////////////////////////////////////////////////////////////////////////

	/**
	* SkMulS16(a, b) yields a * b under the precondition that both operands fit
	* in int16_t. That precondition allows a faster multiply instruction on
	* some architectures.
	*/
	#if defined(SK_ARM_HAS_EDSP)
	    // ARM with EDSP: issue a single smulbb instruction.
	    static inline int32_t SkMulS16(S16CPU x, S16CPU y) {
	        SkASSERT((int16_t)x == x);
	        SkASSERT((int16_t)y == y);
	        int32_t result;
	        asm("smulbb %0, %1, %2 \n"
	            : "=r"(result)
	            : "r"(x), "r"(y)
	            );
	        return result;
	    }
	#elif defined(SK_DEBUG)
	    // Debug builds: a real function so the int16_t range can be asserted.
	    static inline int32_t SkMulS16(S16CPU x, S16CPU y) {
	        SkASSERT((int16_t)x == x);
	        SkASSERT((int16_t)y == y);
	        const int32_t result = x * y;
	        return result;
	    }
	#else
	    // Everything else: a plain multiply with no range checking.
	    #define SkMulS16(x, y) ((x) * (y))
	#endif

	/**
	* Returns a*b/((1 << shift) - 1), rounding any fractional bits.
	* Preconditions: a and b are unsigned and <= 32767, and 0 < shift <= 8.
	*/
	static inline unsigned SkMul16ShiftRound(U16CPU a, U16CPU b, int shift) {
	    SkASSERT(a <= 32767);
	    SkASSERT(b <= 32767);
	    SkASSERT(shift > 0 && shift <= 8);
	    // Half of (1 << shift), added so the final shift rounds.
	    const int roundingBias = 1 << (shift - 1);
	    unsigned prod = SkMulS16(a, b) + roundingBias;
	    prod += prod >> shift;
	    return prod >> shift;
	}

	/**
	* Returns a*b/255, rounding any fractional bits.
	* Preconditions: a and b are unsigned and <= 32767.
	*/
	static inline U8CPU SkMulDiv255Round(U16CPU a, U16CPU b) {
	    SkASSERT(a <= 32767);
	    SkASSERT(b <= 32767);
	    // 128 is half of 256, added so the final shift by 8 rounds.
	    unsigned prod = SkMulS16(a, b) + 128;
	    prod += prod >> 8;
	    return prod >> 8;
	}

	/**
	* Stores numer/denom and numer%denom into div and mod respectively, each
	* converted to Out.
	*/
	template <typename In, typename Out>
	inline void SkTDivMod(In numer, In denom, Out* div, Out* mod) {
	#ifdef SK_CPU_ARM32
	    // If we wrote this as in the else branch, GCC won't fuse the two into one
	    // divmod call, but rather a div call followed by a divmod. Silly! This
	    // version is just as fast as calling __aeabi_[u]idivmod manually, but with
	    // prettier code.
	    //
	    // This benches as around 2x faster than the code in the else branch.
	    const In d = numer/denom;
	    *div = static_cast<Out>(d);
	    // Remainder derived from the quotient: numer - d*denom. The result is
	    // stored through the mod pointer, not assigned to the pointer itself.
	    *mod = static_cast<Out>(numer - d*denom);
	#else
	    // On x86 this will just be a single idiv.
	    *div = static_cast<Out>(numer/denom);
	    *mod = static_cast<Out>(numer%denom);
	#endif
	}

	#endif