blob: ce2f2860d89e1262d14a700673b444439326bf22 [file] [log] [blame]
/*******************************************************************************
* Copyright 2012-2018 Intel Corporation
* All Rights Reserved.
*
* If this software was obtained under the Intel Simplified Software License,
* the following terms apply:
*
* The source code, information and material ("Material") contained herein is
* owned by Intel Corporation or its suppliers or licensors, and title to such
* Material remains with Intel Corporation or its suppliers or licensors. The
* Material contains proprietary information of Intel or its suppliers and
* licensors. The Material is protected by worldwide copyright laws and treaty
* provisions. No part of the Material may be used, copied, reproduced,
* modified, published, uploaded, posted, transmitted, distributed or disclosed
* in any way without Intel's prior express written permission. No license under
* any patent, copyright or other intellectual property rights in the Material
* is granted to or conferred upon you, either expressly, by implication,
* inducement, estoppel or otherwise. Any license under such intellectual
* property rights must be express and approved by Intel in writing.
*
* Unless otherwise agreed by Intel in writing, you may not remove or alter this
* notice or any other notice embedded in Materials by Intel or Intel's
* suppliers or licensors in any way.
*
*
* If this software was obtained under the Apache License, Version 2.0 (the
* "License"), the following terms apply:
*
* You may not use this file except in compliance with the License. You may
* obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0
*
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
*
* See the License for the specific language governing permissions and
* limitations under the License.
*******************************************************************************/
/*
// Purpose:
// Intel(R) Integrated Performance Primitives.
// BNU data type definition
//
//
//
*/
#if !defined(_CP_BNU_IMPL_H)
#define _CP_BNU_IMPL_H
#define BNU_CHUNK_64BIT (64)
#define BNU_CHUNK_32BIT (32)
/*
// define BNU chunk data type
*/
#if ((_IPP_ARCH == _IPP_ARCH_EM64T) || (_IPP_ARCH == _IPP_ARCH_LP64) || (_IPP_ARCH == _IPP_ARCH_LRB) || (_IPP_ARCH == _IPP_ARCH_LRB2))
typedef Ipp64u BNU_CHUNK_T;
typedef Ipp64s BNS_CHUNK_T;
#define BNU_CHUNK_LOG2 (6)
#define BNU_CHUNK_BITS BNU_CHUNK_64BIT
#else
typedef Ipp32u BNU_CHUNK_T;
typedef Ipp32s BNS_CHUNK_T;
#define BNU_CHUNK_LOG2 (5)
#define BNU_CHUNK_BITS BNU_CHUNK_32BIT
#endif
#define BNU_CHUNK_MASK (~(BNU_CHUNK_T)(0))
#if (BNU_CHUNK_BITS == BNU_CHUNK_64BIT)
#pragma message ("BNU_CHUNK_BITS = 64 bit")
#elif (BNU_CHUNK_BITS == BNU_CHUNK_32BIT)
#pragma message ("BNU_CHUNK_BITS = 32 bit")
#else
#error BNU_CHUNK_BITS should be either 64 or 32 bit!
#endif
#ifdef _MSC_VER
// #pragma warning( disable : 4127 4711 4206)
# pragma warning( disable : 4127)
#endif
/* user's API BNU chunk data type */
typedef Ipp32u API_BNU_CHUNK_T;
/* convert API_BNU_CHUNK_T (usual Ipp32u) length into the BNU_CHUNK_T length */
#define INTERNAL_BNU_LENGTH(apiLen) \
((apiLen) + sizeof(BNU_CHUNK_T)/sizeof(API_BNU_CHUNK_T) -1)/(sizeof(BNU_CHUNK_T)/sizeof(API_BNU_CHUNK_T))
/* Low and High parts of BNU_CHUNK_T value */
#define BNU_CHUNK_2H ((BNU_CHUNK_T)1 << (BNU_CHUNK_BITS/2))
#define LO_CHUNK(c) ((BNU_CHUNK_T)(c) & (BNU_CHUNK_2H - 1))
#define HI_CHUNK(c) ((BNU_CHUNK_T)(c) >> (BNU_CHUNK_BITS/2))
/* (carry,R) = A+B */
#define ADD_AB(CARRY,R, A,B) \
do { \
BNU_CHUNK_T __s = (A) + (B); \
(CARRY) = __s < (A); \
(R) = __s; \
} while(0)
/* (carry,R) = A+B+C */
#define ADD_ABC(CARRY,R, A,B,C) \
do { \
BNU_CHUNK_T __s = (A) + (B); \
BNU_CHUNK_T __t1= __s < (A); \
BNU_CHUNK_T __r = __s + (C); \
BNU_CHUNK_T __t2 = __r < __s; \
(CARRY) = __t1 + __t2; \
(R) = __r; \
} while(0)
/* (borrow,R) = A-B */
#define SUB_AB(BORROW,R, A,B) \
do { \
(BORROW) = (A)<(B); \
(R) = (A)-(B); \
} while(0)
/* (borrow,R) = A-B-C */
#define SUB_ABC(BORROW,R, A,B,C) \
do { \
BNU_CHUNK_T __s = (A) -( B); \
BNU_CHUNK_T __t1= __s > (A); \
BNU_CHUNK_T __r = __s - (C); \
BNU_CHUNK_T __t2 = __r > __s; \
(BORROW) = __t1 + __t2; \
(R) = __r; \
} while(0)
/* (RH,RL) = A*B */
#define MUL_AB(RH, RL, A, B) \
do { \
BNU_CHUNK_T __aL = LO_CHUNK((A)); \
BNU_CHUNK_T __aH = HI_CHUNK((A)); \
BNU_CHUNK_T __bL = LO_CHUNK((B)); \
BNU_CHUNK_T __bH = HI_CHUNK((B)); \
\
BNU_CHUNK_T __x0 = (BNU_CHUNK_T) __aL * __bL; \
BNU_CHUNK_T __x1 = (BNU_CHUNK_T) __aL * __bH; \
BNU_CHUNK_T __x2 = (BNU_CHUNK_T) __aH * __bL; \
BNU_CHUNK_T __x3 = (BNU_CHUNK_T) __aH * __bH; \
\
__x1 += HI_CHUNK(__x0); \
__x1 += __x2; \
if(__x1 < __x2) \
__x3 += BNU_CHUNK_2H; \
\
(RH) = __x3 + HI_CHUNK(__x1); \
(RL) = (__x1 << BNU_CHUNK_BITS/2) + LO_CHUNK(__x0); \
} while (0)
#endif /* _CP_BNU_IMPL_H */