1 /*******************************************************************************
2 * Copyright 2012-2018 Intel Corporation
3 * All Rights Reserved.
4 *
5 * If this  software was obtained  under the  Intel Simplified  Software License,
6 * the following terms apply:
7 *
8 * The source code,  information  and material  ("Material") contained  herein is
9 * owned by Intel Corporation or its  suppliers or licensors,  and  title to such
10 * Material remains with Intel  Corporation or its  suppliers or  licensors.  The
11 * Material  contains  proprietary  information  of  Intel or  its suppliers  and
12 * licensors.  The Material is protected by  worldwide copyright  laws and treaty
13 * provisions.  No part  of  the  Material   may  be  used,  copied,  reproduced,
14 * modified, published,  uploaded, posted, transmitted,  distributed or disclosed
15 * in any way without Intel's prior express written permission.  No license under
16 * any patent,  copyright or other  intellectual property rights  in the Material
17 * is granted to  or  conferred  upon  you,  either   expressly,  by implication,
18 * inducement,  estoppel  or  otherwise.  Any  license   under such  intellectual
19 * property rights must be express and approved by Intel in writing.
20 *
21 * Unless otherwise agreed by Intel in writing,  you may not remove or alter this
22 * notice or  any  other  notice   embedded  in  Materials  by  Intel  or Intel's
23 * suppliers or licensors in any way.
24 *
25 *
26 * If this  software  was obtained  under the  Apache License,  Version  2.0 (the
27 * "License"), the following terms apply:
28 *
29 * You may  not use this  file except  in compliance  with  the License.  You may
30 * obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0
31 *
32 *
33 * Unless  required  by   applicable  law  or  agreed  to  in  writing,  software
34 * distributed under the License  is distributed  on an  "AS IS"  BASIS,  WITHOUT
35 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
36 *
37 * See the   License  for the   specific  language   governing   permissions  and
38 * limitations under the License.
39 *******************************************************************************/
40 
41 /*
42 //  Purpose:
43 //     Intel(R) Integrated Performance Primitives.
44 //     BNU data type definition
45 //
46 //
47 //
48 */
49 
50 #if !defined(_CP_BNU_IMPL_H)
51 #define _CP_BNU_IMPL_H
52 
53 #define BNU_CHUNK_64BIT        (64)
54 #define BNU_CHUNK_32BIT        (32)
55 
56 
57 /*
58 // define BNU chunk data type
59 */
60 #if ((_IPP_ARCH == _IPP_ARCH_EM64T) || (_IPP_ARCH == _IPP_ARCH_LP64) || (_IPP_ARCH == _IPP_ARCH_LRB) || (_IPP_ARCH == _IPP_ARCH_LRB2))
61    typedef Ipp64u BNU_CHUNK_T;
62    typedef Ipp64s BNS_CHUNK_T;
63    #define BNU_CHUNK_LOG2  (6)
64    #define BNU_CHUNK_BITS  BNU_CHUNK_64BIT
65 
66 #else
67    typedef Ipp32u BNU_CHUNK_T;
68    typedef Ipp32s BNS_CHUNK_T;
69    #define BNU_CHUNK_LOG2  (5)
70    #define BNU_CHUNK_BITS  BNU_CHUNK_32BIT
71 #endif
72 
73 #define BNU_CHUNK_MASK        (~(BNU_CHUNK_T)(0))
74 
75 #if (BNU_CHUNK_BITS == BNU_CHUNK_64BIT)
76    #pragma message ("BNU_CHUNK_BITS = 64 bit")
77 #elif (BNU_CHUNK_BITS == BNU_CHUNK_32BIT)
78    #pragma message ("BNU_CHUNK_BITS = 32 bit")
79 #else
80    #error BNU_CHUNK_BITS should be either 64 or 32 bit!
81 #endif
82 
83 
84 #ifdef _MSC_VER
85 //  #pragma warning( disable : 4127 4711 4206)
86 #  pragma warning( disable : 4127)
87 #endif
88 
89 /* user's API BNU chunk data type */
90 typedef Ipp32u API_BNU_CHUNK_T;
91 
92 /* convert API_BNU_CHUNK_T (usual Ipp32u) length into the BNU_CHUNK_T length */
93 #define INTERNAL_BNU_LENGTH(apiLen) \
94    ((apiLen) + sizeof(BNU_CHUNK_T)/sizeof(API_BNU_CHUNK_T) -1)/(sizeof(BNU_CHUNK_T)/sizeof(API_BNU_CHUNK_T))
95 
96 /* Low and High parts of BNU_CHUNK_T value */
97 #define BNU_CHUNK_2H ((BNU_CHUNK_T)1 << (BNU_CHUNK_BITS/2))
98 #define LO_CHUNK(c)  ((BNU_CHUNK_T)(c) & (BNU_CHUNK_2H - 1))
99 #define HI_CHUNK(c)  ((BNU_CHUNK_T)(c) >> (BNU_CHUNK_BITS/2))
100 
101 /* (carry,R) = A+B */
102 #define ADD_AB(CARRY,R, A,B)     \
103 do {                             \
104    BNU_CHUNK_T __s = (A) + (B);  \
105    (CARRY) = __s < (A);          \
106    (R) = __s;                    \
107 } while(0)
108 
109 /* (carry,R) = A+B+C */
110 #define ADD_ABC(CARRY,R, A,B,C)  \
111 do {                             \
112    BNU_CHUNK_T __s = (A) + (B);  \
113    BNU_CHUNK_T __t1= __s < (A);  \
114    BNU_CHUNK_T __r = __s + (C);  \
115    BNU_CHUNK_T __t2 = __r < __s; \
116    (CARRY) = __t1 + __t2;        \
117    (R) = __r;                    \
118 } while(0)
119 
120 /* (borrow,R) = A-B */
121 #define SUB_AB(BORROW,R, A,B)  \
122 do {                          \
123    (BORROW) = (A)<(B);        \
124    (R) = (A)-(B);             \
125 } while(0)
126 
127 /* (borrow,R) = A-B-C */
128 #define SUB_ABC(BORROW,R, A,B,C)  \
129 do {                             \
130    BNU_CHUNK_T __s = (A) -( B);  \
131    BNU_CHUNK_T __t1= __s > (A);  \
132    BNU_CHUNK_T __r = __s - (C);  \
133    BNU_CHUNK_T __t2 = __r > __s; \
134    (BORROW) = __t1 + __t2;       \
135    (R) = __r;                    \
136 } while(0)
137 
138 /* (RH,RL) = A*B */
139 #define MUL_AB(RH, RL, A, B)  \
140    do {                       \
141    BNU_CHUNK_T __aL = LO_CHUNK((A));   \
142    BNU_CHUNK_T __aH = HI_CHUNK((A));   \
143    BNU_CHUNK_T __bL = LO_CHUNK((B));   \
144    BNU_CHUNK_T __bH = HI_CHUNK((B));   \
145    \
146    BNU_CHUNK_T __x0 = (BNU_CHUNK_T) __aL * __bL;   \
147    BNU_CHUNK_T __x1 = (BNU_CHUNK_T) __aL * __bH;   \
148    BNU_CHUNK_T __x2 = (BNU_CHUNK_T) __aH * __bL;   \
149    BNU_CHUNK_T __x3 = (BNU_CHUNK_T) __aH * __bH;   \
150    \
151    __x1 += HI_CHUNK(__x0);    \
152    __x1 += __x2;              \
153    if(__x1 < __x2)            \
154       __x3 += BNU_CHUNK_2H;   \
155    \
156    (RH) = __x3 + HI_CHUNK(__x1); \
157    (RL) = (__x1 << BNU_CHUNK_BITS/2) + LO_CHUNK(__x0); \
158    } while (0)
159 
160 #endif /* _CP_BNU_IMPL_H */
161