#ifndef _CORECRYPTO_CC_PRIV_H_
#define _CORECRYPTO_CC_PRIV_H_
#include <corecrypto/cc.h>
#include <stdint.h>
/* Aliases for the C library memory routines. Every argument is forwarded
   once, parenthesized. CC_BZERO sets len bytes at dst to zero. */
#define CC_MEMCPY(dst,src,len)  memcpy((dst),(src),(len))
#define CC_MEMMOVE(dst,src,len) memmove((dst),(src),(len))
#define CC_MEMSET(dst,val,len)  memset((dst),(val),(len))
#define CC_BZERO(dst,len)       CC_MEMSET((dst),0,(len))
/* CC_STORE32_LE(x, y): write the low 32 bits of x into the 4 bytes at y,
   least-significant byte first. Bytes are written one at a time through an
   unsigned char pointer.
   Each argument is evaluated exactly once, so arguments with side effects
   (for example a post-incremented pointer) behave as a function call would. */
#define CC_STORE32_LE(x, y) do { \
    const uint32_t cc_st32le_v_ = (uint32_t)(x); \
    unsigned char *const cc_st32le_p_ = (unsigned char *)(y); \
    cc_st32le_p_[3] = (unsigned char)((cc_st32le_v_>>24)&255); \
    cc_st32le_p_[2] = (unsigned char)((cc_st32le_v_>>16)&255); \
    cc_st32le_p_[1] = (unsigned char)((cc_st32le_v_>>8)&255); \
    cc_st32le_p_[0] = (unsigned char)(cc_st32le_v_&255); \
} while(0)
/* CC_LOAD32_LE(x, y): read 4 bytes at y, least-significant byte first, and
   assign the resulting 32-bit value to the lvalue x. Bytes are read one at a
   time through an unsigned char pointer.
   The pointer argument y is evaluated exactly once. */
#define CC_LOAD32_LE(x, y) do { \
    const unsigned char *const cc_ld32le_p_ = (const unsigned char *)(y); \
    (x) = ((uint32_t)(cc_ld32le_p_[3] & 255)<<24) | \
          ((uint32_t)(cc_ld32le_p_[2] & 255)<<16) | \
          ((uint32_t)(cc_ld32le_p_[1] & 255)<<8) | \
          ((uint32_t)(cc_ld32le_p_[0] & 255)); \
} while(0)
/* CC_STORE64_LE(x, y): write x, converted to a 64-bit unsigned value, into
   the 8 bytes at y, least-significant byte first. Bytes are written one at a
   time through an unsigned char pointer.
   Each argument is evaluated exactly once. Converting x to uint64_t up front
   also keeps the shifts by 32..56 well defined when x has a narrower type. */
#define CC_STORE64_LE(x, y) do { \
    const uint64_t cc_st64le_v_ = (uint64_t)(x); \
    unsigned char *const cc_st64le_p_ = (unsigned char *)(y); \
    cc_st64le_p_[7] = (unsigned char)((cc_st64le_v_>>56)&255); \
    cc_st64le_p_[6] = (unsigned char)((cc_st64le_v_>>48)&255); \
    cc_st64le_p_[5] = (unsigned char)((cc_st64le_v_>>40)&255); \
    cc_st64le_p_[4] = (unsigned char)((cc_st64le_v_>>32)&255); \
    cc_st64le_p_[3] = (unsigned char)((cc_st64le_v_>>24)&255); \
    cc_st64le_p_[2] = (unsigned char)((cc_st64le_v_>>16)&255); \
    cc_st64le_p_[1] = (unsigned char)((cc_st64le_v_>>8)&255); \
    cc_st64le_p_[0] = (unsigned char)(cc_st64le_v_&255); \
} while(0)
/* CC_LOAD64_LE(x, y): read 8 bytes at y, least-significant byte first, and
   assign the resulting 64-bit value to the lvalue x. Bytes are read one at a
   time through an unsigned char pointer.
   The pointer argument y is evaluated exactly once. */
#define CC_LOAD64_LE(x, y) do { \
    const unsigned char *const cc_ld64le_p_ = (const unsigned char *)(y); \
    (x) = (((uint64_t)(cc_ld64le_p_[7] & 255))<<56) | \
          (((uint64_t)(cc_ld64le_p_[6] & 255))<<48) | \
          (((uint64_t)(cc_ld64le_p_[5] & 255))<<40) | \
          (((uint64_t)(cc_ld64le_p_[4] & 255))<<32) | \
          (((uint64_t)(cc_ld64le_p_[3] & 255))<<24) | \
          (((uint64_t)(cc_ld64le_p_[2] & 255))<<16) | \
          (((uint64_t)(cc_ld64le_p_[1] & 255))<<8) | \
          (((uint64_t)(cc_ld64le_p_[0] & 255))); \
} while(0)
/* CC_STORE32_BE(x, y): write the low 32 bits of x to the 4 bytes at y,
   most-significant byte first.
   CC_LOAD32_BE(x, y): read 4 bytes at y, most-significant byte first, and
   assign the value to the lvalue x.
   In both variants below each argument is evaluated exactly once. */
#if (defined(__i386__) || defined(__x86_64__))
/* x86: swap the bytes in a register with bswapl and move the whole word.
   The store swaps the register back afterwards so the input operand holds
   its original value again when the asm ends.
   The asm accesses memory through a pointer held in a register, which the
   compiler cannot see from the operand list; the "memory" clobber keeps it
   from caching or reordering surrounding loads and stores across the asm.
   The stored value is converted to uint32_t so a 32-bit register is used
   whatever the type of x. For the load, x must be a 32-bit lvalue. */
#define CC_STORE32_BE(x, y) \
    __asm__ __volatile__ ( \
    "bswapl %0 \n\t" \
    "movl %0,(%1)\n\t" \
    "bswapl %0 \n\t" \
    ::"r"((uint32_t)(x)), "r"(y):"memory")
#define CC_LOAD32_BE(x, y) \
    __asm__ __volatile__ ( \
    "movl (%1),%0\n\t" \
    "bswapl %0\n\t" \
    :"=r"(x): "r"(y):"memory")
#else
/* Portable variant: one byte at a time through an unsigned char pointer. */
#define CC_STORE32_BE(x, y) do { \
    const uint32_t cc_st32be_v_ = (uint32_t)(x); \
    unsigned char *const cc_st32be_p_ = (unsigned char *)(y); \
    cc_st32be_p_[0] = (unsigned char)((cc_st32be_v_>>24)&255); \
    cc_st32be_p_[1] = (unsigned char)((cc_st32be_v_>>16)&255); \
    cc_st32be_p_[2] = (unsigned char)((cc_st32be_v_>>8)&255); \
    cc_st32be_p_[3] = (unsigned char)(cc_st32be_v_&255); \
} while(0)
#define CC_LOAD32_BE(x, y) do { \
    const unsigned char *const cc_ld32be_p_ = (const unsigned char *)(y); \
    (x) = ((uint32_t)(cc_ld32be_p_[0] & 255)<<24) | \
          ((uint32_t)(cc_ld32be_p_[1] & 255)<<16) | \
          ((uint32_t)(cc_ld32be_p_[2] & 255)<<8) | \
          ((uint32_t)(cc_ld32be_p_[3] & 255)); \
} while(0)
#endif
/* CC_STORE64_BE(x, y): write x, as a 64-bit unsigned value, to the 8 bytes
   at y, most-significant byte first.
   CC_LOAD64_BE(x, y): read 8 bytes at y, most-significant byte first, and
   assign the value to the lvalue x.
   In both variants below each argument is evaluated exactly once. */
#if defined(__x86_64__)
/* x86-64: swap the bytes in a register with bswapq and move the whole
   quadword. The store swaps the register back afterwards so the input
   operand holds its original value again when the asm ends.
   The asm accesses memory through a pointer held in a register, which the
   compiler cannot see from the operand list; the "memory" clobber keeps it
   from caching or reordering surrounding loads and stores across the asm.
   The stored value is converted to uint64_t so a 64-bit register is used
   whatever the type of x. For the load, x must be a 64-bit lvalue. */
#define CC_STORE64_BE(x, y) \
    __asm__ __volatile__ ( \
    "bswapq %0 \n\t" \
    "movq %0,(%1)\n\t" \
    "bswapq %0 \n\t" \
    ::"r"((uint64_t)(x)), "r"(y):"memory")
#define CC_LOAD64_BE(x, y) \
    __asm__ __volatile__ ( \
    "movq (%1),%0\n\t" \
    "bswapq %0\n\t" \
    :"=r"(x): "r"(y):"memory")
#else
/* Portable variant: one byte at a time through an unsigned char pointer.
   Converting x to uint64_t first keeps the shifts by 32..56 well defined
   when x has a narrower type. */
#define CC_STORE64_BE(x, y) do { \
    const uint64_t cc_st64be_v_ = (uint64_t)(x); \
    unsigned char *const cc_st64be_p_ = (unsigned char *)(y); \
    cc_st64be_p_[0] = (unsigned char)((cc_st64be_v_>>56)&255); \
    cc_st64be_p_[1] = (unsigned char)((cc_st64be_v_>>48)&255); \
    cc_st64be_p_[2] = (unsigned char)((cc_st64be_v_>>40)&255); \
    cc_st64be_p_[3] = (unsigned char)((cc_st64be_v_>>32)&255); \
    cc_st64be_p_[4] = (unsigned char)((cc_st64be_v_>>24)&255); \
    cc_st64be_p_[5] = (unsigned char)((cc_st64be_v_>>16)&255); \
    cc_st64be_p_[6] = (unsigned char)((cc_st64be_v_>>8)&255); \
    cc_st64be_p_[7] = (unsigned char)(cc_st64be_v_&255); \
} while(0)
#define CC_LOAD64_BE(x, y) do { \
    const unsigned char *const cc_ld64be_p_ = (const unsigned char *)(y); \
    (x) = (((uint64_t)(cc_ld64be_p_[0] & 255))<<56) | \
          (((uint64_t)(cc_ld64be_p_[1] & 255))<<48) | \
          (((uint64_t)(cc_ld64be_p_[2] & 255))<<40) | \
          (((uint64_t)(cc_ld64be_p_[3] & 255))<<32) | \
          (((uint64_t)(cc_ld64be_p_[4] & 255))<<24) | \
          (((uint64_t)(cc_ld64be_p_[5] & 255))<<16) | \
          (((uint64_t)(cc_ld64be_p_[6] & 255))<<8) | \
          (((uint64_t)(cc_ld64be_p_[7] & 255))); \
} while(0)
#endif
/* 32-bit rotates.
   CC_ROL / CC_ROR rotate left / right by a run-time count.
   CC_ROLc / CC_RORc are the variants for a compile-time constant count. */
#if defined(_MSC_VER)
/* MSVC: map all four onto the compiler's rotate intrinsics. */
#include <stdlib.h>
#pragma intrinsic(_lrotr,_lrotl)
#define CC_ROR(x,n) _lrotr(x,n)
#define CC_ROL(x,n) _lrotl(x,n)
#define CC_RORc(x,n) _lrotr(x,n)
#define CC_ROLc(x,n) _lrotl(x,n)
#elif (defined(__i386__) || defined(__x86_64__))
/* x86: use the rotate instructions directly; the run-time count is passed
   in CL (the "c" constraint). */
static inline uint32_t CC_ROL(uint32_t word, int i)
{
    __asm__ ("roll %%cl,%0"
        :"=r" (word)
        :"0" (word),"c" (i));
    return word;
}
static inline uint32_t CC_ROR(uint32_t word, int i)
{
    __asm__ ("rorl %%cl,%0"
        :"=r" (word)
        :"0" (word),"c" (i));
    return word;
}
/* Constant-count forms: the "I" constraint requires i to be an integer
   constant in the range 0..31, encoded as an immediate operand. */
#define CC_ROLc(word, i) \
({ uint32_t _word=(word); \
__asm__ __volatile__ ("roll %2,%0" \
:"=r" (_word) \
:"0" (_word),"I" (i)); \
_word; \
})
#define CC_RORc(word, i) \
({ uint32_t _word=(word); \
__asm__ __volatile__ ("rorl %2,%0" \
:"=r" (_word) \
:"0" (_word),"I" (i)); \
_word; \
})
#else
/* Portable C. The count is reduced modulo 32. The complementary shift is
   masked as well: without the mask a count that is a multiple of 32 would
   shift a 32-bit value by 32, which is undefined behavior in C. With it,
   such a count returns word unchanged. */
static inline uint32_t CC_ROL(uint32_t word, int i)
{
    const unsigned int left = (unsigned int)i & 31u;
    const unsigned int right = (32u - left) & 31u;
    return ( (word<<left) | (word>>right) );
}
static inline uint32_t CC_ROR(uint32_t word, int i)
{
    const unsigned int right = (unsigned int)i & 31u;
    const unsigned int left = (32u - right) & 31u;
    return ( (word>>right) | (word<<left) );
}
#define CC_ROLc(x, y) CC_ROL(x, y)
#define CC_RORc(x, y) CC_ROR(x, y)
#endif
/* 64-bit rotates.
   CC_ROL64 / CC_ROR64 rotate left / right by a run-time count.
   CC_ROL64c / CC_ROR64c are the variants for a compile-time constant count. */
#if defined(__x86_64__)
/* x86-64: use the rotate instructions directly; the run-time count is
   passed in CL (the "c" constraint). */
static inline uint64_t CC_ROL64(uint64_t word, int i)
{
    __asm__("rolq %%cl,%0"
        :"=r" (word)
        :"0" (word),"c" (i));
    return word;
}
static inline uint64_t CC_ROR64(uint64_t word, int i)
{
    __asm__("rorq %%cl,%0"
        :"=r" (word)
        :"0" (word),"c" (i));
    return word;
}
/* Constant-count forms: the "J" constraint requires i to be an integer
   constant in the range 0..63, encoded as an immediate operand. */
#define CC_ROL64c(word, i) \
({ \
uint64_t _word=(word); \
__asm__("rolq %2,%0" \
:"=r" (_word) \
:"0" (_word),"J" (i)); \
_word; \
})
#define CC_ROR64c(word, i) \
({ \
uint64_t _word=(word); \
__asm__("rorq %2,%0" \
:"=r" (_word) \
:"0" (_word),"J" (i)); \
_word; \
})
#else
/* Portable C. The count is reduced modulo 64. The complementary shift is
   masked as well: without the mask a count that is a multiple of 64 would
   shift a 64-bit value by 64, which is undefined behavior in C. With it,
   such a count returns word unchanged. */
static inline uint64_t CC_ROL64(uint64_t word, int i)
{
    const unsigned int left = (unsigned int)i & 63u;
    const unsigned int right = (64u - left) & 63u;
    return ( (word<<left) | (word>>right) );
}
static inline uint64_t CC_ROR64(uint64_t word, int i)
{
    const unsigned int right = (unsigned int)i & 63u;
    const unsigned int left = (64u - right) & 63u;
    return ( (word>>right) | (word<<left) );
}
#define CC_ROL64c(x, y) CC_ROL64(x, y)
#define CC_ROR64c(x, y) CC_ROR64(x, y)
#endif
/* Reverse the order of the four bytes of x and return the result. */
static inline uint32_t CC_BSWAP(uint32_t x)
{
    uint32_t swapped;

    swapped  = (x & 0x000000FFu) << 24;  /* byte 0 -> byte 3 */
    swapped |= (x & 0x0000FF00u) << 8;   /* byte 1 -> byte 2 */
    swapped |= (x & 0x00FF0000u) >> 8;   /* byte 2 -> byte 1 */
    swapped |= (x & 0xFF000000u) >> 24;  /* byte 3 -> byte 0 */
    return swapped;
}
/* CC_BSWAP64(x): x converted to uint64_t with its eight bytes in reverse
   order. Pure expression macro; the argument is expanded once per byte, so
   pass an expression without side effects. */
#define CC_BSWAP64(x) \
    ((uint64_t)((((uint64_t)(x) >> 56) & 0x00000000000000ffULL) | \
                (((uint64_t)(x) >> 40) & 0x000000000000ff00ULL) | \
                (((uint64_t)(x) >> 24) & 0x0000000000ff0000ULL) | \
                (((uint64_t)(x) >>  8) & 0x00000000ff000000ULL) | \
                (((uint64_t)(x) <<  8) & 0x000000ff00000000ULL) | \
                (((uint64_t)(x) << 24) & 0x0000ff0000000000ULL) | \
                (((uint64_t)(x) << 40) & 0x00ff000000000000ULL) | \
                (((uint64_t)(x) << 56) & 0xff00000000000000ULL)))
/* CC_H2BE32(x) / CC_H2LE32(x): convert a 32-bit value from host byte order
   to big-endian / little-endian order. On a little-endian host the
   big-endian form is the byte-swapped value (via CC_BSWAP) and the
   little-endian form is x itself; on a big-endian host it is the reverse.

   __LITTLE_ENDIAN__ alone is not predefined by every compiler (for example
   GCC on Linux/x86 and MSVC do not provide it), which would silently select
   the big-endian definitions on a little-endian machine. The host is
   therefore also recognized as little-endian through the GCC/Clang
   __BYTE_ORDER__ macro and through the MSVC target-architecture macros. */
#if defined(__LITTLE_ENDIAN__) || \
    (defined(__BYTE_ORDER__) && defined(__ORDER_LITTLE_ENDIAN__) && \
     (__BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__)) || \
    defined(_M_IX86) || defined(_M_X64) || defined(_M_ARM) || defined(_M_ARM64)
#define CC_H2BE32(x) CC_BSWAP(x)
#define CC_H2LE32(x) (x)
#else
#define CC_H2BE32(x) (x)
#define CC_H2LE32(x) CC_BSWAP(x)
#endif
/* cc_byte(x, n): byte number n of x, where byte 0 is the least significant.
   The general form masks the shifted value with 0xFF; the MSVC form
   truncates it with a cast to unsigned char instead. */
#if !defined(_MSC_VER)
#define cc_byte(x, n) (((x) >> ((n) * 8)) & 0xFF)
#else
#define cc_byte(x, n) ((unsigned char)((x) >> ((n) * 8)))
#endif
/* HEAVISIDE_STEP_UINT64(x): replace the lvalue x with 0 if it is zero and
   with 1 otherwise. The high and low 32-bit halves are OR-ed together and
   the result is folded down with shifts and ORs until bit 0 holds the OR of
   every bit of x; no comparison or branch is used.
   The scratch variable has a macro-specific name so that the macro also
   works when the caller's variable is called `t`, and x is parenthesized in
   the expansion.
   Expands to a brace-enclosed block rather than a do/while(0), so do not
   use it as the unbraced body of an `if` that has an `else`. */
#define HEAVISIDE_STEP_UINT64(x) {unsigned long cc_hs64_t_; \
    cc_hs64_t_=(unsigned long)(((uint64_t)(x)>>32) | (unsigned long)(x)); \
    cc_hs64_t_=((cc_hs64_t_>>16) | cc_hs64_t_); \
    cc_hs64_t_=((cc_hs64_t_>>8) | cc_hs64_t_); \
    cc_hs64_t_=((cc_hs64_t_>>4) | cc_hs64_t_); \
    cc_hs64_t_=((cc_hs64_t_>>2) | cc_hs64_t_); \
    cc_hs64_t_=((cc_hs64_t_>>1) | cc_hs64_t_); \
    (x)=cc_hs64_t_ & 0x1;}
/* HEAVISIDE_STEP_UINT32(x): replace the lvalue x with 0 if it is zero and
   with 1 otherwise. The high and low 16-bit halves are OR-ed together and
   the result is folded down with shifts and ORs until bit 0 holds the OR of
   every bit of x; no comparison or branch is used.
   The scratch variable has a macro-specific name so that the macro also
   works when the caller's variable is called `t`, and x is parenthesized in
   the expansion.
   Expands to a brace-enclosed block rather than a do/while(0), so do not
   use it as the unbraced body of an `if` that has an `else`. */
#define HEAVISIDE_STEP_UINT32(x) {uint16_t cc_hs32_t_; \
    cc_hs32_t_=(uint16_t)(((unsigned long)(x)>>16) | (uint16_t)(x)); \
    cc_hs32_t_=(uint16_t)((cc_hs32_t_>>8) | cc_hs32_t_); \
    cc_hs32_t_=(uint16_t)((cc_hs32_t_>>4) | cc_hs32_t_); \
    cc_hs32_t_=(uint16_t)((cc_hs32_t_>>2) | cc_hs32_t_); \
    cc_hs32_t_=(uint16_t)((cc_hs32_t_>>1) | cc_hs32_t_); \
    (x)=cc_hs32_t_ & 0x1;}
/* HEAVISIDE_STEP_UINT16(x): replace the lvalue x with 0 if it is zero and
   with 1 otherwise. The high and low bytes are OR-ed together and the
   result is folded down with shifts and ORs until bit 0 holds the OR of
   every bit of x; no comparison or branch is used.
   The scratch variable has a macro-specific name so that the macro also
   works when the caller's variable is called `t`, and x is parenthesized in
   the expansion.
   Expands to a brace-enclosed block rather than a do/while(0), so do not
   use it as the unbraced body of an `if` that has an `else`. */
#define HEAVISIDE_STEP_UINT16(x) {uint8_t cc_hs16_t_; \
    cc_hs16_t_=(uint8_t)(((uint16_t)(x)>>8) | (uint8_t)(x)); \
    cc_hs16_t_=(uint8_t)((cc_hs16_t_>>4) | cc_hs16_t_); \
    cc_hs16_t_=(uint8_t)((cc_hs16_t_>>2) | cc_hs16_t_); \
    cc_hs16_t_=(uint8_t)((cc_hs16_t_>>1) | cc_hs16_t_); \
    (x)=cc_hs16_t_ & 0x1;}
/* HEAVISIDE_STEP_UINT8(x): replace the lvalue x with 0 if it is zero and
   with 1 otherwise. The high and low nibbles are OR-ed together and the
   result is folded down with shifts and ORs until bit 0 holds the OR of
   every bit of x; no comparison or branch is used.
   The scratch variable has a macro-specific name so that the macro also
   works when the caller's variable is called `t`, and x is parenthesized in
   the expansion.
   Expands to a brace-enclosed block rather than a do/while(0), so do not
   use it as the unbraced body of an `if` that has an `else`. */
#define HEAVISIDE_STEP_UINT8(x) {uint8_t cc_hs8_t_; \
    cc_hs8_t_=(uint8_t)(((uint8_t)(x)>>4) | (uint8_t)(x)); \
    cc_hs8_t_=(uint8_t)((cc_hs8_t_>>2) | cc_hs8_t_); \
    cc_hs8_t_=(uint8_t)((cc_hs8_t_>>1) | cc_hs8_t_); \
    (x)=cc_hs8_t_ & 0x1;}
/* CC_HEAVISIDE_STEP(x): replace the lvalue x with 0 if it is zero and with
   1 otherwise. Dispatches on sizeof(x) to the HEAVISIDE_STEP_UINT8/16/32/64
   helper of matching width; for any other size it falls back to a plain
   comparison against zero. Expands to a brace-enclosed block. */
#define CC_HEAVISIDE_STEP(x) { \
    switch (sizeof(x)) { \
    case 1: {HEAVISIDE_STEP_UINT8(x);} break; \
    case 2: {HEAVISIDE_STEP_UINT16(x);} break; \
    case 4: {HEAVISIDE_STEP_UINT32(x);} break; \
    case 8: {HEAVISIDE_STEP_UINT64(x);} break; \
    default: {x=((x==0)?0:1);} break; \
    } \
}
/* MAX_POWER_OF_2(x): the constant 1, cast to the type of x, shifted left by
   one less than the number of bits in x (taking 8 bits per byte), i.e. only
   the top bit of that width set. Only the type of x is used, not its value.
   NOTE(review): presumably meant for unsigned types; for a signed type of
   int width or wider the shift would move a 1 into the sign bit. */
#define MAX_POWER_OF_2(x) ((__typeof__(x))1 << (sizeof(x) * 8 - 1))
#endif