X-Git-Url: http://wagner.pp.ru/gitweb/?a=blobdiff_plain;f=gosthash2012.c;h=6399a9edd2d5dca686c78434de4ecabe0dc9ef33;hb=c0eadfee19963e68a96f8a7720d39d262a34005d;hp=ddd35fad45c7cf32faefc58d933f88378e098a13;hpb=31138d02d9c3698c039154b3078c16f205e25902;p=openssl-gost%2Fengine.git diff --git a/gosthash2012.c b/gosthash2012.c index ddd35fa..6399a9e 100644 --- a/gosthash2012.c +++ b/gosthash2012.c @@ -9,6 +9,10 @@ */ #include "gosthash2012.h" +#ifdef __x86_64__ +# include <immintrin.h> +# include <x86intrin.h> +#endif #if defined(_WIN32) || defined(_WINDOWS) # define INLINE __inline @@ -57,10 +61,13 @@ static INLINE void add512(union uint512_u * RESTRICT x, const union uint512_u * RESTRICT y) { #ifndef __GOST3411_BIG_ENDIAN__ - unsigned int CF; + unsigned int CF = 0; unsigned int i; - CF = 0; +# ifdef __x86_64__ + for (i = 0; i < 8; i++) + CF = _addcarry_u64(CF, x->QWORD[i] , y->QWORD[i], &(x->QWORD[i])); +# else for (i = 0; i < 8; i++) { const unsigned long long left = x->QWORD[i]; unsigned long long sum; @@ -82,7 +89,8 @@ static INLINE void add512(union uint512_u * RESTRICT x, CF = (sum < left); x->QWORD[i] = sum; } -#else +# endif /* !__x86_64__ */ +#else /* __GOST3411_BIG_ENDIAN__ */ const unsigned char *yp; unsigned char *xp; unsigned int i; @@ -96,7 +104,7 @@ static INLINE void add512(union uint512_u * RESTRICT x, buf = xp[i] + yp[i] + (buf >> 8); xp[i] = (unsigned char)buf & 0xFF; } -#endif +#endif /* __GOST3411_BIG_ENDIAN__ */ } static void g(union uint512_u *h, const union uint512_u * RESTRICT N, @@ -110,7 +118,7 @@ static void g(union uint512_u *h, const union uint512_u * RESTRICT N, LOAD(N, xmm0, xmm2, xmm4, xmm6); XLPS128M(h, xmm0, xmm2, xmm4, xmm6); - LOAD(m, xmm1, xmm3, xmm5, xmm7); + ULOAD(m, xmm1, xmm3, xmm5, xmm7); XLPS128R(xmm0, xmm2, xmm4, xmm6, xmm1, xmm3, xmm5, xmm7); for (i = 0; i < 11; i++) @@ -120,12 +128,10 @@ static void g(union uint512_u *h, const union uint512_u * RESTRICT N, X128R(xmm0, xmm2, xmm4, xmm6, xmm1, xmm3, xmm5, xmm7); X128M(h, xmm0, xmm2, xmm4, xmm6); - 
X128M(m, xmm0, xmm2, xmm4, xmm6); - - UNLOAD(h, xmm0, xmm2, xmm4, xmm6); + ULOAD(m, xmm1, xmm3, xmm5, xmm7); + X128R(xmm0, xmm2, xmm4, xmm6, xmm1, xmm3, xmm5, xmm7); - /* Restore the Floating-point status on the CPU */ - _mm_empty(); + STORE(h, xmm0, xmm2, xmm4, xmm6); #else union uint512_u Ki, data; unsigned int i;