Project Alice
Loading...
Searching...
No Matches
ars.h
Go to the documentation of this file.
1/*
2Copyright 2010-2011, D. E. Shaw Research.
3All rights reserved.
4
5Redistribution and use in source and binary forms, with or without
6modification, are permitted provided that the following conditions are
7met:
8
9* Redistributions of source code must retain the above copyright
10 notice, this list of conditions, and the following disclaimer.
11
12* Redistributions in binary form must reproduce the above copyright
13 notice, this list of conditions, and the following disclaimer in the
14 documentation and/or other materials provided with the distribution.
15
16* Neither the name of D. E. Shaw Research nor the names of its
17 contributors may be used to endorse or promote products derived from
18 this software without specific prior written permission.
19
20THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
21"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
22LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
23A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
24OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
25SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
26LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
27DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
28THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
29(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
30OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
31*/
32#ifndef __Random123_ars_dot_hpp__
33#define __Random123_ars_dot_hpp__
34
36#include "array.h"
37
38#if R123_USE_AES_NI
39
40#ifndef ARS1xm128i_DEFAULT_ROUNDS
41#define ARS1xm128i_DEFAULT_ROUNDS 7
42#endif
43
45enum r123_enum_ars1xm128i { ars1xm128i_rounds = ARS1xm128i_DEFAULT_ROUNDS };
46
47/* ARS1xm128i with Weyl keys. Fast, and Crush-resistant, but NOT CRYPTO. */
49typedef struct r123array1xm128i ars1xm128i_ctr_t;
51typedef struct r123array1xm128i ars1xm128i_key_t;
53typedef struct r123array1xm128i ars1xm128i_ukey_t;
55R123_STATIC_INLINE ars1xm128i_key_t ars1xm128ikeyinit(ars1xm128i_ukey_t uk) { return uk; }
57R123_STATIC_INLINE ars1xm128i_ctr_t ars1xm128i_R(unsigned int Nrounds, ars1xm128i_ctr_t in, ars1xm128i_key_t k) {
58 __m128i kweyl = _mm_set_epi64x(R123_64BIT(0xBB67AE8584CAA73B), /* sqrt(3) - 1.0 */
59 R123_64BIT(0x9E3779B97F4A7C15)); /* golden ratio */
60 /* N.B. the aesenc instructions do the xor *after*
61 // so if we want to follow the AES pattern, we
62 // have to do the initial xor explicitly */
63 __m128i kk = k.v[0].m;
64 __m128i v = _mm_xor_si128(in.v[0].m, kk);
65 ars1xm128i_ctr_t ret;
66 R123_ASSERT(Nrounds <= 10);
67 if(Nrounds > 1) {
68 kk = _mm_add_epi64(kk, kweyl);
69 v = _mm_aesenc_si128(v, kk);
70 }
71 if(Nrounds > 2) {
72 kk = _mm_add_epi64(kk, kweyl);
73 v = _mm_aesenc_si128(v, kk);
74 }
75 if(Nrounds > 3) {
76 kk = _mm_add_epi64(kk, kweyl);
77 v = _mm_aesenc_si128(v, kk);
78 }
79 if(Nrounds > 4) {
80 kk = _mm_add_epi64(kk, kweyl);
81 v = _mm_aesenc_si128(v, kk);
82 }
83 if(Nrounds > 5) {
84 kk = _mm_add_epi64(kk, kweyl);
85 v = _mm_aesenc_si128(v, kk);
86 }
87 if(Nrounds > 6) {
88 kk = _mm_add_epi64(kk, kweyl);
89 v = _mm_aesenc_si128(v, kk);
90 }
91 if(Nrounds > 7) {
92 kk = _mm_add_epi64(kk, kweyl);
93 v = _mm_aesenc_si128(v, kk);
94 }
95 if(Nrounds > 8) {
96 kk = _mm_add_epi64(kk, kweyl);
97 v = _mm_aesenc_si128(v, kk);
98 }
99 if(Nrounds > 9) {
100 kk = _mm_add_epi64(kk, kweyl);
101 v = _mm_aesenc_si128(v, kk);
102 }
103 kk = _mm_add_epi64(kk, kweyl);
104 v = _mm_aesenclast_si128(v, kk);
105 ret.v[0].m = v;
106 return ret;
107}
108
113#define ars1xm128i(c, k) ars1xm128i_R(ars1xm128i_rounds, c, k)
114
116typedef struct r123array4x32 ars4x32_ctr_t;
118typedef struct r123array4x32 ars4x32_key_t;
120typedef struct r123array4x32 ars4x32_ukey_t;
122enum r123_enum_ars4x32 { ars4x32_rounds = ARS1xm128i_DEFAULT_ROUNDS };
124R123_STATIC_INLINE ars4x32_key_t ars4x32keyinit(ars4x32_ukey_t uk) { return uk; }
126R123_STATIC_INLINE ars4x32_ctr_t ars4x32_R(unsigned int Nrounds, ars4x32_ctr_t c, ars4x32_key_t k) {
127 ars1xm128i_ctr_t c128;
128 ars1xm128i_key_t k128;
129 c128.v[0].m = _mm_set_epi32(c.v[3], c.v[2], c.v[1], c.v[0]);
130 k128.v[0].m = _mm_set_epi32(k.v[3], k.v[2], k.v[1], k.v[0]);
131 c128 = ars1xm128i_R(Nrounds, c128, k128);
132 _mm_storeu_si128((__m128i*)&c.v[0], c128.v[0].m);
133 return c;
134}
135
139#define ars4x32(c, k) ars4x32_R(ars4x32_rounds, c, k)
140
141#ifdef __cplusplus
142namespace r123 {
164template<unsigned int ROUNDS> struct ARS1xm128i_R {
165 typedef ars1xm128i_ctr_t ctr_type;
166 typedef ars1xm128i_key_t key_type;
167 typedef ars1xm128i_key_t ukey_type;
168 static unsigned int const rounds = ROUNDS;
169 R123_FORCE_INLINE(ctr_type operator()(ctr_type ctr, key_type key) const) { return ars1xm128i_R(ROUNDS, ctr, key); }
170};
171
176template<unsigned int ROUNDS> struct ARS4x32_R {
177 typedef ars4x32_ctr_t ctr_type;
178 typedef ars4x32_key_t key_type;
179 typedef ars4x32_key_t ukey_type;
180 static unsigned int const rounds = ROUNDS;
181 R123_FORCE_INLINE(ctr_type operator()(ctr_type ctr, key_type key) const) { return ars4x32_R(ROUNDS, ctr, key); }
182};
191typedef ARS1xm128i_R<ars1xm128i_rounds> ARS1xm128i;
192typedef ARS4x32_R<ars4x32_rounds> ARS4x32;
193} // namespace r123
194
195#endif /* __cplusplus */
196
197#endif /* R123_USE_AES_NI */
198
199#endif
#define R123_STATIC_INLINE
#define R123_FORCE_INLINE(decl)
#define R123_ASSERT(x)
Definition: array.h:344