/root/bitcoin/src/crypto/poly1305.cpp
| Line | Count | Source | 
| 1 |  | // Copyright (c) 2019-present The Bitcoin Core developers | 
| 2 |  | // Distributed under the MIT software license, see the accompanying | 
| 3 |  | // file COPYING or http://www.opensource.org/licenses/mit-license.php. | 
| 4 |  |  | 
| 5 |  | #include <crypto/common.h> | 
| 6 |  | #include <crypto/poly1305.h> | 
| 7 |  |  | 
| 8 |  | #include <cstring> | 
| 9 |  |  | 
| 10 |  | namespace poly1305_donna { | 
| 11 |  |  | 
| 12 |  | // Based on the public domain implementation by Andrew Moon | 
| 13 |  | // poly1305-donna-32.h from https://github.com/floodyberry/poly1305-donna | 
| 14 |  |  | 
| 15 | 0 | void poly1305_init(poly1305_context *st, const unsigned char key[32]) noexcept { | 
| 16 |  |     /* r &= 0xffffffc0ffffffc0ffffffc0fffffff */ | 
| 17 | 0 |     st->r[0] = (ReadLE32(&key[ 0])     ) & 0x3ffffff; | 
| 18 | 0 |     st->r[1] = (ReadLE32(&key[ 3]) >> 2) & 0x3ffff03; | 
| 19 | 0 |     st->r[2] = (ReadLE32(&key[ 6]) >> 4) & 0x3ffc0ff; | 
| 20 | 0 |     st->r[3] = (ReadLE32(&key[ 9]) >> 6) & 0x3f03fff; | 
| 21 | 0 |     st->r[4] = (ReadLE32(&key[12]) >> 8) & 0x00fffff; | 
| 22 |  |  | 
| 23 |  |     /* h = 0 */ | 
| 24 | 0 |     st->h[0] = 0; | 
| 25 | 0 |     st->h[1] = 0; | 
| 26 | 0 |     st->h[2] = 0; | 
| 27 | 0 |     st->h[3] = 0; | 
| 28 | 0 |     st->h[4] = 0; | 
| 29 |  |  | 
| 30 |  |     /* save pad for later */ | 
| 31 | 0 |     st->pad[0] = ReadLE32(&key[16]); | 
| 32 | 0 |     st->pad[1] = ReadLE32(&key[20]); | 
| 33 | 0 |     st->pad[2] = ReadLE32(&key[24]); | 
| 34 | 0 |     st->pad[3] = ReadLE32(&key[28]); | 
| 35 |  | 
 | 
| 36 | 0 |     st->leftover = 0; | 
| 37 | 0 |     st->final = 0; | 
| 38 | 0 | } | 
| 39 |  |  | 
| 40 | 0 | static void poly1305_blocks(poly1305_context *st, const unsigned char *m, size_t bytes) noexcept { | 
| 41 | 0 |     const uint32_t hibit = (st->final) ? 0 : (1UL << 24); /* 1 << 128 */ | 
| 42 | 0 |     uint32_t r0,r1,r2,r3,r4; | 
| 43 | 0 |     uint32_t s1,s2,s3,s4; | 
| 44 | 0 |     uint32_t h0,h1,h2,h3,h4; | 
| 45 | 0 |     uint64_t d0,d1,d2,d3,d4; | 
| 46 | 0 |     uint32_t c; | 
| 47 |  | 
 | 
| 48 | 0 |     r0 = st->r[0]; | 
| 49 | 0 |     r1 = st->r[1]; | 
| 50 | 0 |     r2 = st->r[2]; | 
| 51 | 0 |     r3 = st->r[3]; | 
| 52 | 0 |     r4 = st->r[4]; | 
| 53 |  | 
 | 
| 54 | 0 |     s1 = r1 * 5; | 
| 55 | 0 |     s2 = r2 * 5; | 
| 56 | 0 |     s3 = r3 * 5; | 
| 57 | 0 |     s4 = r4 * 5; | 
| 58 |  | 
 | 
| 59 | 0 |     h0 = st->h[0]; | 
| 60 | 0 |     h1 = st->h[1]; | 
| 61 | 0 |     h2 = st->h[2]; | 
| 62 | 0 |     h3 = st->h[3]; | 
| 63 | 0 |     h4 = st->h[4]; | 
| 64 |  | 
 | 
| 65 | 0 |     while (bytes >= POLY1305_BLOCK_SIZE) { | 
| 66 |  |         /* h += m[i] */ | 
| 67 | 0 |         h0 += (ReadLE32(m+ 0)     ) & 0x3ffffff; | 
| 68 | 0 |         h1 += (ReadLE32(m+ 3) >> 2) & 0x3ffffff; | 
| 69 | 0 |         h2 += (ReadLE32(m+ 6) >> 4) & 0x3ffffff; | 
| 70 | 0 |         h3 += (ReadLE32(m+ 9) >> 6) & 0x3ffffff; | 
| 71 | 0 |         h4 += (ReadLE32(m+12) >> 8) | hibit; | 
| 72 |  |  | 
| 73 |  |         /* h *= r */ | 
| 74 | 0 |         d0 = ((uint64_t)h0 * r0) + ((uint64_t)h1 * s4) + ((uint64_t)h2 * s3) + ((uint64_t)h3 * s2) + ((uint64_t)h4 * s1); | 
| 75 | 0 |         d1 = ((uint64_t)h0 * r1) + ((uint64_t)h1 * r0) + ((uint64_t)h2 * s4) + ((uint64_t)h3 * s3) + ((uint64_t)h4 * s2); | 
| 76 | 0 |         d2 = ((uint64_t)h0 * r2) + ((uint64_t)h1 * r1) + ((uint64_t)h2 * r0) + ((uint64_t)h3 * s4) + ((uint64_t)h4 * s3); | 
| 77 | 0 |         d3 = ((uint64_t)h0 * r3) + ((uint64_t)h1 * r2) + ((uint64_t)h2 * r1) + ((uint64_t)h3 * r0) + ((uint64_t)h4 * s4); | 
| 78 | 0 |         d4 = ((uint64_t)h0 * r4) + ((uint64_t)h1 * r3) + ((uint64_t)h2 * r2) + ((uint64_t)h3 * r1) + ((uint64_t)h4 * r0); | 
| 79 |  |  | 
| 80 |  |         /* (partial) h %= p */ | 
| 81 | 0 |                       c = (uint32_t)(d0 >> 26); h0 = (uint32_t)d0 & 0x3ffffff; | 
| 82 | 0 |         d1 += c;      c = (uint32_t)(d1 >> 26); h1 = (uint32_t)d1 & 0x3ffffff; | 
| 83 | 0 |         d2 += c;      c = (uint32_t)(d2 >> 26); h2 = (uint32_t)d2 & 0x3ffffff; | 
| 84 | 0 |         d3 += c;      c = (uint32_t)(d3 >> 26); h3 = (uint32_t)d3 & 0x3ffffff; | 
| 85 | 0 |         d4 += c;      c = (uint32_t)(d4 >> 26); h4 = (uint32_t)d4 & 0x3ffffff; | 
| 86 | 0 |         h0 += c * 5;  c =           (h0 >> 26); h0 =           h0 & 0x3ffffff; | 
| 87 | 0 |         h1 += c; | 
| 88 |  | 
 | 
| 89 | 0 |         m += POLY1305_BLOCK_SIZE; | 
| 90 | 0 |         bytes -= POLY1305_BLOCK_SIZE; | 
| 91 | 0 |     } | 
| 92 |  | 
 | 
| 93 | 0 |     st->h[0] = h0; | 
| 94 | 0 |     st->h[1] = h1; | 
| 95 | 0 |     st->h[2] = h2; | 
| 96 | 0 |     st->h[3] = h3; | 
| 97 | 0 |     st->h[4] = h4; | 
| 98 | 0 | } | 
| 99 |  |  | 
| 100 | 0 | void poly1305_finish(poly1305_context *st, unsigned char mac[16]) noexcept { | 
| 101 | 0 |     uint32_t h0,h1,h2,h3,h4,c; | 
| 102 | 0 |     uint32_t g0,g1,g2,g3,g4; | 
| 103 | 0 |     uint64_t f; | 
| 104 | 0 |     uint32_t mask; | 
| 105 |  |  | 
| 106 |  |     /* process the remaining block */ | 
| 107 | 0 |     if (st->leftover) { | 
| 108 | 0 |         size_t i = st->leftover; | 
| 109 | 0 |         st->buffer[i++] = 1; | 
| 110 | 0 |         for (; i < POLY1305_BLOCK_SIZE; i++) { | 
| 111 | 0 |             st->buffer[i] = 0; | 
| 112 | 0 |         } | 
| 113 | 0 |         st->final = 1; | 
| 114 | 0 |         poly1305_blocks(st, st->buffer, POLY1305_BLOCK_SIZE); | 
| 115 | 0 |     } | 
| 116 |  |  | 
| 117 |  |     /* fully carry h */ | 
| 118 | 0 |     h0 = st->h[0]; | 
| 119 | 0 |     h1 = st->h[1]; | 
| 120 | 0 |     h2 = st->h[2]; | 
| 121 | 0 |     h3 = st->h[3]; | 
| 122 | 0 |     h4 = st->h[4]; | 
| 123 |  | 
 | 
| 124 | 0 |                  c = h1 >> 26; h1 = h1 & 0x3ffffff; | 
| 125 | 0 |     h2 +=     c; c = h2 >> 26; h2 = h2 & 0x3ffffff; | 
| 126 | 0 |     h3 +=     c; c = h3 >> 26; h3 = h3 & 0x3ffffff; | 
| 127 | 0 |     h4 +=     c; c = h4 >> 26; h4 = h4 & 0x3ffffff; | 
| 128 | 0 |     h0 += c * 5; c = h0 >> 26; h0 = h0 & 0x3ffffff; | 
| 129 | 0 |     h1 +=     c; | 
| 130 |  |  | 
| 131 |  |     /* compute h + -p */ | 
| 132 | 0 |     g0 = h0 + 5; c = g0 >> 26; g0 &= 0x3ffffff; | 
| 133 | 0 |     g1 = h1 + c; c = g1 >> 26; g1 &= 0x3ffffff; | 
| 134 | 0 |     g2 = h2 + c; c = g2 >> 26; g2 &= 0x3ffffff; | 
| 135 | 0 |     g3 = h3 + c; c = g3 >> 26; g3 &= 0x3ffffff; | 
| 136 | 0 |     g4 = h4 + c - (1UL << 26); | 
| 137 |  |  | 
| 138 |  |     /* select h if h < p, or h + -p if h >= p */ | 
| 139 | 0 |     mask = (g4 >> ((sizeof(uint32_t) * 8) - 1)) - 1; | 
| 140 | 0 |     g0 &= mask; | 
| 141 | 0 |     g1 &= mask; | 
| 142 | 0 |     g2 &= mask; | 
| 143 | 0 |     g3 &= mask; | 
| 144 | 0 |     g4 &= mask; | 
| 145 | 0 |     mask = ~mask; | 
| 146 | 0 |     h0 = (h0 & mask) | g0; | 
| 147 | 0 |     h1 = (h1 & mask) | g1; | 
| 148 | 0 |     h2 = (h2 & mask) | g2; | 
| 149 | 0 |     h3 = (h3 & mask) | g3; | 
| 150 | 0 |     h4 = (h4 & mask) | g4; | 
| 151 |  |  | 
| 152 |  |     /* h = h % (2^128) */ | 
| 153 | 0 |     h0 = ((h0      ) | (h1 << 26)) & 0xffffffff; | 
| 154 | 0 |     h1 = ((h1 >>  6) | (h2 << 20)) & 0xffffffff; | 
| 155 | 0 |     h2 = ((h2 >> 12) | (h3 << 14)) & 0xffffffff; | 
| 156 | 0 |     h3 = ((h3 >> 18) | (h4 <<  8)) & 0xffffffff; | 
| 157 |  |  | 
| 158 |  |     /* mac = (h + pad) % (2^128) */ | 
| 159 | 0 |     f = (uint64_t)h0 + st->pad[0]            ; h0 = (uint32_t)f; | 
| 160 | 0 |     f = (uint64_t)h1 + st->pad[1] + (f >> 32); h1 = (uint32_t)f; | 
| 161 | 0 |     f = (uint64_t)h2 + st->pad[2] + (f >> 32); h2 = (uint32_t)f; | 
| 162 | 0 |     f = (uint64_t)h3 + st->pad[3] + (f >> 32); h3 = (uint32_t)f; | 
| 163 |  | 
 | 
| 164 | 0 |     WriteLE32(mac +  0, h0); | 
| 165 | 0 |     WriteLE32(mac +  4, h1); | 
| 166 | 0 |     WriteLE32(mac +  8, h2); | 
| 167 | 0 |     WriteLE32(mac + 12, h3); | 
| 168 |  |  | 
| 169 |  |     /* zero out the state */ | 
| 170 | 0 |     st->h[0] = 0; | 
| 171 | 0 |     st->h[1] = 0; | 
| 172 | 0 |     st->h[2] = 0; | 
| 173 | 0 |     st->h[3] = 0; | 
| 174 | 0 |     st->h[4] = 0; | 
| 175 | 0 |     st->r[0] = 0; | 
| 176 | 0 |     st->r[1] = 0; | 
| 177 | 0 |     st->r[2] = 0; | 
| 178 | 0 |     st->r[3] = 0; | 
| 179 | 0 |     st->r[4] = 0; | 
| 180 | 0 |     st->pad[0] = 0; | 
| 181 | 0 |     st->pad[1] = 0; | 
| 182 | 0 |     st->pad[2] = 0; | 
| 183 | 0 |     st->pad[3] = 0; | 
| 184 | 0 | } | 
| 185 |  |  | 
| 186 | 0 | void poly1305_update(poly1305_context *st, const unsigned char *m, size_t bytes) noexcept { | 
| 187 | 0 |     size_t i; | 
| 188 |  |  | 
| 189 |  |     /* handle leftover */ | 
| 190 | 0 |     if (st->leftover) { | 
| 191 | 0 |         size_t want = (POLY1305_BLOCK_SIZE - st->leftover); | 
| 192 | 0 |         if (want > bytes) { | 
| 193 | 0 |             want = bytes; | 
| 194 | 0 |         } | 
| 195 | 0 |         for (i = 0; i < want; i++) { | 
| 196 | 0 |             st->buffer[st->leftover + i] = m[i]; | 
| 197 | 0 |         } | 
| 198 | 0 |         bytes -= want; | 
| 199 | 0 |         m += want; | 
| 200 | 0 |         st->leftover += want; | 
| 201 | 0 |         if (st->leftover < POLY1305_BLOCK_SIZE) return; | 
| 202 | 0 |         poly1305_blocks(st, st->buffer, POLY1305_BLOCK_SIZE); | 
| 203 | 0 |         st->leftover = 0; | 
| 204 | 0 |     } | 
| 205 |  |  | 
| 206 |  |     /* process full blocks */ | 
| 207 | 0 |     if (bytes >= POLY1305_BLOCK_SIZE) { | 
| 208 | 0 |         size_t want = (bytes & ~(POLY1305_BLOCK_SIZE - 1)); | 
| 209 | 0 |         poly1305_blocks(st, m, want); | 
| 210 | 0 |         m += want; | 
| 211 | 0 |         bytes -= want; | 
| 212 | 0 |     } | 
| 213 |  |  | 
| 214 |  |     /* store leftover */ | 
| 215 | 0 |     if (bytes) { | 
| 216 | 0 |         for (i = 0; i < bytes; i++) { | 
| 217 | 0 |             st->buffer[st->leftover + i] = m[i]; | 
| 218 | 0 |         } | 
| 219 | 0 |         st->leftover += bytes; | 
| 220 | 0 |     } | 
| 221 | 0 | } | 
| 222 |  |  | 
| 223 |  | }  // namespace poly1305_donna |