25'ten fazla konu seçemezsiniz Konular bir harf veya rakamla başlamalı, kısa çizgiler ('-') içerebilir ve en fazla 35 karakter uzunluğunda olabilir.
 
 
 
 
 
 

247 satır
7.7 KiB

  1. /* Copyright (c) 2015, Google Inc.
  2. *
  3. * Permission to use, copy, modify, and/or distribute this software for any
  4. * purpose with or without fee is hereby granted, provided that the above
  5. * copyright notice and this permission notice appear in all copies.
  6. *
  7. * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
  8. * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
  9. * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
  10. * SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
  11. * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
  12. * OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
  13. * CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */
  14. /* This code is mostly taken from the ref10 version of Ed25519 in SUPERCOP
  15. * 20141124 (http://bench.cr.yp.to/supercop.html). That code is released as
  16. * public domain but this file has the ISC license just to keep licencing
  17. * simple.
  18. *
  19. * The field functions are shared by Ed25519 and X25519 where possible. */
  20. #include <openssl/curve25519.h>
  21. #include <string.h>
  22. #include "internal.h"
  23. #if defined(BORINGSSL_X25519_X86_64)
  24. typedef struct { uint64_t v[5]; } fe25519;
  25. /* These functions are defined in asm/x25519-x86_64.S */
  26. void x25519_x86_64_work_cswap(fe25519 *, uint64_t);
  27. void x25519_x86_64_mul(fe25519 *out, const fe25519 *a, const fe25519 *b);
  28. void x25519_x86_64_square(fe25519 *out, const fe25519 *a);
  29. void x25519_x86_64_freeze(fe25519 *);
  30. void x25519_x86_64_ladderstep(fe25519 *work);
  31. static void fe25519_setint(fe25519 *r, unsigned v) {
  32. r->v[0] = v;
  33. r->v[1] = 0;
  34. r->v[2] = 0;
  35. r->v[3] = 0;
  36. r->v[4] = 0;
  37. }
  38. /* Assumes input x being reduced below 2^255 */
  39. static void fe25519_pack(unsigned char r[32], const fe25519 *x) {
  40. fe25519 t;
  41. t = *x;
  42. x25519_x86_64_freeze(&t);
  43. r[0] = (uint8_t)(t.v[0] & 0xff);
  44. r[1] = (uint8_t)((t.v[0] >> 8) & 0xff);
  45. r[2] = (uint8_t)((t.v[0] >> 16) & 0xff);
  46. r[3] = (uint8_t)((t.v[0] >> 24) & 0xff);
  47. r[4] = (uint8_t)((t.v[0] >> 32) & 0xff);
  48. r[5] = (uint8_t)((t.v[0] >> 40) & 0xff);
  49. r[6] = (uint8_t)((t.v[0] >> 48));
  50. r[6] ^= (uint8_t)((t.v[1] << 3) & 0xf8);
  51. r[7] = (uint8_t)((t.v[1] >> 5) & 0xff);
  52. r[8] = (uint8_t)((t.v[1] >> 13) & 0xff);
  53. r[9] = (uint8_t)((t.v[1] >> 21) & 0xff);
  54. r[10] = (uint8_t)((t.v[1] >> 29) & 0xff);
  55. r[11] = (uint8_t)((t.v[1] >> 37) & 0xff);
  56. r[12] = (uint8_t)((t.v[1] >> 45));
  57. r[12] ^= (uint8_t)((t.v[2] << 6) & 0xc0);
  58. r[13] = (uint8_t)((t.v[2] >> 2) & 0xff);
  59. r[14] = (uint8_t)((t.v[2] >> 10) & 0xff);
  60. r[15] = (uint8_t)((t.v[2] >> 18) & 0xff);
  61. r[16] = (uint8_t)((t.v[2] >> 26) & 0xff);
  62. r[17] = (uint8_t)((t.v[2] >> 34) & 0xff);
  63. r[18] = (uint8_t)((t.v[2] >> 42) & 0xff);
  64. r[19] = (uint8_t)((t.v[2] >> 50));
  65. r[19] ^= (uint8_t)((t.v[3] << 1) & 0xfe);
  66. r[20] = (uint8_t)((t.v[3] >> 7) & 0xff);
  67. r[21] = (uint8_t)((t.v[3] >> 15) & 0xff);
  68. r[22] = (uint8_t)((t.v[3] >> 23) & 0xff);
  69. r[23] = (uint8_t)((t.v[3] >> 31) & 0xff);
  70. r[24] = (uint8_t)((t.v[3] >> 39) & 0xff);
  71. r[25] = (uint8_t)((t.v[3] >> 47));
  72. r[25] ^= (uint8_t)((t.v[4] << 4) & 0xf0);
  73. r[26] = (uint8_t)((t.v[4] >> 4) & 0xff);
  74. r[27] = (uint8_t)((t.v[4] >> 12) & 0xff);
  75. r[28] = (uint8_t)((t.v[4] >> 20) & 0xff);
  76. r[29] = (uint8_t)((t.v[4] >> 28) & 0xff);
  77. r[30] = (uint8_t)((t.v[4] >> 36) & 0xff);
  78. r[31] = (uint8_t)((t.v[4] >> 44));
  79. }
  80. static void fe25519_unpack(fe25519 *r, const uint8_t x[32]) {
  81. r->v[0] = x[0];
  82. r->v[0] += (uint64_t)x[1] << 8;
  83. r->v[0] += (uint64_t)x[2] << 16;
  84. r->v[0] += (uint64_t)x[3] << 24;
  85. r->v[0] += (uint64_t)x[4] << 32;
  86. r->v[0] += (uint64_t)x[5] << 40;
  87. r->v[0] += ((uint64_t)x[6] & 7) << 48;
  88. r->v[1] = x[6] >> 3;
  89. r->v[1] += (uint64_t)x[7] << 5;
  90. r->v[1] += (uint64_t)x[8] << 13;
  91. r->v[1] += (uint64_t)x[9] << 21;
  92. r->v[1] += (uint64_t)x[10] << 29;
  93. r->v[1] += (uint64_t)x[11] << 37;
  94. r->v[1] += ((uint64_t)x[12] & 63) << 45;
  95. r->v[2] = x[12] >> 6;
  96. r->v[2] += (uint64_t)x[13] << 2;
  97. r->v[2] += (uint64_t)x[14] << 10;
  98. r->v[2] += (uint64_t)x[15] << 18;
  99. r->v[2] += (uint64_t)x[16] << 26;
  100. r->v[2] += (uint64_t)x[17] << 34;
  101. r->v[2] += (uint64_t)x[18] << 42;
  102. r->v[2] += ((uint64_t)x[19] & 1) << 50;
  103. r->v[3] = x[19] >> 1;
  104. r->v[3] += (uint64_t)x[20] << 7;
  105. r->v[3] += (uint64_t)x[21] << 15;
  106. r->v[3] += (uint64_t)x[22] << 23;
  107. r->v[3] += (uint64_t)x[23] << 31;
  108. r->v[3] += (uint64_t)x[24] << 39;
  109. r->v[3] += ((uint64_t)x[25] & 15) << 47;
  110. r->v[4] = x[25] >> 4;
  111. r->v[4] += (uint64_t)x[26] << 4;
  112. r->v[4] += (uint64_t)x[27] << 12;
  113. r->v[4] += (uint64_t)x[28] << 20;
  114. r->v[4] += (uint64_t)x[29] << 28;
  115. r->v[4] += (uint64_t)x[30] << 36;
  116. r->v[4] += ((uint64_t)x[31] & 127) << 44;
  117. }
  118. static void fe25519_invert(fe25519 *r, const fe25519 *x) {
  119. fe25519 z2;
  120. fe25519 z9;
  121. fe25519 z11;
  122. fe25519 z2_5_0;
  123. fe25519 z2_10_0;
  124. fe25519 z2_20_0;
  125. fe25519 z2_50_0;
  126. fe25519 z2_100_0;
  127. fe25519 t;
  128. int i;
  129. /* 2 */ x25519_x86_64_square(&z2, x);
  130. /* 4 */ x25519_x86_64_square(&t, &z2);
  131. /* 8 */ x25519_x86_64_square(&t, &t);
  132. /* 9 */ x25519_x86_64_mul(&z9, &t, x);
  133. /* 11 */ x25519_x86_64_mul(&z11, &z9, &z2);
  134. /* 22 */ x25519_x86_64_square(&t, &z11);
  135. /* 2^5 - 2^0 = 31 */ x25519_x86_64_mul(&z2_5_0, &t, &z9);
  136. /* 2^6 - 2^1 */ x25519_x86_64_square(&t, &z2_5_0);
  137. /* 2^20 - 2^10 */ for (i = 1; i < 5; i++) { x25519_x86_64_square(&t, &t); }
  138. /* 2^10 - 2^0 */ x25519_x86_64_mul(&z2_10_0, &t, &z2_5_0);
  139. /* 2^11 - 2^1 */ x25519_x86_64_square(&t, &z2_10_0);
  140. /* 2^20 - 2^10 */ for (i = 1; i < 10; i++) { x25519_x86_64_square(&t, &t); }
  141. /* 2^20 - 2^0 */ x25519_x86_64_mul(&z2_20_0, &t, &z2_10_0);
  142. /* 2^21 - 2^1 */ x25519_x86_64_square(&t, &z2_20_0);
  143. /* 2^40 - 2^20 */ for (i = 1; i < 20; i++) { x25519_x86_64_square(&t, &t); }
  144. /* 2^40 - 2^0 */ x25519_x86_64_mul(&t, &t, &z2_20_0);
  145. /* 2^41 - 2^1 */ x25519_x86_64_square(&t, &t);
  146. /* 2^50 - 2^10 */ for (i = 1; i < 10; i++) { x25519_x86_64_square(&t, &t); }
  147. /* 2^50 - 2^0 */ x25519_x86_64_mul(&z2_50_0, &t, &z2_10_0);
  148. /* 2^51 - 2^1 */ x25519_x86_64_square(&t, &z2_50_0);
  149. /* 2^100 - 2^50 */ for (i = 1; i < 50; i++) { x25519_x86_64_square(&t, &t); }
  150. /* 2^100 - 2^0 */ x25519_x86_64_mul(&z2_100_0, &t, &z2_50_0);
  151. /* 2^101 - 2^1 */ x25519_x86_64_square(&t, &z2_100_0);
  152. /* 2^200 - 2^100 */ for (i = 1; i < 100; i++) {
  153. x25519_x86_64_square(&t, &t);
  154. }
  155. /* 2^200 - 2^0 */ x25519_x86_64_mul(&t, &t, &z2_100_0);
  156. /* 2^201 - 2^1 */ x25519_x86_64_square(&t, &t);
  157. /* 2^250 - 2^50 */ for (i = 1; i < 50; i++) { x25519_x86_64_square(&t, &t); }
  158. /* 2^250 - 2^0 */ x25519_x86_64_mul(&t, &t, &z2_50_0);
  159. /* 2^251 - 2^1 */ x25519_x86_64_square(&t, &t);
  160. /* 2^252 - 2^2 */ x25519_x86_64_square(&t, &t);
  161. /* 2^253 - 2^3 */ x25519_x86_64_square(&t, &t);
  162. /* 2^254 - 2^4 */ x25519_x86_64_square(&t, &t);
  163. /* 2^255 - 2^5 */ x25519_x86_64_square(&t, &t);
  164. /* 2^255 - 21 */ x25519_x86_64_mul(r, &t, &z11);
  165. }
  166. static void mladder(fe25519 *xr, fe25519 *zr, const uint8_t s[32]) {
  167. fe25519 work[5];
  168. work[0] = *xr;
  169. fe25519_setint(work + 1, 1);
  170. fe25519_setint(work + 2, 0);
  171. work[3] = *xr;
  172. fe25519_setint(work + 4, 1);
  173. int i, j;
  174. uint8_t prevbit = 0;
  175. j = 6;
  176. for (i = 31; i >= 0; i--) {
  177. while (j >= 0) {
  178. const uint8_t bit = 1 & (s[i] >> j);
  179. const uint64_t swap = bit ^ prevbit;
  180. prevbit = bit;
  181. x25519_x86_64_work_cswap(work + 1, swap);
  182. x25519_x86_64_ladderstep(work);
  183. j -= 1;
  184. }
  185. j = 7;
  186. }
  187. *xr = work[1];
  188. *zr = work[2];
  189. }
  190. void x25519_x86_64(uint8_t out[32], const uint8_t scalar[32],
  191. const uint8_t point[32]) {
  192. uint8_t e[32];
  193. memcpy(e, scalar, sizeof(e));
  194. e[0] &= 248;
  195. e[31] &= 127;
  196. e[31] |= 64;
  197. fe25519 t;
  198. fe25519 z;
  199. fe25519_unpack(&t, point);
  200. mladder(&t, &z, e);
  201. fe25519_invert(&z, &z);
  202. x25519_x86_64_mul(&t, &t, &z);
  203. fe25519_pack(out, &t);
  204. }
  205. #endif /* BORINGSSL_X25519_X86_64 */