From 6a289b3ec439d24729cdbdb69b8d99b82a9904fc Mon Sep 17 00:00:00 2001
From: David Benjamin <davidben@google.com>
Date: Sun, 22 Apr 2018 22:34:29 -0400
Subject: [PATCH] Remove EC_POINTs_make_affine and related logic.

This does not appear to actually pull its weight. The purpose of this
logic is to switch some adds to the faster add_mixed in the wNAF code,
at the cost of a rather expensive inversion. This optimization kicks in
for generic curves, so P-384 and P-521:

With:
Did 32130 ECDSA P-384 signing operations in 30077563us (1068.2 ops/sec)
Did 27456 ECDSA P-384 verify operations in 30073086us (913.0 ops/sec)
Did 14122 ECDSA P-521 signing operations in 30077407us (469.5 ops/sec)
Did 11973 ECDSA P-521 verify operations in 30037330us (398.6 ops/sec)

Without:
Did 32445 ECDSA P-384 signing operations in 30069721us (1079.0 ops/sec)
Did 27056 ECDSA P-384 verify operations in 30032303us (900.9 ops/sec)
Did 13905 ECDSA P-521 signing operations in 30000430us (463.5 ops/sec)
Did 11433 ECDSA P-521 verify operations in 30021876us (380.8 ops/sec)

For single-point multiplication, the optimization is not useful. This
makes sense as we only have one table's worth of additions to convert
but still pay for the inversion. For double-point multiplication, it is
slightly useful for P-384 and very useful for P-521. However, the next
change to stack-allocate EC_FELEMs will more than compensate for
removing it.  (The immediate goal here is to simplify the EC_FELEM
story.)

Additionally, that this optimization was not useful for single-point
multiplication implies that, should we wish to recover this, a modest
8-entry pre-computed (affine) base point table should have the same
effect or better.

Update-Note: I do not believe anything was calling either of these
functions. (If necessary, we can always add no-op stubs as whether a
point is affine is not visible to external code. It previously kicked in
some optimizations, but those were removed for constant-time needs
anyway.)

Bug: 239
Change-Id: Ic9c51b001c45595cfe592274c7d5d652f4234839
Reviewed-on: https://boringssl-review.googlesource.com/27667
Reviewed-by: Adam Langley <agl@google.com>
---
 crypto/fipsmodule/ec/ec.c       |  32 +----
 crypto/fipsmodule/ec/internal.h |  10 +-
 crypto/fipsmodule/ec/simple.c   | 231 ++------------------------------
 crypto/fipsmodule/ec/wnaf.c     |  10 +-
 include/openssl/ec.h            |  11 --
 5 files changed, 17 insertions(+), 277 deletions(-)

diff --git a/crypto/fipsmodule/ec/ec.c b/crypto/fipsmodule/ec/ec.c
index 07f9c343..1b683276 100644
--- a/crypto/fipsmodule/ec/ec.c
+++ b/crypto/fipsmodule/ec/ec.c
@@ -723,25 +723,6 @@ int EC_POINT_cmp(const EC_GROUP *group, const EC_POINT *a, const EC_POINT *b,
   return ec_GFp_simple_cmp(group, a, b, ctx);
 }
 
-int EC_POINT_make_affine(const EC_GROUP *group, EC_POINT *point, BN_CTX *ctx) {
-  if (EC_GROUP_cmp(group, point->group, NULL) != 0) {
-    OPENSSL_PUT_ERROR(EC, EC_R_INCOMPATIBLE_OBJECTS);
-    return 0;
-  }
-  return ec_GFp_simple_make_affine(group, point, ctx);
-}
-
-int EC_POINTs_make_affine(const EC_GROUP *group, size_t num, EC_POINT *points[],
-                          BN_CTX *ctx) {
-  for (size_t i = 0; i < num; i++) {
-    if (EC_GROUP_cmp(group, points[i]->group, NULL) != 0) {
-      OPENSSL_PUT_ERROR(EC, EC_R_INCOMPATIBLE_OBJECTS);
-      return 0;
-    }
-  }
-  return ec_GFp_simple_points_make_affine(group, num, points, ctx);
-}
-
 int EC_POINT_get_affine_coordinates_GFp(const EC_GROUP *group,
                                         const EC_POINT *point, BIGNUM *x,
                                         BIGNUM *y, BN_CTX *ctx) {
@@ -792,18 +773,7 @@ int EC_POINT_add(const EC_GROUP *group, EC_POINT *r, const EC_POINT *a,
     OPENSSL_PUT_ERROR(EC, EC_R_INCOMPATIBLE_OBJECTS);
     return 0;
   }
-  return ec_GFp_simple_add(group, r, a, b, 0 /* both Jacobian */, ctx);
-}
-
-int ec_point_add_mixed(const EC_GROUP *group, EC_POINT *r, const EC_POINT *a,
-                       const EC_POINT *b, BN_CTX *ctx) {
-  if (EC_GROUP_cmp(group, r->group, NULL) != 0 ||
-      EC_GROUP_cmp(group, a->group, NULL) != 0 ||
-      EC_GROUP_cmp(group, b->group, NULL) != 0) {
-    OPENSSL_PUT_ERROR(EC, EC_R_INCOMPATIBLE_OBJECTS);
-    return 0;
-  }
-  return ec_GFp_simple_add(group, r, a, b, 1 /* |b| is affine */, ctx);
+  return ec_GFp_simple_add(group, r, a, b, ctx);
 }
 
 int EC_POINT_dbl(const EC_GROUP *group, EC_POINT *r, const EC_POINT *a,
diff --git a/crypto/fipsmodule/ec/internal.h b/crypto/fipsmodule/ec/internal.h
index 7f72c31c..66e18436 100644
--- a/crypto/fipsmodule/ec/internal.h
+++ b/crypto/fipsmodule/ec/internal.h
@@ -216,11 +216,6 @@ void ec_scalar_mul_montgomery(const EC_GROUP *group, EC_SCALAR *r,
 void ec_scalar_inv_montgomery(const EC_GROUP *group, EC_SCALAR *r,
                               const EC_SCALAR *a);
 
-// ec_point_add_mixed behaves like |EC_POINT_add|, but |&b->Z| must be zero or
-// one.
-int ec_point_add_mixed(const EC_GROUP *group, EC_POINT *r, const EC_POINT *a,
-                       const EC_POINT *b, BN_CTX *ctx);
-
 // ec_point_mul_scalar sets |r| to generator * |g_scalar| + |p| *
 // |p_scalar|. Unlike other functions which take |EC_SCALAR|, |g_scalar| and
 // |p_scalar| need not be fully reduced. They need only contain as many bits as
@@ -266,7 +261,7 @@ int ec_GFp_simple_point_set_affine_coordinates(const EC_GROUP *, EC_POINT *,
                                                const BIGNUM *x, const BIGNUM *y,
                                                BN_CTX *);
 int ec_GFp_simple_add(const EC_GROUP *, EC_POINT *r, const EC_POINT *a,
-                      const EC_POINT *b, int mixed, BN_CTX *);
+                      const EC_POINT *b, BN_CTX *);
 int ec_GFp_simple_dbl(const EC_GROUP *, EC_POINT *r, const EC_POINT *a,
                       BN_CTX *);
 int ec_GFp_simple_invert(const EC_GROUP *, EC_POINT *, BN_CTX *);
@@ -274,9 +269,6 @@ int ec_GFp_simple_is_at_infinity(const EC_GROUP *, const EC_POINT *);
 int ec_GFp_simple_is_on_curve(const EC_GROUP *, const EC_POINT *, BN_CTX *);
 int ec_GFp_simple_cmp(const EC_GROUP *, const EC_POINT *a, const EC_POINT *b,
                       BN_CTX *);
-int ec_GFp_simple_make_affine(const EC_GROUP *, EC_POINT *, BN_CTX *);
-int ec_GFp_simple_points_make_affine(const EC_GROUP *, size_t num,
-                                     EC_POINT * [], BN_CTX *);
 void ec_simple_scalar_inv_montgomery(const EC_GROUP *group, EC_SCALAR *r,
                                      const EC_SCALAR *a);
 
diff --git a/crypto/fipsmodule/ec/simple.c b/crypto/fipsmodule/ec/simple.c
index 4fb394c5..511788c4 100644
--- a/crypto/fipsmodule/ec/simple.c
+++ b/crypto/fipsmodule/ec/simple.c
@@ -303,11 +303,7 @@ err:
 }
 
 int ec_GFp_simple_add(const EC_GROUP *group, EC_POINT *r, const EC_POINT *a,
-                      const EC_POINT *b, int mixed, BN_CTX *ctx) {
-  if (mixed) {
-    assert(BN_is_zero(&b->Z) || BN_cmp(&b->Z, &group->one) == 0);
-  }
-
+                      const EC_POINT *b, BN_CTX *ctx) {
   int (*field_mul)(const EC_GROUP *, BIGNUM *, const BIGNUM *, const BIGNUM *,
                    BN_CTX *);
   int (*field_sqr)(const EC_GROUP *, BIGNUM *, const BIGNUM *, BN_CTX *);
@@ -354,25 +350,17 @@ int ec_GFp_simple_add(const EC_GROUP *group, EC_POINT *r, const EC_POINT *a,
   // ('r' might be one of 'a' or 'b'.)
 
   // n1, n2
-  if (mixed) {
-    if (!BN_copy(n1, &a->X) || !BN_copy(n2, &a->Y)) {
-      goto end;
-    }
-    // n1 = X_a
-    // n2 = Y_a
-  } else {
-    if (!field_sqr(group, n0, &b->Z, ctx) ||
-        !field_mul(group, n1, &a->X, n0, ctx)) {
-      goto end;
-    }
-    // n1 = X_a * Z_b^2
+  if (!field_sqr(group, n0, &b->Z, ctx) ||
+      !field_mul(group, n1, &a->X, n0, ctx)) {
+    goto end;
+  }
+  // n1 = X_a * Z_b^2
 
-    if (!field_mul(group, n0, n0, &b->Z, ctx) ||
-        !field_mul(group, n2, &a->Y, n0, ctx)) {
-      goto end;
-    }
-    // n2 = Y_a * Z_b^3
+  if (!field_mul(group, n0, n0, &b->Z, ctx) ||
+      !field_mul(group, n2, &a->Y, n0, ctx)) {
+    goto end;
   }
+  // n2 = Y_a * Z_b^3
 
   // n3, n4
   if (!field_sqr(group, n0, &a->Z, ctx) ||
@@ -419,14 +407,8 @@ int ec_GFp_simple_add(const EC_GROUP *group, EC_POINT *r, const EC_POINT *a,
   // 'n8' = n2 + n4
 
   // Z_r
-  if (mixed) {
-    if (!BN_copy(n0, &a->Z)) {
-      goto end;
-    }
-  } else if (!field_mul(group, n0, &a->Z, &b->Z, ctx)) {
-    goto end;
-  }
-  if (!field_mul(group, &r->Z, n0, n5, ctx)) {
+  if (!field_mul(group, n0, &a->Z, &b->Z, ctx) ||
+      !field_mul(group, &r->Z, n0, n5, ctx)) {
     goto end;
   }
 
@@ -814,192 +796,3 @@ end:
   BN_CTX_free(new_ctx);
   return ret;
 }
-
-int ec_GFp_simple_make_affine(const EC_GROUP *group, EC_POINT *point,
-                              BN_CTX *ctx) {
-  BN_CTX *new_ctx = NULL;
-  BIGNUM *x, *y;
-  int ret = 0;
-
-  if (BN_cmp(&point->Z, &group->one) == 0 ||
-      EC_POINT_is_at_infinity(group, point)) {
-    return 1;
-  }
-
-  if (ctx == NULL) {
-    ctx = new_ctx = BN_CTX_new();
-    if (ctx == NULL) {
-      return 0;
-    }
-  }
-
-  BN_CTX_start(ctx);
-  x = BN_CTX_get(ctx);
-  y = BN_CTX_get(ctx);
-  if (y == NULL) {
-    goto err;
-  }
-
-  if (!EC_POINT_get_affine_coordinates_GFp(group, point, x, y, ctx) ||
-      !EC_POINT_set_affine_coordinates_GFp(group, point, x, y, ctx)) {
-    goto err;
-  }
-  if (BN_cmp(&point->Z, &group->one) != 0) {
-    OPENSSL_PUT_ERROR(EC, ERR_R_INTERNAL_ERROR);
-    goto err;
-  }
-
-  ret = 1;
-
-err:
-  BN_CTX_end(ctx);
-  BN_CTX_free(new_ctx);
-  return ret;
-}
-
-int ec_GFp_simple_points_make_affine(const EC_GROUP *group, size_t num,
-                                     EC_POINT *points[], BN_CTX *ctx) {
-  BN_CTX *new_ctx = NULL;
-  BIGNUM *tmp, *tmp_Z;
-  BIGNUM **prod_Z = NULL;
-  int ret = 0;
-
-  if (num == 0) {
-    return 1;
-  }
-
-  if (ctx == NULL) {
-    ctx = new_ctx = BN_CTX_new();
-    if (ctx == NULL) {
-      return 0;
-    }
-  }
-
-  BN_CTX_start(ctx);
-  tmp = BN_CTX_get(ctx);
-  tmp_Z = BN_CTX_get(ctx);
-  if (tmp == NULL || tmp_Z == NULL) {
-    goto err;
-  }
-
-  prod_Z = OPENSSL_malloc(num * sizeof(prod_Z[0]));
-  if (prod_Z == NULL) {
-    goto err;
-  }
-  OPENSSL_memset(prod_Z, 0, num * sizeof(prod_Z[0]));
-  for (size_t i = 0; i < num; i++) {
-    prod_Z[i] = BN_new();
-    if (prod_Z[i] == NULL) {
-      goto err;
-    }
-  }
-
-  // Set each prod_Z[i] to the product of points[0]->Z .. points[i]->Z,
-  // skipping any zero-valued inputs (pretend that they're 1).
-
-  if (!BN_is_zero(&points[0]->Z)) {
-    if (!BN_copy(prod_Z[0], &points[0]->Z)) {
-      goto err;
-    }
-  } else {
-    if (BN_copy(prod_Z[0], &group->one) == NULL) {
-      goto err;
-    }
-  }
-
-  for (size_t i = 1; i < num; i++) {
-    if (!BN_is_zero(&points[i]->Z)) {
-      if (!group->meth->field_mul(group, prod_Z[i], prod_Z[i - 1],
-                                  &points[i]->Z, ctx)) {
-        goto err;
-      }
-    } else {
-      if (!BN_copy(prod_Z[i], prod_Z[i - 1])) {
-        goto err;
-      }
-    }
-  }
-
-  // Now use a single explicit inversion to replace every non-zero points[i]->Z
-  // by its inverse. We use |BN_mod_inverse_odd| instead of doing a constant-
-  // time inversion using Fermat's Little Theorem because this function is
-  // usually only used for converting multiples of a public key point to
-  // affine, and a public key point isn't secret. If we were to use Fermat's
-  // Little Theorem then the cost of the inversion would usually be so high
-  // that converting the multiples to affine would be counterproductive.
-  int no_inverse;
-  if (!BN_mod_inverse_odd(tmp, &no_inverse, prod_Z[num - 1], &group->field,
-                          ctx)) {
-    OPENSSL_PUT_ERROR(EC, ERR_R_BN_LIB);
-    goto err;
-  }
-
-  if (group->meth->field_encode != NULL) {
-    // In the Montgomery case, we just turned R*H (representing H)
-    // into 1/(R*H), but we need R*(1/H) (representing 1/H);
-    // i.e. we need to multiply by the Montgomery factor twice.
-    if (!group->meth->field_encode(group, tmp, tmp, ctx) ||
-        !group->meth->field_encode(group, tmp, tmp, ctx)) {
-      goto err;
-    }
-  }
-
-  for (size_t i = num - 1; i > 0; --i) {
-    // Loop invariant: tmp is the product of the inverses of
-    // points[0]->Z .. points[i]->Z (zero-valued inputs skipped).
-    if (BN_is_zero(&points[i]->Z)) {
-      continue;
-    }
-
-    // Set tmp_Z to the inverse of points[i]->Z (as product
-    // of Z inverses 0 .. i, Z values 0 .. i - 1).
-    if (!group->meth->field_mul(group, tmp_Z, prod_Z[i - 1], tmp, ctx) ||
-        // Update tmp to satisfy the loop invariant for i - 1.
-        !group->meth->field_mul(group, tmp, tmp, &points[i]->Z, ctx) ||
-        // Replace points[i]->Z by its inverse.
-        !BN_copy(&points[i]->Z, tmp_Z)) {
-      goto err;
-    }
-  }
-
-  // Replace points[0]->Z by its inverse.
-  if (!BN_is_zero(&points[0]->Z) && !BN_copy(&points[0]->Z, tmp)) {
-    goto err;
-  }
-
-  // Finally, fix up the X and Y coordinates for all points.
-  for (size_t i = 0; i < num; i++) {
-    EC_POINT *p = points[i];
-
-    if (!BN_is_zero(&p->Z)) {
-      // turn (X, Y, 1/Z) into (X/Z^2, Y/Z^3, 1).
-      if (!group->meth->field_sqr(group, tmp, &p->Z, ctx) ||
-          !group->meth->field_mul(group, &p->X, &p->X, tmp, ctx) ||
-          !group->meth->field_mul(group, tmp, tmp, &p->Z, ctx) ||
-          !group->meth->field_mul(group, &p->Y, &p->Y, tmp, ctx)) {
-        goto err;
-      }
-
-      if (BN_copy(&p->Z, &group->one) == NULL) {
-        goto err;
-      }
-    }
-  }
-
-  ret = 1;
-
-err:
-  BN_CTX_end(ctx);
-  BN_CTX_free(new_ctx);
-  if (prod_Z != NULL) {
-    for (size_t i = 0; i < num; i++) {
-      if (prod_Z[i] == NULL) {
-        break;
-      }
-      BN_clear_free(prod_Z[i]);
-    }
-    OPENSSL_free(prod_Z);
-  }
-
-  return ret;
-}
diff --git a/crypto/fipsmodule/ec/wnaf.c b/crypto/fipsmodule/ec/wnaf.c
index 49fc8bca..0209d983 100644
--- a/crypto/fipsmodule/ec/wnaf.c
+++ b/crypto/fipsmodule/ec/wnaf.c
@@ -290,11 +290,7 @@ int ec_wNAF_mul(const EC_GROUP *group, EC_POINT *r, const EC_SCALAR *g_scalar,
   }
 
   tmp = EC_POINT_new(group);
-  if (tmp == NULL ||
-      // Convert the points to affine coordinates. This allows us to use the
-      // slightly faster |ec_point_add_mixed|. The conversion itself is not
-      // cheap, but it is worthwhile when there are two points.
-      !EC_POINTs_make_affine(group, total_precomp, precomp_storage, ctx)) {
+  if (tmp == NULL) {
     goto err;
   }
 
@@ -313,7 +309,7 @@ int ec_wNAF_mul(const EC_GROUP *group, EC_POINT *r, const EC_SCALAR *g_scalar,
           goto err;
         }
         r_is_at_infinity = 0;
-      } else if (!ec_point_add_mixed(group, r, r, tmp, ctx)) {
+      } else if (!EC_POINT_add(group, r, r, tmp, ctx)) {
         goto err;
       }
     }
@@ -327,7 +323,7 @@ int ec_wNAF_mul(const EC_GROUP *group, EC_POINT *r, const EC_SCALAR *g_scalar,
           goto err;
         }
         r_is_at_infinity = 0;
-      } else if (!ec_point_add_mixed(group, r, r, tmp, ctx)) {
+      } else if (!EC_POINT_add(group, r, r, tmp, ctx)) {
         goto err;
       }
     }
diff --git a/include/openssl/ec.h b/include/openssl/ec.h
index 5eee3661..53f22fd0 100644
--- a/include/openssl/ec.h
+++ b/include/openssl/ec.h
@@ -195,17 +195,6 @@ OPENSSL_EXPORT int EC_POINT_is_on_curve(const EC_GROUP *group,
 OPENSSL_EXPORT int EC_POINT_cmp(const EC_GROUP *group, const EC_POINT *a,
                                 const EC_POINT *b, BN_CTX *ctx);
 
-// EC_POINT_make_affine converts |point| to affine form, internally. It returns
-// one on success and zero otherwise. If |ctx| is not NULL, it may be used.
-OPENSSL_EXPORT int EC_POINT_make_affine(const EC_GROUP *group, EC_POINT *point,
-                                        BN_CTX *ctx);
-
-// EC_POINTs_make_affine converts |num| points from |points| to affine form,
-// internally. It returns one on success and zero otherwise. If |ctx| is not
-// NULL, it may be used.
-OPENSSL_EXPORT int EC_POINTs_make_affine(const EC_GROUP *group, size_t num,
-                                         EC_POINT *points[], BN_CTX *ctx);
-
 
 // Point conversion.