crypto/ec/ecp_nistputil.c

238384Sjkim/* crypto/ec/ecp_nistputil.c */
238384Sjkim/*
238384Sjkim * Written by Bodo Moeller for the OpenSSL project.
238384Sjkim */
238384Sjkim/* Copyright 2011 Google Inc.
238384Sjkim *
238384Sjkim * Licensed under the Apache License, Version 2.0 (the "License");
238384Sjkim *
238384Sjkim * you may not use this file except in compliance with the License.
238384Sjkim * You may obtain a copy of the License at
238384Sjkim *
238384Sjkim *     http://www.apache.org/licenses/LICENSE-2.0
238384Sjkim *
238384Sjkim *  Unless required by applicable law or agreed to in writing, software
238384Sjkim *  distributed under the License is distributed on an "AS IS" BASIS,
238384Sjkim *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
238384Sjkim *  See the License for the specific language governing permissions and
238384Sjkim *  limitations under the License.
238384Sjkim */
238384Sjkim
238384Sjkim#include <openssl/opensslconf.h>
238384Sjkim#ifndef OPENSSL_NO_EC_NISTP_64_GCC_128
238384Sjkim
238384Sjkim/*
238384Sjkim * Common utility functions for ecp_nistp224.c, ecp_nistp256.c, ecp_nistp521.c.
238384Sjkim */
238384Sjkim
280304Sjkim# include <stddef.h>
280304Sjkim# include "ec_lcl.h"
238384Sjkim
/*
 * Convert an array of points into affine coordinates, in place.
 *
 * Each point (X, Y, Z) with Z != 0 is replaced by (X/(Z^2), Y/(Z^3), 1).
 * A point with Z = 0 (the point at infinity) is left unchanged.  This is
 * essentially an equivalent of EC_POINTs_make_affine(), but it works on the
 * internal point representation used by ecp_nistp###.c rather than on
 * (BIGNUM-based) EC_POINT data structures.
 *
 * Only a single call to felem_inv is made, whatever the value of 'num': the
 * running products of the Z coordinates are accumulated first, the last
 * product is inverted, and the individual inverses 1/Z(i) are then peeled
 * off from the last point back to the first.
 *
 *   num            number of points in point_array; if 0, nothing is done
 *   point_array    input/output buffer holding 'num' points, each stored as
 *                  three consecutive field elements X, Y, Z
 *   felem_size     size in bytes of one field element
 *   tmp_felems     scratch buffer of 'num'+1 field elements; its contents
 *                  are overwritten
 *   felem_one      sets *out to the field element 1
 *   felem_is_zero  returns nonzero iff *in is the field element 0
 *   felem_assign   copies *in to *out
 *   felem_square   out = in^2
 *   felem_mul      out = in1 * in2
 *   felem_inv      out = 1/in
 *   felem_contract applied to the final X and Y of every converted point
 *
 * The callbacks are invoked with 'out' aliasing an input (for example
 * felem_mul(X, X, Z) and felem_inv(t, t)), so they have to tolerate that.
 */
void ec_GFp_nistp_points_make_affine_internal(size_t num, void *point_array,
                                              size_t felem_size,
                                              void *tmp_felems,
                                              void (*felem_one) (void *out),
                                              int (*felem_is_zero) (const void
                                                                    *in),
                                              void (*felem_assign) (void *out,
                                                                    const void
                                                                    *in),
                                              void (*felem_square) (void *out,
                                                                    const void
                                                                    *in),
                                              void (*felem_mul) (void *out,
                                                                 const void
                                                                 *in1,
                                                                 const void
                                                                 *in2),
                                              void (*felem_inv) (void *out,
                                                                 const void
                                                                 *in),
                                              void (*felem_contract) (void
                                                                      *out,
                                                                      const
                                                                      void
                                                                      *in))
{
    unsigned char *const points = point_array;
    unsigned char *const prods = tmp_felems;
    const size_t point_size = 3 * felem_size;
    unsigned char *inv_z;       /* extra scratch element, index 'num' */
    unsigned char *last;
    size_t i;

    /*
     * An empty array has no Z(0) to look at and no product to invert;
     * touching either would be an out-of-bounds access.
     */
    if (num == 0) {
        return;
    }

    inv_z = prods + num * felem_size;

    /*
     * Forward pass: prods[i] becomes the product of Z(0) .. Z(i), skipping
     * any zero-valued factors (if Z(i) = 0 we pretend that Z(i) = 1).
     */
    {
        unsigned char *z0 = points + 2 * felem_size;

        if (!felem_is_zero(z0)) {
            felem_assign(prods, z0);
        } else {
            felem_one(prods);
        }
    }
    for (i = 1; i < num; i++) {
        unsigned char *z = points + i * point_size + 2 * felem_size;
        unsigned char *cur = prods + i * felem_size;

        if (!felem_is_zero(z)) {
            felem_mul(cur, cur - felem_size, z);
        } else {
            felem_assign(cur, cur - felem_size);
        }
    }

    /* The one and only inversion: 1/(Z(0) * ... * Z(num-1)). */
    last = prods + (num - 1) * felem_size;
    felem_inv(last, last);

    /*
     * Backward pass.  On entry to iteration i, prods[i] holds the inverse
     * of the product Z(0) .. Z(i), and (for i > 0) prods[i-1] still holds
     * the plain product Z(0) .. Z(i-1).
     */
    for (i = num; i-- > 0;) {
        unsigned char *x = points + i * point_size;
        unsigned char *y = x + felem_size;
        unsigned char *z = y + felem_size;
        unsigned char *cur = prods + i * felem_size;

        /* inv_z = 1/Z(i) (or 1 if Z(i) was skipped as zero) */
        if (i > 0) {
            felem_mul(inv_z, cur - felem_size, cur);
        } else {
            felem_assign(inv_z, cur);
        }

        if (!felem_is_zero(z)) {
            if (i > 0) {
                /*
                 * For the next iteration, replace prods[i-1] by the
                 * inverse of the product Z(0) .. Z(i-1).
                 */
                felem_mul(cur - felem_size, cur, z);
            }

            /*
             * Convert point (X, Y, Z) into affine form
             * (X/(Z^2), Y/(Z^3), 1); Z doubles as a temporary.
             */
            felem_square(z, inv_z);     /* 1/(Z^2) */
            felem_mul(x, x, z);         /* X/(Z^2) */
            felem_mul(z, z, inv_z);     /* 1/(Z^3) */
            felem_mul(y, y, z);         /* Y/(Z^3) */
            felem_contract(x, x);
            felem_contract(y, y);
            felem_one(z);
        } else if (i > 0) {
            /*
             * Z(i) contributed no factor, so the inverse carries over
             * to prods[i-1] unchanged.
             */
            felem_assign(cur - felem_size, cur);
        }
    }
}
238384Sjkim
280304Sjkim/*-
238384Sjkim * This function looks at 5+1 scalar bits (5 current, 1 adjacent less
238384Sjkim * significant bit), and recodes them into a signed digit for use in fast point
238384Sjkim * multiplication: the use of signed rather than unsigned digits means that
238384Sjkim * fewer points need to be precomputed, given that point inversion is easy
238384Sjkim * (a precomputed point dP makes -dP available as well).
238384Sjkim *
238384Sjkim * BACKGROUND:
238384Sjkim *
238384Sjkim * Signed digits for multiplication were introduced by Booth ("A signed binary
238384Sjkim * multiplication technique", Quart. Journ. Mech. and Applied Math., vol. IV,
238384Sjkim * pt. 2 (1951), pp. 236-240), in that case for multiplication of integers.
238384Sjkim * Booth's original encoding did not generally improve the density of nonzero
238384Sjkim * digits over the binary representation, and was merely meant to simplify the
238384Sjkim * handling of signed factors given in two's complement; but it has since been
238384Sjkim * shown to be the basis of various signed-digit representations that do have
238384Sjkim * further advantages, including the wNAF, using the following general approach:
238384Sjkim *
238384Sjkim * (1) Given a binary representation
238384Sjkim *
238384Sjkim *       b_k  ...  b_2  b_1  b_0,
238384Sjkim *
238384Sjkim *     of a nonnegative integer (b_k in {0, 1}), rewrite it in digits 0, 1, -1
238384Sjkim *     by using bit-wise subtraction as follows:
238384Sjkim *
 *        b_k     b_(k-1)  ...  b_2  b_1  b_0
 *      -         b_k      ...  b_3  b_2  b_1  b_0
 *       -----------------------------------------
 *        s_(k+1) s_k      ...  s_3  s_2  s_1  s_0
 *
 *     A left-shift followed by subtraction of the original value yields a new
 *     representation of the same value, using signed bits s_i = b_(i-1) - b_i
 *     (taking b_(-1) = b_(k+1) = 0).
238384Sjkim *     This representation from Booth's paper has since appeared in the
238384Sjkim *     literature under a variety of different names including "reversed binary
238384Sjkim *     form", "alternating greedy expansion", "mutual opposite form", and
238384Sjkim *     "sign-alternating {+-1}-representation".
238384Sjkim *
238384Sjkim *     An interesting property is that among the nonzero bits, values 1 and -1
238384Sjkim *     strictly alternate.
238384Sjkim *
238384Sjkim * (2) Various window schemes can be applied to the Booth representation of
238384Sjkim *     integers: for example, right-to-left sliding windows yield the wNAF
238384Sjkim *     (a signed-digit encoding independently discovered by various researchers
238384Sjkim *     in the 1990s), and left-to-right sliding windows yield a left-to-right
238384Sjkim *     equivalent of the wNAF (independently discovered by various researchers
238384Sjkim *     around 2004).
238384Sjkim *
238384Sjkim * To prevent leaking information through side channels in point multiplication,
238384Sjkim * we need to recode the given integer into a regular pattern: sliding windows
238384Sjkim * as in wNAFs won't do, we need their fixed-window equivalent -- which is a few
238384Sjkim * decades older: we'll be using the so-called "modified Booth encoding" due to
238384Sjkim * MacSorley ("High-speed arithmetic in binary computers", Proc. IRE, vol. 49
238384Sjkim * (1961), pp. 67-91), in a radix-2^5 setting.  That is, we always combine five
238384Sjkim * signed bits into a signed digit:
238384Sjkim *
 *       s_(5j + 4) s_(5j + 3) s_(5j + 2) s_(5j + 1) s_(5j)
 *
 * The sign-alternating property implies that the resulting digit values are
 * integers from -16 to 16.
 *
 * Of course, we don't actually need to compute the signed digits s_i as an
 * intermediate step (that's just a nice way to see how this scheme relates
 * to the wNAF): a direct computation obtains the recoded digit from the
 * six bits b_(5j + 4) ... b_(5j - 1).
238384Sjkim *
 * This function takes those six bits as an integer (0 .. 63), writing the
 * recoded digit to *sign (0 for positive, 1 for negative) and *digit (absolute
 * value, in the range 0 .. 16).  Note that this integer essentially provides
 * the input bits "shifted to the left" by one position: for example, the input
 * to compute the least significant recoded digit, given that there's no bit
 * b_-1, has to be b_4 b_3 b_2 b_1 b_0 0.
238384Sjkim *
238384Sjkim */
void ec_GFp_nistp_recode_scalar_bits(unsigned char *sign,
                                     unsigned char *digit, unsigned char in)
{
    /*
     * Everything below is plain arithmetic and masking; no branch is taken
     * on the value of 'in'.
     */

    /* For a 6-bit 'in': 0xff if its top bit (bit 5) is set, 0x00 otherwise */
    const unsigned char neg_mask =
        (unsigned char)(0u - (unsigned int)(in >> 5));
    /* 63 - in, i.e. the 6-bit one's complement of 'in' */
    const unsigned char mirrored = (unsigned char)(0x3f - in);
    unsigned char magnitude;

    /* Take bits from 'mirrored' where neg_mask is set, from 'in' elsewhere */
    magnitude = (unsigned char)(in ^ ((in ^ mirrored) & neg_mask));
    /* Drop the adjacent less significant bit, rounding up: ceil(m / 2) */
    magnitude = (unsigned char)((magnitude + 1) >> 1);

    *sign = neg_mask & 1;
    *digit = magnitude;
}
238384Sjkim#else
/*
 * Placeholder compiled only when OPENSSL_NO_EC_NISTP_64_GCC_128 is defined,
 * i.e. when everything above is preprocessed away: a single file-local
 * pointer initialised with its own address.
 * NOTE(review): presumably present only so that this translation unit is
 * not empty and the variable is not reported as unused -- confirm.
 */
280304Sjkimstatic void *dummy = &dummy;
238384Sjkim#endif