Blame crypto/bn/bn_mul.c

Packit c4476c
/*
Packit c4476c
 * Copyright 1995-2018 The OpenSSL Project Authors. All Rights Reserved.
Packit c4476c
 *
Packit c4476c
 * Licensed under the OpenSSL license (the "License").  You may not use
Packit c4476c
 * this file except in compliance with the License.  You can obtain a copy
Packit c4476c
 * in the file LICENSE in the source distribution or at
Packit c4476c
 * https://www.openssl.org/source/license.html
Packit c4476c
 */
Packit c4476c
Packit c4476c
#include <assert.h>
Packit c4476c
#include "internal/cryptlib.h"
Packit c4476c
#include "bn_local.h"
Packit c4476c
Packit c4476c
#if defined(OPENSSL_NO_ASM) || !defined(OPENSSL_BN_ASM_PART_WORDS)
Packit c4476c
/*
 * Here follow specialised variants of bn_add_words() and bn_sub_words().
 * They have the property of performing operations on arrays of different
 * sizes. The sizes of those arrays are expressed through cl, which is the
 * common length ( basically, min(len(a),len(b)) ), and dl, which is the
 * delta between the two lengths, calculated as len(a)-len(b). All lengths
 * are the number of BN_ULONGs...  For the operations that require a result
 * array as parameter, it must have the length cl+abs(dl). These functions
 * should probably end up in bn_asm.c as soon as there are assembler
 * counterparts for the systems that use assembler files.
 */
Packit c4476c
Packit c4476c
/*
 * Subtract b from a, word by word, where the two operands may differ in
 * length, and return the final borrow (0 or 1).
 *
 * cl is the number of words both operands have in common and dl is
 * len(a) - len(b).  r receives cl + abs(dl) words.
 *
 *  - The first cl words are handled by bn_sub_words().
 *  - dl < 0: b has -dl extra words; each result word is 0 - b[i] - borrow.
 *  - dl > 0: a has dl extra words; the borrow is propagated through them
 *    and, once it is gone, the remaining words are copied unchanged.
 *
 * The earlier hand-unrolled version carried a "switch (save_dl - dl)" block
 * that could never execute (after its borrow loop either dl <= 0 or
 * save_dl == dl), so it has been removed; the results are unchanged.
 */
BN_ULONG bn_sub_part_words(BN_ULONG *r,
                           const BN_ULONG *a, const BN_ULONG *b,
                           int cl, int dl)
{
    BN_ULONG c, t;

    assert(cl >= 0);
    c = bn_sub_words(r, a, b, cl);

    if (dl == 0)
        return c;

    r += cl;
    a += cl;
    b += cl;

    if (dl < 0) {
        /* b is the longer operand: subtract its tail from zero */
        for (; dl < 0; dl++) {
            t = *b++;
            *r++ = (0 - t - c) & BN_MASK2;
            /* any non-zero word forces a borrow; a zero word keeps c as is */
            if (t != 0)
                c = 1;
        }
    } else {
        /* a is the longer operand: ripple the pending borrow upwards */
        for (; dl > 0 && c != 0; dl--) {
            t = *a++;
            *r++ = (t - c) & BN_MASK2;
            /* a non-zero word absorbs the borrow */
            if (t != 0)
                c = 0;
        }
        /*
         * No borrow left (or no words left): the rest of a passes through.
         * A plain loop is used rather than memcpy() so that r == a remains
         * harmless.
         */
        for (; dl > 0; dl--)
            *r++ = *a++;
    }
    return c;
}
Packit c4476c
#endif
Packit c4476c
Packit c4476c
#ifdef BN_RECURSION
Packit c4476c
/*
Packit c4476c
 * Karatsuba recursive multiplication algorithm (cf. Knuth, The Art of
Packit c4476c
 * Computer Programming, Vol. 2)
Packit c4476c
 */
Packit c4476c
Packit c4476c
/*-
Packit c4476c
 * r is 2*n2 words in size,
Packit c4476c
 * a and b are both n2 words in size.
Packit c4476c
 * n2 must be a power of 2.
Packit c4476c
 * We multiply and return the result.
Packit c4476c
 * t must be 2*n2 words in size
Packit c4476c
 * We calculate
Packit c4476c
 * a[0]*b[0]
Packit c4476c
 * a[0]*b[0]+a[1]*b[1]+(a[0]-a[1])*(b[1]-b[0])
Packit c4476c
 * a[1]*b[1]
Packit c4476c
 */
Packit c4476c
/* dnX may not be positive, but n2/2+dnX has to be */
Packit c4476c
void bn_mul_recursive(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b, int n2,
Packit c4476c
                      int dna, int dnb, BN_ULONG *t)
Packit c4476c
{
Packit c4476c
    int n = n2 / 2, c1, c2;
Packit c4476c
    int tna = n + dna, tnb = n + dnb;
Packit c4476c
    unsigned int neg, zero;
Packit c4476c
    BN_ULONG ln, lo, *p;
Packit c4476c
Packit c4476c
# ifdef BN_MUL_COMBA
Packit c4476c
#  if 0
Packit c4476c
    if (n2 == 4) {
Packit c4476c
        bn_mul_comba4(r, a, b);
Packit c4476c
        return;
Packit c4476c
    }
Packit c4476c
#  endif
Packit c4476c
    /*
Packit c4476c
     * Only call bn_mul_comba 8 if n2 == 8 and the two arrays are complete
Packit c4476c
     * [steve]
Packit c4476c
     */
Packit c4476c
    if (n2 == 8 && dna == 0 && dnb == 0) {
Packit c4476c
        bn_mul_comba8(r, a, b);
Packit c4476c
        return;
Packit c4476c
    }
Packit c4476c
# endif                         /* BN_MUL_COMBA */
Packit c4476c
    /* Else do normal multiply */
Packit c4476c
    if (n2 < BN_MUL_RECURSIVE_SIZE_NORMAL) {
Packit c4476c
        bn_mul_normal(r, a, n2 + dna, b, n2 + dnb);
Packit c4476c
        if ((dna + dnb) < 0)
Packit c4476c
            memset(&r[2 * n2 + dna + dnb], 0,
Packit c4476c
                   sizeof(BN_ULONG) * -(dna + dnb));
Packit c4476c
        return;
Packit c4476c
    }
Packit c4476c
    /* r=(a[0]-a[1])*(b[1]-b[0]) */
Packit c4476c
    c1 = bn_cmp_part_words(a, &(a[n]), tna, n - tna);
Packit c4476c
    c2 = bn_cmp_part_words(&(b[n]), b, tnb, tnb - n);
Packit c4476c
    zero = neg = 0;
Packit c4476c
    switch (c1 * 3 + c2) {
Packit c4476c
    case -4:
Packit c4476c
        bn_sub_part_words(t, &(a[n]), a, tna, tna - n); /* - */
Packit c4476c
        bn_sub_part_words(&(t[n]), b, &(b[n]), tnb, n - tnb); /* - */
Packit c4476c
        break;
Packit c4476c
    case -3:
Packit c4476c
        zero = 1;
Packit c4476c
        break;
Packit c4476c
    case -2:
Packit c4476c
        bn_sub_part_words(t, &(a[n]), a, tna, tna - n); /* - */
Packit c4476c
        bn_sub_part_words(&(t[n]), &(b[n]), b, tnb, tnb - n); /* + */
Packit c4476c
        neg = 1;
Packit c4476c
        break;
Packit c4476c
    case -1:
Packit c4476c
    case 0:
Packit c4476c
    case 1:
Packit c4476c
        zero = 1;
Packit c4476c
        break;
Packit c4476c
    case 2:
Packit c4476c
        bn_sub_part_words(t, a, &(a[n]), tna, n - tna); /* + */
Packit c4476c
        bn_sub_part_words(&(t[n]), b, &(b[n]), tnb, n - tnb); /* - */
Packit c4476c
        neg = 1;
Packit c4476c
        break;
Packit c4476c
    case 3:
Packit c4476c
        zero = 1;
Packit c4476c
        break;
Packit c4476c
    case 4:
Packit c4476c
        bn_sub_part_words(t, a, &(a[n]), tna, n - tna);
Packit c4476c
        bn_sub_part_words(&(t[n]), &(b[n]), b, tnb, tnb - n);
Packit c4476c
        break;
Packit c4476c
    }
Packit c4476c
Packit c4476c
# ifdef BN_MUL_COMBA
Packit c4476c
    if (n == 4 && dna == 0 && dnb == 0) { /* XXX: bn_mul_comba4 could take
Packit c4476c
                                           * extra args to do this well */
Packit c4476c
        if (!zero)
Packit c4476c
            bn_mul_comba4(&(t[n2]), t, &(t[n]));
Packit c4476c
        else
Packit c4476c
            memset(&t[n2], 0, sizeof(*t) * 8);
Packit c4476c
Packit c4476c
        bn_mul_comba4(r, a, b);
Packit c4476c
        bn_mul_comba4(&(r[n2]), &(a[n]), &(b[n]));
Packit c4476c
    } else if (n == 8 && dna == 0 && dnb == 0) { /* XXX: bn_mul_comba8 could
Packit c4476c
                                                  * take extra args to do
Packit c4476c
                                                  * this well */
Packit c4476c
        if (!zero)
Packit c4476c
            bn_mul_comba8(&(t[n2]), t, &(t[n]));
Packit c4476c
        else
Packit c4476c
            memset(&t[n2], 0, sizeof(*t) * 16);
Packit c4476c
Packit c4476c
        bn_mul_comba8(r, a, b);
Packit c4476c
        bn_mul_comba8(&(r[n2]), &(a[n]), &(b[n]));
Packit c4476c
    } else
Packit c4476c
# endif                         /* BN_MUL_COMBA */
Packit c4476c
    {
Packit c4476c
        p = &(t[n2 * 2]);
Packit c4476c
        if (!zero)
Packit c4476c
            bn_mul_recursive(&(t[n2]), t, &(t[n]), n, 0, 0, p);
Packit c4476c
        else
Packit c4476c
            memset(&t[n2], 0, sizeof(*t) * n2);
Packit c4476c
        bn_mul_recursive(r, a, b, n, 0, 0, p);
Packit c4476c
        bn_mul_recursive(&(r[n2]), &(a[n]), &(b[n]), n, dna, dnb, p);
Packit c4476c
    }
Packit c4476c
Packit c4476c
    /*-
Packit c4476c
     * t[32] holds (a[0]-a[1])*(b[1]-b[0]), c1 is the sign
Packit c4476c
     * r[10] holds (a[0]*b[0])
Packit c4476c
     * r[32] holds (b[1]*b[1])
Packit c4476c
     */
Packit c4476c
Packit c4476c
    c1 = (int)(bn_add_words(t, r, &(r[n2]), n2));
Packit c4476c
Packit c4476c
    if (neg) {                  /* if t[32] is negative */
Packit c4476c
        c1 -= (int)(bn_sub_words(&(t[n2]), t, &(t[n2]), n2));
Packit c4476c
    } else {
Packit c4476c
        /* Might have a carry */
Packit c4476c
        c1 += (int)(bn_add_words(&(t[n2]), &(t[n2]), t, n2));
Packit c4476c
    }
Packit c4476c
Packit c4476c
    /*-
Packit c4476c
     * t[32] holds (a[0]-a[1])*(b[1]-b[0])+(a[0]*b[0])+(a[1]*b[1])
Packit c4476c
     * r[10] holds (a[0]*b[0])
Packit c4476c
     * r[32] holds (b[1]*b[1])
Packit c4476c
     * c1 holds the carry bits
Packit c4476c
     */
Packit c4476c
    c1 += (int)(bn_add_words(&(r[n]), &(r[n]), &(t[n2]), n2));
Packit c4476c
    if (c1) {
Packit c4476c
        p = &(r[n + n2]);
Packit c4476c
        lo = *p;
Packit c4476c
        ln = (lo + c1) & BN_MASK2;
Packit c4476c
        *p = ln;
Packit c4476c
Packit c4476c
        /*
Packit c4476c
         * The overflow will stop before we over write words we should not
Packit c4476c
         * overwrite
Packit c4476c
         */
Packit c4476c
        if (ln < (BN_ULONG)c1) {
Packit c4476c
            do {
Packit c4476c
                p++;
Packit c4476c
                lo = *p;
Packit c4476c
                ln = (lo + 1) & BN_MASK2;
Packit c4476c
                *p = ln;
Packit c4476c
            } while (ln == 0);
Packit c4476c
        }
Packit c4476c
    }
Packit c4476c
}
Packit c4476c
Packit c4476c
/*
Packit c4476c
 * n+tn is the word length t needs to be n*4 is size, as does r
Packit c4476c
 */
Packit c4476c
/* tnX may not be negative but less than n */
Packit c4476c
void bn_mul_part_recursive(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b, int n,
Packit c4476c
                           int tna, int tnb, BN_ULONG *t)
Packit c4476c
{
Packit c4476c
    int i, j, n2 = n * 2;
Packit c4476c
    int c1, c2, neg;
Packit c4476c
    BN_ULONG ln, lo, *p;
Packit c4476c
Packit c4476c
    if (n < 8) {
Packit c4476c
        bn_mul_normal(r, a, n + tna, b, n + tnb);
Packit c4476c
        return;
Packit c4476c
    }
Packit c4476c
Packit c4476c
    /* r=(a[0]-a[1])*(b[1]-b[0]) */
Packit c4476c
    c1 = bn_cmp_part_words(a, &(a[n]), tna, n - tna);
Packit c4476c
    c2 = bn_cmp_part_words(&(b[n]), b, tnb, tnb - n);
Packit c4476c
    neg = 0;
Packit c4476c
    switch (c1 * 3 + c2) {
Packit c4476c
    case -4:
Packit c4476c
        bn_sub_part_words(t, &(a[n]), a, tna, tna - n); /* - */
Packit c4476c
        bn_sub_part_words(&(t[n]), b, &(b[n]), tnb, n - tnb); /* - */
Packit c4476c
        break;
Packit c4476c
    case -3:
Packit c4476c
    case -2:
Packit c4476c
        bn_sub_part_words(t, &(a[n]), a, tna, tna - n); /* - */
Packit c4476c
        bn_sub_part_words(&(t[n]), &(b[n]), b, tnb, tnb - n); /* + */
Packit c4476c
        neg = 1;
Packit c4476c
        break;
Packit c4476c
    case -1:
Packit c4476c
    case 0:
Packit c4476c
    case 1:
Packit c4476c
    case 2:
Packit c4476c
        bn_sub_part_words(t, a, &(a[n]), tna, n - tna); /* + */
Packit c4476c
        bn_sub_part_words(&(t[n]), b, &(b[n]), tnb, n - tnb); /* - */
Packit c4476c
        neg = 1;
Packit c4476c
        break;
Packit c4476c
    case 3:
Packit c4476c
    case 4:
Packit c4476c
        bn_sub_part_words(t, a, &(a[n]), tna, n - tna);
Packit c4476c
        bn_sub_part_words(&(t[n]), &(b[n]), b, tnb, tnb - n);
Packit c4476c
        break;
Packit c4476c
    }
Packit c4476c
    /*
Packit c4476c
     * The zero case isn't yet implemented here. The speedup would probably
Packit c4476c
     * be negligible.
Packit c4476c
     */
Packit c4476c
# if 0
Packit c4476c
    if (n == 4) {
Packit c4476c
        bn_mul_comba4(&(t[n2]), t, &(t[n]));
Packit c4476c
        bn_mul_comba4(r, a, b);
Packit c4476c
        bn_mul_normal(&(r[n2]), &(a[n]), tn, &(b[n]), tn);
Packit c4476c
        memset(&r[n2 + tn * 2], 0, sizeof(*r) * (n2 - tn * 2));
Packit c4476c
    } else
Packit c4476c
# endif
Packit c4476c
    if (n == 8) {
Packit c4476c
        bn_mul_comba8(&(t[n2]), t, &(t[n]));
Packit c4476c
        bn_mul_comba8(r, a, b);
Packit c4476c
        bn_mul_normal(&(r[n2]), &(a[n]), tna, &(b[n]), tnb);
Packit c4476c
        memset(&r[n2 + tna + tnb], 0, sizeof(*r) * (n2 - tna - tnb));
Packit c4476c
    } else {
Packit c4476c
        p = &(t[n2 * 2]);
Packit c4476c
        bn_mul_recursive(&(t[n2]), t, &(t[n]), n, 0, 0, p);
Packit c4476c
        bn_mul_recursive(r, a, b, n, 0, 0, p);
Packit c4476c
        i = n / 2;
Packit c4476c
        /*
Packit c4476c
         * If there is only a bottom half to the number, just do it
Packit c4476c
         */
Packit c4476c
        if (tna > tnb)
Packit c4476c
            j = tna - i;
Packit c4476c
        else
Packit c4476c
            j = tnb - i;
Packit c4476c
        if (j == 0) {
Packit c4476c
            bn_mul_recursive(&(r[n2]), &(a[n]), &(b[n]),
Packit c4476c
                             i, tna - i, tnb - i, p);
Packit c4476c
            memset(&r[n2 + i * 2], 0, sizeof(*r) * (n2 - i * 2));
Packit c4476c
        } else if (j > 0) {     /* eg, n == 16, i == 8 and tn == 11 */
Packit c4476c
            bn_mul_part_recursive(&(r[n2]), &(a[n]), &(b[n]),
Packit c4476c
                                  i, tna - i, tnb - i, p);
Packit c4476c
            memset(&(r[n2 + tna + tnb]), 0,
Packit c4476c
                   sizeof(BN_ULONG) * (n2 - tna - tnb));
Packit c4476c
        } else {                /* (j < 0) eg, n == 16, i == 8 and tn == 5 */
Packit c4476c
Packit c4476c
            memset(&r[n2], 0, sizeof(*r) * n2);
Packit c4476c
            if (tna < BN_MUL_RECURSIVE_SIZE_NORMAL
Packit c4476c
                && tnb < BN_MUL_RECURSIVE_SIZE_NORMAL) {
Packit c4476c
                bn_mul_normal(&(r[n2]), &(a[n]), tna, &(b[n]), tnb);
Packit c4476c
            } else {
Packit c4476c
                for (;;) {
Packit c4476c
                    i /= 2;
Packit c4476c
                    /*
Packit c4476c
                     * these simplified conditions work exclusively because
Packit c4476c
                     * difference between tna and tnb is 1 or 0
Packit c4476c
                     */
Packit c4476c
                    if (i < tna || i < tnb) {
Packit c4476c
                        bn_mul_part_recursive(&(r[n2]),
Packit c4476c
                                              &(a[n]), &(b[n]),
Packit c4476c
                                              i, tna - i, tnb - i, p);
Packit c4476c
                        break;
Packit c4476c
                    } else if (i == tna || i == tnb) {
Packit c4476c
                        bn_mul_recursive(&(r[n2]),
Packit c4476c
                                         &(a[n]), &(b[n]),
Packit c4476c
                                         i, tna - i, tnb - i, p);
Packit c4476c
                        break;
Packit c4476c
                    }
Packit c4476c
                }
Packit c4476c
            }
Packit c4476c
        }
Packit c4476c
    }
Packit c4476c
Packit c4476c
    /*-
Packit c4476c
     * t[32] holds (a[0]-a[1])*(b[1]-b[0]), c1 is the sign
Packit c4476c
     * r[10] holds (a[0]*b[0])
Packit c4476c
     * r[32] holds (b[1]*b[1])
Packit c4476c
     */
Packit c4476c
Packit c4476c
    c1 = (int)(bn_add_words(t, r, &(r[n2]), n2));
Packit c4476c
Packit c4476c
    if (neg) {                  /* if t[32] is negative */
Packit c4476c
        c1 -= (int)(bn_sub_words(&(t[n2]), t, &(t[n2]), n2));
Packit c4476c
    } else {
Packit c4476c
        /* Might have a carry */
Packit c4476c
        c1 += (int)(bn_add_words(&(t[n2]), &(t[n2]), t, n2));
Packit c4476c
    }
Packit c4476c
Packit c4476c
    /*-
Packit c4476c
     * t[32] holds (a[0]-a[1])*(b[1]-b[0])+(a[0]*b[0])+(a[1]*b[1])
Packit c4476c
     * r[10] holds (a[0]*b[0])
Packit c4476c
     * r[32] holds (b[1]*b[1])
Packit c4476c
     * c1 holds the carry bits
Packit c4476c
     */
Packit c4476c
    c1 += (int)(bn_add_words(&(r[n]), &(r[n]), &(t[n2]), n2));
Packit c4476c
    if (c1) {
Packit c4476c
        p = &(r[n + n2]);
Packit c4476c
        lo = *p;
Packit c4476c
        ln = (lo + c1) & BN_MASK2;
Packit c4476c
        *p = ln;
Packit c4476c
Packit c4476c
        /*
Packit c4476c
         * The overflow will stop before we over write words we should not
Packit c4476c
         * overwrite
Packit c4476c
         */
Packit c4476c
        if (ln < (BN_ULONG)c1) {
Packit c4476c
            do {
Packit c4476c
                p++;
Packit c4476c
                lo = *p;
Packit c4476c
                ln = (lo + 1) & BN_MASK2;
Packit c4476c
                *p = ln;
Packit c4476c
            } while (ln == 0);
Packit c4476c
        }
Packit c4476c
    }
Packit c4476c
}
Packit c4476c
Packit c4476c
/*-
 * Recursive helper for the low part of a product.
 *
 * a and b must be the same size, which is n2 words.
 * The original contract: r needs to be n2 words and t needs to be n2*2.
 *
 * The full product of the two low halves goes into r; the two cross
 * products (low half of a with high half of b, and vice versa) are then
 * computed into t and added into the upper half of r.
 */
void bn_mul_low_recursive(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b, int n2,
                          BN_ULONG *t)
{
    int n = n2 / 2;
    BN_ULONG *a_hi = a + n;
    BN_ULONG *b_hi = b + n;
    BN_ULONG *r_hi = r + n;

    bn_mul_recursive(r, a, b, n, 0, 0, t);

    if (n >= BN_MUL_LOW_RECURSIVE_SIZE_NORMAL) {
        /* large halves: recurse, reusing t[0..] for each cross product */
        bn_mul_low_recursive(t, a, b_hi, n, t + n2);
        bn_add_words(r_hi, r_hi, t, n);
        bn_mul_low_recursive(t, a_hi, b, n, t + n2);
        bn_add_words(r_hi, r_hi, t, n);
    } else {
        /* small halves: both cross products side by side in t */
        bn_mul_low_normal(t, a, b_hi, n);
        bn_mul_low_normal(t + n, a_hi, b, n);
        bn_add_words(r_hi, r_hi, t, n);
        bn_add_words(r_hi, r_hi, t + n, n);
    }
}
Packit c4476c
#endif                          /* BN_RECURSION */
Packit c4476c
Packit c4476c
/*
 * Multiply a by b and store the product in r.
 *
 * The work is done by bn_mul_fixed_top(); afterwards bn_correct_top() and
 * bn_check_top() are run on r, whether or not the multiplication
 * succeeded.  The return value is whatever bn_mul_fixed_top() returned
 * (1 on success, 0 on failure).
 */
int BN_mul(BIGNUM *r, const BIGNUM *a, const BIGNUM *b, BN_CTX *ctx)
{
    int ok;

    ok = bn_mul_fixed_top(r, a, b, ctx);
    bn_correct_top(r);
    bn_check_top(r);
    return ok;
}
Packit c4476c
Packit c4476c
/*
 * Multiply a by b into r, leaving the result with top == a->top + b->top
 * and BN_FLG_FIXED_TOP set on the BIGNUM the product was computed in.
 *
 * Returns 1 on success and 0 on failure (a BN_CTX_get(), bn_wexpand() or
 * BN_copy() call returned NULL).
 *
 * If either operand has top == 0, r is set to zero and 1 is returned
 * before ctx is touched.  If r is the same object as a or b, the product
 * is built in a temporary taken from ctx and copied into r at the end.
 *
 * Depending on the build configuration and operand sizes one of three
 * routes is taken: bn_mul_comba8() for two 8-word operands, the Karatsuba
 * routines when both operands are at least BN_MULL_SIZE_NORMAL words and
 * their lengths differ by at most one word, and bn_mul_normal() otherwise.
 */
int bn_mul_fixed_top(BIGNUM *r, const BIGNUM *a, const BIGNUM *b, BN_CTX *ctx)
{
    int ret = 0;
    int al, bl, top;
    BIGNUM *out;
#if defined(BN_MUL_COMBA) || defined(BN_RECURSION)
    int diff;
#endif
#ifdef BN_RECURSION
    BIGNUM *tmp = NULL;
    int pow2, dbl;
#endif

    bn_check_top(a);
    bn_check_top(b);
    bn_check_top(r);

    al = a->top;
    bl = b->top;

    if (al == 0 || bl == 0) {
        BN_zero(r);
        return 1;
    }
    top = al + bl;

    BN_CTX_start(ctx);
    if (r == a || r == b) {
        /* the output aliases an input: compute into a temporary */
        out = BN_CTX_get(ctx);
        if (out == NULL)
            goto err;
    } else {
        out = r;
    }

#if defined(BN_MUL_COMBA) || defined(BN_RECURSION)
    diff = al - bl;
#endif
#ifdef BN_MUL_COMBA
    if (diff == 0 && al == 8) {
        if (bn_wexpand(out, 16) == NULL)
            goto err;
        out->top = 16;
        bn_mul_comba8(out->d, a->d, b->d);
        goto end;
    }
#endif                          /* BN_MUL_COMBA */
#ifdef BN_RECURSION
    if (al >= BN_MULL_SIZE_NORMAL && bl >= BN_MULL_SIZE_NORMAL
        && diff >= -1 && diff <= 1) {
        /*
         * Find out the power of two lower or equal to the longest of the
         * two numbers
         */
        pow2 = BN_num_bits_word((BN_ULONG)(diff >= 0 ? al : bl));
        pow2 = 1 << (pow2 - 1);
        assert(pow2 <= al || pow2 <= bl);
        dbl = pow2 + pow2;

        tmp = BN_CTX_get(ctx);
        if (tmp == NULL)
            goto err;

        if (al > pow2 || bl > pow2) {
            if (bn_wexpand(tmp, dbl * 4) == NULL)
                goto err;
            if (bn_wexpand(out, dbl * 4) == NULL)
                goto err;
            bn_mul_part_recursive(out->d, a->d, b->d,
                                  pow2, al - pow2, bl - pow2, tmp->d);
        } else {
            /* al <= pow2 && bl <= pow2 */
            if (bn_wexpand(tmp, dbl * 2) == NULL)
                goto err;
            if (bn_wexpand(out, dbl * 2) == NULL)
                goto err;
            bn_mul_recursive(out->d, a->d, b->d,
                             pow2, al - pow2, bl - pow2, tmp->d);
        }
        out->top = top;
        goto end;
    }
#endif                          /* BN_RECURSION */

    /* Fallback: plain schoolbook multiplication */
    if (bn_wexpand(out, top) == NULL)
        goto err;
    out->top = top;
    bn_mul_normal(out->d, a->d, al, b->d, bl);

#if defined(BN_MUL_COMBA) || defined(BN_RECURSION)
 end:
#endif
    out->neg = a->neg ^ b->neg;
    out->flags |= BN_FLG_FIXED_TOP;
    if (r != out && BN_copy(r, out) == NULL)
        goto err;

    ret = 1;
 err:
    bn_check_top(r);
    BN_CTX_end(ctx);
    return ret;
}
Packit c4476c
Packit c4476c
/*
 * Schoolbook multiplication of a (na words) by b (nb words) into r.
 *
 * The operands are swapped if necessary so that a is the longer one.
 * Each word b[k] is then multiplied with all of a and accumulated into r
 * at offset k; the word returned by each multiply call is stored at
 * r[na + k].  r is therefore written up to index na + nb - 1.
 *
 * If the shorter operand has no words (nb <= 0), a is multiplied by the
 * single word 0 into r and nothing else is written.
 */
void bn_mul_normal(BN_ULONG *r, BN_ULONG *a, int na, BN_ULONG *b, int nb)
{
    BN_ULONG *carry_out;
    int k;

    if (na < nb) {
        BN_ULONG *swap_ptr = a;
        int swap_len = na;

        a = b;
        na = nb;
        b = swap_ptr;
        nb = swap_len;
    }

    if (nb <= 0) {
        (void)bn_mul_words(r, a, na, 0);
        return;
    }

    carry_out = r + na;

    /* first row initialises r, the remaining rows accumulate into it */
    carry_out[0] = bn_mul_words(r, a, na, b[0]);
    for (k = 1; k < nb; k++)
        carry_out[k] = bn_mul_add_words(r + k, a, na, b[k]);
}
Packit c4476c
Packit c4476c
/*
 * Schoolbook multiplication that only touches the low n words of r.
 *
 * The first row multiplies all n words of a by b[0] into r.  Row k
 * (k = 1 .. n-1) accumulates the first n-k words of a times b[k] into r
 * starting at r[k], so no row writes at or beyond r[n].  The words
 * returned by the multiply calls are discarded.
 */
void bn_mul_low_normal(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b, int n)
{
    int k;

    bn_mul_words(r, a, n, b[0]);

    for (k = 1; k < n; k++)
        bn_mul_add_words(r + k, a, n - k, b[k]);
}