common/mpi/mpi.c

*5697Smcpowers/*
*5697Smcpowers *  mpi.c
*5697Smcpowers *
*5697Smcpowers *  Arbitrary precision integer arithmetic library
*5697Smcpowers *
*5697Smcpowers * ***** BEGIN LICENSE BLOCK *****
*5697Smcpowers * Version: MPL 1.1/GPL 2.0/LGPL 2.1
*5697Smcpowers *
*5697Smcpowers * The contents of this file are subject to the Mozilla Public License Version
*5697Smcpowers * 1.1 (the "License"); you may not use this file except in compliance with
*5697Smcpowers * the License. You may obtain a copy of the License at
*5697Smcpowers * http://www.mozilla.org/MPL/
*5697Smcpowers *
*5697Smcpowers * Software distributed under the License is distributed on an "AS IS" basis,
*5697Smcpowers * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
*5697Smcpowers * for the specific language governing rights and limitations under the
*5697Smcpowers * License.
*5697Smcpowers *
*5697Smcpowers * The Original Code is the MPI Arbitrary Precision Integer Arithmetic library.
*5697Smcpowers *
*5697Smcpowers * The Initial Developer of the Original Code is
*5697Smcpowers * Michael J. Fromberger.
*5697Smcpowers * Portions created by the Initial Developer are Copyright (C) 1998
*5697Smcpowers * the Initial Developer. All Rights Reserved.
*5697Smcpowers *
*5697Smcpowers * Contributor(s):
*5697Smcpowers *   Netscape Communications Corporation
*5697Smcpowers *   Douglas Stebila <douglas@stebila.ca> of Sun Laboratories.
*5697Smcpowers *
*5697Smcpowers * Alternatively, the contents of this file may be used under the terms of
*5697Smcpowers * either the GNU General Public License Version 2 or later (the "GPL"), or
*5697Smcpowers * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
*5697Smcpowers * in which case the provisions of the GPL or the LGPL are applicable instead
*5697Smcpowers * of those above. If you wish to allow use of your version of this file only
*5697Smcpowers * under the terms of either the GPL or the LGPL, and not to allow others to
*5697Smcpowers * use your version of this file under the terms of the MPL, indicate your
*5697Smcpowers * decision by deleting the provisions above and replace them with the notice
*5697Smcpowers * and other provisions required by the GPL or the LGPL. If you do not delete
*5697Smcpowers * the provisions above, a recipient may use your version of this file under
*5697Smcpowers * the terms of any one of the MPL, the GPL or the LGPL.
*5697Smcpowers *
*5697Smcpowers * ***** END LICENSE BLOCK ***** */
*5697Smcpowers/*
*5697Smcpowers * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
*5697Smcpowers * Use is subject to license terms.
*5697Smcpowers *
*5697Smcpowers * Sun elects to use this software under the MPL license.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowers#pragma ident	"%Z%%M%	%I%	%E% SMI"
*5697Smcpowers
*5697Smcpowers/* $Id: mpi.c,v 1.45 2006/09/29 20:12:21 alexei.volkov.bugs%sun.com Exp $ */
*5697Smcpowers
*5697Smcpowers#include "mpi-priv.h"
*5697Smcpowers#if defined(OSF1)
*5697Smcpowers#include <c_asm.h>
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers#if MP_LOGTAB
*5697Smcpowers/*
*5697Smcpowers  A table of the logs of 2 for various bases (the 0 and 1 entries of
*5697Smcpowers  this table are meaningless and should not be referenced).
*5697Smcpowers
*5697Smcpowers  This table is used to compute output lengths for the mp_toradix()
*5697Smcpowers  function.  Since a number n in radix r takes up about log_r(n)
*5697Smcpowers  digits, we estimate the output size by taking the least integer
*5697Smcpowers  greater than log_r(n), where:
*5697Smcpowers
*5697Smcpowers  log_r(n) = log_2(n) * log_r(2)
*5697Smcpowers
*5697Smcpowers  This table, therefore, is a table of log_r(2) for 2 <= r <= 36,
*5697Smcpowers  which are the output bases supported.
*5697Smcpowers */
*5697Smcpowers#include "logtab.h"
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers/* {{{ Constant strings */
*5697Smcpowers
/*
  Messages returned by mp_strerror().  The trailing comment on each
  entry names the result code(s) that entry describes.  Neither the
  strings nor the table of pointers is meant to be modified, so both
  are declared const.
 */
static const char * const mp_err_string[] = {
  "unknown result code",     /* say what?            */
  "boolean true",            /* MP_OKAY, MP_YES      */
  "boolean false",           /* MP_NO                */
  "out of memory",           /* MP_MEM               */
  "argument out of range",   /* MP_RANGE             */
  "invalid input parameter", /* MP_BADARG            */
  "result is undefined"      /* MP_UNDEF             */
};
*5697Smcpowers
*5697Smcpowers/* Value to digit maps for radix conversion   */
*5697Smcpowers
/*
  s_dmap_1 - value-to-character map for radix conversion: the decimal
  digits, then upper-case letters, then lower-case letters, then '+'
  and '/' (64 characters in all).
 */
static const char *s_dmap_1 =
  "0123456789"
  "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
  "abcdefghijklmnopqrstuvwxyz"
  "+/";
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
/*
  Globally visible bookkeeping counters.  mp_copy() increments
  mp_copies; mp_allocs and mp_frees are presumably maintained by the
  allocation helpers (not visible in this part of the file -- confirm).
 */
unsigned long mp_allocs,
              mp_frees,
              mp_copies;
*5697Smcpowers
*5697Smcpowers/* {{{ Default precision manipulation */
*5697Smcpowers
*5697Smcpowers/* Default precision for newly created mp_int's      */
*5697Smcpowersstatic mp_size s_mp_defprec = MP_DEFPREC;
*5697Smcpowers
*5697Smcpowersmp_size mp_get_prec(void)
*5697Smcpowers{
*5697Smcpowers  return s_mp_defprec;
*5697Smcpowers
*5697Smcpowers} /* end mp_get_prec() */
*5697Smcpowers
*5697Smcpowersvoid         mp_set_prec(mp_size prec)
*5697Smcpowers{
*5697Smcpowers  if(prec == 0)
*5697Smcpowers    s_mp_defprec = MP_DEFPREC;
*5697Smcpowers  else
*5697Smcpowers    s_mp_defprec = prec;
*5697Smcpowers
*5697Smcpowers} /* end mp_set_prec() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* {{{ mp_init(mp, kmflag) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_init(mp, kmflag)
*5697Smcpowers
*5697Smcpowers  Initialize a new zero-valued mp_int.  Returns MP_OKAY if successful,
*5697Smcpowers  MP_MEM if memory could not be allocated for the structure.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_init(mp_int *mp, int kmflag)
*5697Smcpowers{
*5697Smcpowers  return mp_init_size(mp, s_mp_defprec, kmflag);
*5697Smcpowers
*5697Smcpowers} /* end mp_init() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_init_size(mp, prec, kmflag) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_init_size(mp, prec, kmflag)
*5697Smcpowers
*5697Smcpowers  Initialize a new zero-valued mp_int with at least the given
*5697Smcpowers  precision; returns MP_OKAY if successful, or MP_MEM if memory could
*5697Smcpowers  not be allocated for the structure.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_init_size(mp_int *mp, mp_size prec, int kmflag)
*5697Smcpowers{
*5697Smcpowers  ARGCHK(mp != NULL && prec > 0, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  prec = MP_ROUNDUP(prec, s_mp_defprec);
*5697Smcpowers  if((DIGITS(mp) = s_mp_alloc(prec, sizeof(mp_digit), kmflag)) == NULL)
*5697Smcpowers    return MP_MEM;
*5697Smcpowers
*5697Smcpowers  SIGN(mp) = ZPOS;
*5697Smcpowers  USED(mp) = 1;
*5697Smcpowers  ALLOC(mp) = prec;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_init_size() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_init_copy(mp, from) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_init_copy(mp, from)
*5697Smcpowers
*5697Smcpowers  Initialize mp as an exact copy of from.  Returns MP_OKAY if
*5697Smcpowers  successful, MP_MEM if memory could not be allocated for the new
*5697Smcpowers  structure.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_init_copy(mp_int *mp, const mp_int *from)
*5697Smcpowers{
*5697Smcpowers  ARGCHK(mp != NULL && from != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(mp == from)
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers
*5697Smcpowers  if((DIGITS(mp) = s_mp_alloc(ALLOC(from), sizeof(mp_digit), FLAG(from))) == NULL)
*5697Smcpowers    return MP_MEM;
*5697Smcpowers
*5697Smcpowers  s_mp_copy(DIGITS(from), DIGITS(mp), USED(from));
*5697Smcpowers  USED(mp) = USED(from);
*5697Smcpowers  ALLOC(mp) = ALLOC(from);
*5697Smcpowers  SIGN(mp) = SIGN(from);
*5697Smcpowers  FLAG(mp) = FLAG(from);
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_init_copy() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_copy(from, to) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_copy(from, to)
*5697Smcpowers
*5697Smcpowers  Copies the mp_int 'from' to the mp_int 'to'.  It is presumed that
*5697Smcpowers  'to' has already been initialized (if not, use mp_init_copy()
*5697Smcpowers  instead). If 'from' and 'to' are identical, nothing happens.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_copy(const mp_int *from, mp_int *to)
*5697Smcpowers{
*5697Smcpowers  ARGCHK(from != NULL && to != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(from == to)
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers
*5697Smcpowers  ++mp_copies;
*5697Smcpowers  { /* copy */
*5697Smcpowers    mp_digit   *tmp;
*5697Smcpowers
*5697Smcpowers    /*
*5697Smcpowers      If the allocated buffer in 'to' already has enough space to hold
*5697Smcpowers      all the used digits of 'from', we'll re-use it to avoid hitting
*5697Smcpowers      the memory allocater more than necessary; otherwise, we'd have
*5697Smcpowers      to grow anyway, so we just allocate a hunk and make the copy as
*5697Smcpowers      usual
*5697Smcpowers     */
*5697Smcpowers    if(ALLOC(to) >= USED(from)) {
*5697Smcpowers      s_mp_setz(DIGITS(to) + USED(from), ALLOC(to) - USED(from));
*5697Smcpowers      s_mp_copy(DIGITS(from), DIGITS(to), USED(from));
*5697Smcpowers
*5697Smcpowers    } else {
*5697Smcpowers      if((tmp = s_mp_alloc(ALLOC(from), sizeof(mp_digit), FLAG(from))) == NULL)
*5697Smcpowers	return MP_MEM;
*5697Smcpowers
*5697Smcpowers      s_mp_copy(DIGITS(from), tmp, USED(from));
*5697Smcpowers
*5697Smcpowers      if(DIGITS(to) != NULL) {
*5697Smcpowers#if MP_CRYPTO
*5697Smcpowers	s_mp_setz(DIGITS(to), ALLOC(to));
*5697Smcpowers#endif
*5697Smcpowers	s_mp_free(DIGITS(to), ALLOC(to));
*5697Smcpowers      }
*5697Smcpowers
*5697Smcpowers      DIGITS(to) = tmp;
*5697Smcpowers      ALLOC(to) = ALLOC(from);
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    /* Copy the precision and sign from the original */
*5697Smcpowers    USED(to) = USED(from);
*5697Smcpowers    SIGN(to) = SIGN(from);
*5697Smcpowers  } /* end copy */
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_copy() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_exch(mp1, mp2) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_exch(mp1, mp2)
*5697Smcpowers
*5697Smcpowers  Exchange mp1 and mp2 without allocating any intermediate memory
*5697Smcpowers  (well, unless you count the stack space needed for this call and the
*5697Smcpowers  locals it creates...).  This cannot fail.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersvoid mp_exch(mp_int *mp1, mp_int *mp2)
*5697Smcpowers{
*5697Smcpowers#if MP_ARGCHK == 2
*5697Smcpowers  assert(mp1 != NULL && mp2 != NULL);
*5697Smcpowers#else
*5697Smcpowers  if(mp1 == NULL || mp2 == NULL)
*5697Smcpowers    return;
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers  s_mp_exch(mp1, mp2);
*5697Smcpowers
*5697Smcpowers} /* end mp_exch() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_clear(mp) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_clear(mp)
*5697Smcpowers
*5697Smcpowers  Release the storage used by an mp_int, and void its fields so that
*5697Smcpowers  if someone calls mp_clear() again for the same int later, we won't
*5697Smcpowers  get tollchocked.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersvoid   mp_clear(mp_int *mp)
*5697Smcpowers{
*5697Smcpowers  if(mp == NULL)
*5697Smcpowers    return;
*5697Smcpowers
*5697Smcpowers  if(DIGITS(mp) != NULL) {
*5697Smcpowers#if MP_CRYPTO
*5697Smcpowers    s_mp_setz(DIGITS(mp), ALLOC(mp));
*5697Smcpowers#endif
*5697Smcpowers    s_mp_free(DIGITS(mp), ALLOC(mp));
*5697Smcpowers    DIGITS(mp) = NULL;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  USED(mp) = 0;
*5697Smcpowers  ALLOC(mp) = 0;
*5697Smcpowers
*5697Smcpowers} /* end mp_clear() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_zero(mp) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_zero(mp)
*5697Smcpowers
*5697Smcpowers  Set mp to zero.  Does not change the allocated size of the structure,
*5697Smcpowers  and therefore cannot fail (except on a bad argument, which we ignore)
*5697Smcpowers */
*5697Smcpowersvoid   mp_zero(mp_int *mp)
*5697Smcpowers{
*5697Smcpowers  if(mp == NULL)
*5697Smcpowers    return;
*5697Smcpowers
*5697Smcpowers  s_mp_setz(DIGITS(mp), ALLOC(mp));
*5697Smcpowers  USED(mp) = 1;
*5697Smcpowers  SIGN(mp) = ZPOS;
*5697Smcpowers
*5697Smcpowers} /* end mp_zero() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_set(mp, d) */
*5697Smcpowers
*5697Smcpowersvoid   mp_set(mp_int *mp, mp_digit d)
*5697Smcpowers{
*5697Smcpowers  if(mp == NULL)
*5697Smcpowers    return;
*5697Smcpowers
*5697Smcpowers  mp_zero(mp);
*5697Smcpowers  DIGIT(mp, 0) = d;
*5697Smcpowers
*5697Smcpowers} /* end mp_set() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_set_int(mp, z) */
*5697Smcpowers
*5697Smcpowersmp_err mp_set_int(mp_int *mp, long z)
*5697Smcpowers{
*5697Smcpowers  int            ix;
*5697Smcpowers  unsigned long  v = labs(z);
*5697Smcpowers  mp_err         res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  mp_zero(mp);
*5697Smcpowers  if(z == 0)
*5697Smcpowers    return MP_OKAY;  /* shortcut for zero */
*5697Smcpowers
*5697Smcpowers  if (sizeof v <= sizeof(mp_digit)) {
*5697Smcpowers    DIGIT(mp,0) = v;
*5697Smcpowers  } else {
*5697Smcpowers    for (ix = sizeof(long) - 1; ix >= 0; ix--) {
*5697Smcpowers      if ((res = s_mp_mul_d(mp, (UCHAR_MAX + 1))) != MP_OKAY)
*5697Smcpowers	return res;
*5697Smcpowers
*5697Smcpowers      res = s_mp_add_d(mp, (mp_digit)((v >> (ix * CHAR_BIT)) & UCHAR_MAX));
*5697Smcpowers      if (res != MP_OKAY)
*5697Smcpowers	return res;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers  if(z < 0)
*5697Smcpowers    SIGN(mp) = NEG;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_set_int() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_set_ulong(mp, z) */
*5697Smcpowers
*5697Smcpowersmp_err mp_set_ulong(mp_int *mp, unsigned long z)
*5697Smcpowers{
*5697Smcpowers  int            ix;
*5697Smcpowers  mp_err         res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  mp_zero(mp);
*5697Smcpowers  if(z == 0)
*5697Smcpowers    return MP_OKAY;  /* shortcut for zero */
*5697Smcpowers
*5697Smcpowers  if (sizeof z <= sizeof(mp_digit)) {
*5697Smcpowers    DIGIT(mp,0) = z;
*5697Smcpowers  } else {
*5697Smcpowers    for (ix = sizeof(long) - 1; ix >= 0; ix--) {
*5697Smcpowers      if ((res = s_mp_mul_d(mp, (UCHAR_MAX + 1))) != MP_OKAY)
*5697Smcpowers	return res;
*5697Smcpowers
*5697Smcpowers      res = s_mp_add_d(mp, (mp_digit)((z >> (ix * CHAR_BIT)) & UCHAR_MAX));
*5697Smcpowers      if (res != MP_OKAY)
*5697Smcpowers	return res;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers} /* end mp_set_ulong() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* {{{ Digit arithmetic */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_add_d(a, d, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_add_d(a, d, b)
*5697Smcpowers
*5697Smcpowers  Compute the sum b = a + d, for a single digit d.  Respects the sign of
*5697Smcpowers  its primary addend (single digits are unsigned anyway).
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_add_d(const mp_int *a, mp_digit d, mp_int *b)
*5697Smcpowers{
*5697Smcpowers  mp_int   tmp;
*5697Smcpowers  mp_err   res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_init_copy(&tmp, a)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  if(SIGN(&tmp) == ZPOS) {
*5697Smcpowers    if((res = s_mp_add_d(&tmp, d)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers  } else if(s_mp_cmp_d(&tmp, d) >= 0) {
*5697Smcpowers    if((res = s_mp_sub_d(&tmp, d)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers  } else {
*5697Smcpowers    mp_neg(&tmp, &tmp);
*5697Smcpowers
*5697Smcpowers    DIGIT(&tmp, 0) = d - DIGIT(&tmp, 0);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if(s_mp_cmp_d(&tmp, 0) == 0)
*5697Smcpowers    SIGN(&tmp) = ZPOS;
*5697Smcpowers
*5697Smcpowers  s_mp_exch(&tmp, b);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&tmp);
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_add_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_sub_d(a, d, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_sub_d(a, d, b)
*5697Smcpowers
*5697Smcpowers  Compute the difference b = a - d, for a single digit d.  Respects the
*5697Smcpowers  sign of its subtrahend (single digits are unsigned anyway).
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_sub_d(const mp_int *a, mp_digit d, mp_int *b)
*5697Smcpowers{
*5697Smcpowers  mp_int   tmp;
*5697Smcpowers  mp_err   res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_init_copy(&tmp, a)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  if(SIGN(&tmp) == NEG) {
*5697Smcpowers    if((res = s_mp_add_d(&tmp, d)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers  } else if(s_mp_cmp_d(&tmp, d) >= 0) {
*5697Smcpowers    if((res = s_mp_sub_d(&tmp, d)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers  } else {
*5697Smcpowers    mp_neg(&tmp, &tmp);
*5697Smcpowers
*5697Smcpowers    DIGIT(&tmp, 0) = d - DIGIT(&tmp, 0);
*5697Smcpowers    SIGN(&tmp) = NEG;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if(s_mp_cmp_d(&tmp, 0) == 0)
*5697Smcpowers    SIGN(&tmp) = ZPOS;
*5697Smcpowers
*5697Smcpowers  s_mp_exch(&tmp, b);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&tmp);
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_sub_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_mul_d(a, d, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_mul_d(a, d, b)
*5697Smcpowers
*5697Smcpowers  Compute the product b = a * d, for a single digit d.  Respects the sign
*5697Smcpowers  of its multiplicand (single digits are unsigned anyway)
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_mul_d(const mp_int *a, mp_digit d, mp_int *b)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(d == 0) {
*5697Smcpowers    mp_zero(b);
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if((res = mp_copy(a, b)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  res = s_mp_mul_d(b, d);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_mul_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_mul_2(a, c) */
*5697Smcpowers
*5697Smcpowersmp_err mp_mul_2(const mp_int *a, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_copy(a, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  return s_mp_mul_2(c);
*5697Smcpowers
*5697Smcpowers} /* end mp_mul_2() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_div_d(a, d, q, r) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_div_d(a, d, q, r)
*5697Smcpowers
*5697Smcpowers  Compute the quotient q = a / d and remainder r = a mod d, for a
*5697Smcpowers  single digit d.  Respects the sign of its divisor (single digits are
*5697Smcpowers  unsigned anyway).
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_div_d(const mp_int *a, mp_digit d, mp_int *q, mp_digit *r)
*5697Smcpowers{
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_int   qp;
*5697Smcpowers  mp_digit rem;
*5697Smcpowers  int      pow;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(d == 0)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  /* Shortcut for powers of two ... */
*5697Smcpowers  if((pow = s_mp_ispow2d(d)) >= 0) {
*5697Smcpowers    mp_digit  mask;
*5697Smcpowers
*5697Smcpowers    mask = ((mp_digit)1 << pow) - 1;
*5697Smcpowers    rem = DIGIT(a, 0) & mask;
*5697Smcpowers
*5697Smcpowers    if(q) {
*5697Smcpowers      mp_copy(a, q);
*5697Smcpowers      s_mp_div_2d(q, pow);
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    if(r)
*5697Smcpowers      *r = rem;
*5697Smcpowers
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if((res = mp_init_copy(&qp, a)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  res = s_mp_div_d(&qp, d, &rem);
*5697Smcpowers
*5697Smcpowers  if(s_mp_cmp_d(&qp, 0) == 0)
*5697Smcpowers    SIGN(q) = ZPOS;
*5697Smcpowers
*5697Smcpowers  if(r)
*5697Smcpowers    *r = rem;
*5697Smcpowers
*5697Smcpowers  if(q)
*5697Smcpowers    s_mp_exch(&qp, q);
*5697Smcpowers
*5697Smcpowers  mp_clear(&qp);
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_div_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_div_2(a, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_div_2(a, c)
*5697Smcpowers
*5697Smcpowers  Compute c = a / 2, disregarding the remainder.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_div_2(const mp_int *a, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_copy(a, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  s_mp_div_2(c);
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_div_2() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
/* {{{ mp_expt_d(a, d, c) */
*5697Smcpowers
*5697Smcpowersmp_err mp_expt_d(const mp_int *a, mp_digit d, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_int   s, x;
*5697Smcpowers  mp_err   res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_init(&s, FLAG(a))) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers  if((res = mp_init_copy(&x, a)) != MP_OKAY)
*5697Smcpowers    goto X;
*5697Smcpowers
*5697Smcpowers  DIGIT(&s, 0) = 1;
*5697Smcpowers
*5697Smcpowers  while(d != 0) {
*5697Smcpowers    if(d & 1) {
*5697Smcpowers      if((res = s_mp_mul(&s, &x)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    d /= 2;
*5697Smcpowers
*5697Smcpowers    if((res = s_mp_sqr(&x)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  s_mp_exch(&s, c);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&x);
*5697SmcpowersX:
*5697Smcpowers  mp_clear(&s);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_expt_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* {{{ Full arithmetic */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_abs(a, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_abs(a, b)
*5697Smcpowers
*5697Smcpowers  Compute b = |a|.  'a' and 'b' may be identical.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_abs(const mp_int *a, mp_int *b)
*5697Smcpowers{
*5697Smcpowers  mp_err   res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_copy(a, b)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  SIGN(b) = ZPOS;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_abs() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_neg(a, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_neg(a, b)
*5697Smcpowers
*5697Smcpowers  Compute b = -a.  'a' and 'b' may be identical.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_neg(const mp_int *a, mp_int *b)
*5697Smcpowers{
*5697Smcpowers  mp_err   res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_copy(a, b)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  if(s_mp_cmp_d(b, 0) == MP_EQ)
*5697Smcpowers    SIGN(b) = ZPOS;
*5697Smcpowers  else
*5697Smcpowers    SIGN(b) = (SIGN(b) == NEG) ? ZPOS : NEG;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_neg() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_add(a, b, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_add(a, b, c)
*5697Smcpowers
*5697Smcpowers  Compute c = a + b.  All parameters may be identical.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_add(const mp_int *a, const mp_int *b, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(SIGN(a) == SIGN(b)) { /* same sign:  add values, keep sign */
*5697Smcpowers    MP_CHECKOK( s_mp_add_3arg(a, b, c) );
*5697Smcpowers  } else if(s_mp_cmp(a, b) >= 0) {  /* different sign: |a| >= |b|   */
*5697Smcpowers    MP_CHECKOK( s_mp_sub_3arg(a, b, c) );
*5697Smcpowers  } else {                          /* different sign: |a|  < |b|   */
*5697Smcpowers    MP_CHECKOK( s_mp_sub_3arg(b, a, c) );
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if (s_mp_cmp_d(c, 0) == MP_EQ)
*5697Smcpowers    SIGN(c) = ZPOS;
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_add() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_sub(a, b, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_sub(a, b, c)
*5697Smcpowers
*5697Smcpowers  Compute c = a - b.  All parameters may be identical.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_sub(const mp_int *a, const mp_int *b, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers  int     magDiff;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if (a == b) {
*5697Smcpowers    mp_zero(c);
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if (MP_SIGN(a) != MP_SIGN(b)) {
*5697Smcpowers    MP_CHECKOK( s_mp_add_3arg(a, b, c) );
*5697Smcpowers  } else if (!(magDiff = s_mp_cmp(a, b))) {
*5697Smcpowers    mp_zero(c);
*5697Smcpowers    res = MP_OKAY;
*5697Smcpowers  } else if (magDiff > 0) {
*5697Smcpowers    MP_CHECKOK( s_mp_sub_3arg(a, b, c) );
*5697Smcpowers  } else {
*5697Smcpowers    MP_CHECKOK( s_mp_sub_3arg(b, a, c) );
*5697Smcpowers    MP_SIGN(c) = !MP_SIGN(a);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if (s_mp_cmp_d(c, 0) == MP_EQ)
*5697Smcpowers    MP_SIGN(c) = MP_ZPOS;
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_sub() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_mul(a, b, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_mul(a, b, c)
*5697Smcpowers
*5697Smcpowers  Compute c = a * b.  All parameters may be identical.
*5697Smcpowers */
*5697Smcpowersmp_err   mp_mul(const mp_int *a, const mp_int *b, mp_int * c)
*5697Smcpowers{
*5697Smcpowers  mp_digit *pb;
*5697Smcpowers  mp_int   tmp;
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_size  ib;
*5697Smcpowers  mp_size  useda, usedb;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if (a == c) {
*5697Smcpowers    if ((res = mp_init_copy(&tmp, a)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers    if (a == b)
*5697Smcpowers      b = &tmp;
*5697Smcpowers    a = &tmp;
*5697Smcpowers  } else if (b == c) {
*5697Smcpowers    if ((res = mp_init_copy(&tmp, b)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers    b = &tmp;
*5697Smcpowers  } else {
*5697Smcpowers    MP_DIGITS(&tmp) = 0;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if (MP_USED(a) < MP_USED(b)) {
*5697Smcpowers    const mp_int *xch = b;	/* switch a and b, to do fewer outer loops */
*5697Smcpowers    b = a;
*5697Smcpowers    a = xch;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  MP_USED(c) = 1; MP_DIGIT(c, 0) = 0;
*5697Smcpowers  if((res = s_mp_pad(c, USED(a) + USED(b))) != MP_OKAY)
*5697Smcpowers    goto CLEANUP;
*5697Smcpowers
*5697Smcpowers#ifdef NSS_USE_COMBA
*5697Smcpowers  if ((MP_USED(a) == MP_USED(b)) && IS_POWER_OF_2(MP_USED(b))) {
*5697Smcpowers      if (MP_USED(a) == 4) {
*5697Smcpowers          s_mp_mul_comba_4(a, b, c);
*5697Smcpowers          goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers      if (MP_USED(a) == 8) {
*5697Smcpowers          s_mp_mul_comba_8(a, b, c);
*5697Smcpowers          goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers      if (MP_USED(a) == 16) {
*5697Smcpowers          s_mp_mul_comba_16(a, b, c);
*5697Smcpowers          goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers      if (MP_USED(a) == 32) {
*5697Smcpowers          s_mp_mul_comba_32(a, b, c);
*5697Smcpowers          goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers  pb = MP_DIGITS(b);
*5697Smcpowers  s_mpv_mul_d(MP_DIGITS(a), MP_USED(a), *pb++, MP_DIGITS(c));
*5697Smcpowers
*5697Smcpowers  /* Outer loop:  Digits of b */
*5697Smcpowers  useda = MP_USED(a);
*5697Smcpowers  usedb = MP_USED(b);
*5697Smcpowers  for (ib = 1; ib < usedb; ib++) {
*5697Smcpowers    mp_digit b_i    = *pb++;
*5697Smcpowers
*5697Smcpowers    /* Inner product:  Digits of a */
*5697Smcpowers    if (b_i)
*5697Smcpowers      s_mpv_mul_d_add(MP_DIGITS(a), useda, b_i, MP_DIGITS(c) + ib);
*5697Smcpowers    else
*5697Smcpowers      MP_DIGIT(c, ib + useda) = b_i;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  s_mp_clamp(c);
*5697Smcpowers
*5697Smcpowers  if(SIGN(a) == SIGN(b) || s_mp_cmp_d(c, 0) == MP_EQ)
*5697Smcpowers    SIGN(c) = ZPOS;
*5697Smcpowers  else
*5697Smcpowers    SIGN(c) = NEG;
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&tmp);
*5697Smcpowers  return res;
*5697Smcpowers} /* end mp_mul() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_sqr(a, sqr) */
*5697Smcpowers
*5697Smcpowers#if MP_SQUARE
*5697Smcpowers/*
*5697Smcpowers  Computes the square of a.  This can be done more
*5697Smcpowers  efficiently than a general multiplication, because many of the
*5697Smcpowers  computation steps are redundant when squaring.  The inner product
*5697Smcpowers  step is a bit more complicated, but we save a fair number of
*5697Smcpowers  iterations of the multiplication loop.
*5697Smcpowers */
*5697Smcpowers
/* sqr = a^2;   a and sqr may be the same mp_int (a is copied first in that case) */
*5697Smcpowersmp_err   mp_sqr(const mp_int *a, mp_int *sqr)
*5697Smcpowers{
*5697Smcpowers  mp_digit *pa;
*5697Smcpowers  mp_digit d;
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_size  ix;
*5697Smcpowers  mp_int   tmp;
*5697Smcpowers  int      count;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && sqr != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if (a == sqr) {
*5697Smcpowers    if((res = mp_init_copy(&tmp, a)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers    a = &tmp;
*5697Smcpowers  } else {
*5697Smcpowers    DIGITS(&tmp) = 0;
*5697Smcpowers    res = MP_OKAY;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  ix = 2 * MP_USED(a);
*5697Smcpowers  if (ix > MP_ALLOC(sqr)) {
*5697Smcpowers    MP_USED(sqr) = 1;
*5697Smcpowers    MP_CHECKOK( s_mp_grow(sqr, ix) );
*5697Smcpowers  }
*5697Smcpowers  MP_USED(sqr) = ix;
*5697Smcpowers  MP_DIGIT(sqr, 0) = 0;
*5697Smcpowers
*5697Smcpowers#ifdef NSS_USE_COMBA
*5697Smcpowers  if (IS_POWER_OF_2(MP_USED(a))) {
*5697Smcpowers      if (MP_USED(a) == 4) {
*5697Smcpowers          s_mp_sqr_comba_4(a, sqr);
*5697Smcpowers          goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers      if (MP_USED(a) == 8) {
*5697Smcpowers          s_mp_sqr_comba_8(a, sqr);
*5697Smcpowers          goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers      if (MP_USED(a) == 16) {
*5697Smcpowers          s_mp_sqr_comba_16(a, sqr);
*5697Smcpowers          goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers      if (MP_USED(a) == 32) {
*5697Smcpowers          s_mp_sqr_comba_32(a, sqr);
*5697Smcpowers          goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers  pa = MP_DIGITS(a);
*5697Smcpowers  count = MP_USED(a) - 1;
*5697Smcpowers  if (count > 0) {
*5697Smcpowers    d = *pa++;
*5697Smcpowers    s_mpv_mul_d(pa, count, d, MP_DIGITS(sqr) + 1);
*5697Smcpowers    for (ix = 3; --count > 0; ix += 2) {
*5697Smcpowers      d = *pa++;
*5697Smcpowers      s_mpv_mul_d_add(pa, count, d, MP_DIGITS(sqr) + ix);
*5697Smcpowers    } /* for(ix ...) */
*5697Smcpowers    MP_DIGIT(sqr, MP_USED(sqr)-1) = 0; /* above loop stopped short of this. */
*5697Smcpowers
*5697Smcpowers    /* now sqr *= 2 */
*5697Smcpowers    s_mp_mul_2(sqr);
*5697Smcpowers  } else {
*5697Smcpowers    MP_DIGIT(sqr, 1) = 0;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* now add the squares of the digits of a to sqr. */
*5697Smcpowers  s_mpv_sqr_add_prop(MP_DIGITS(a), MP_USED(a), MP_DIGITS(sqr));
*5697Smcpowers
*5697Smcpowers  SIGN(sqr) = ZPOS;
*5697Smcpowers  s_mp_clamp(sqr);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&tmp);
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_sqr() */
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_div(a, b, q, r) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_div(a, b, q, r)
*5697Smcpowers
*5697Smcpowers  Compute q = a / b and r = a mod b.  Input parameters may be re-used
*5697Smcpowers  as output parameters.  If q or r is NULL, that portion of the
*5697Smcpowers  computation will be discarded (although it will still be computed)
*5697Smcpowers */
*5697Smcpowersmp_err mp_div(const mp_int *a, const mp_int *b, mp_int *q, mp_int *r)
*5697Smcpowers{
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_int   *pQ, *pR;
*5697Smcpowers  mp_int   qtmp, rtmp, btmp;
*5697Smcpowers  int      cmp;
*5697Smcpowers  mp_sign  signA;
*5697Smcpowers  mp_sign  signB;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  signA = MP_SIGN(a);
*5697Smcpowers  signB = MP_SIGN(b);
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(b) == MP_EQ)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  DIGITS(&qtmp) = 0;
*5697Smcpowers  DIGITS(&rtmp) = 0;
*5697Smcpowers  DIGITS(&btmp) = 0;
*5697Smcpowers
*5697Smcpowers  /* Set up some temporaries... */
*5697Smcpowers  if (!r || r == a || r == b) {
*5697Smcpowers    MP_CHECKOK( mp_init_copy(&rtmp, a) );
*5697Smcpowers    pR = &rtmp;
*5697Smcpowers  } else {
*5697Smcpowers    MP_CHECKOK( mp_copy(a, r) );
*5697Smcpowers    pR = r;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if (!q || q == a || q == b) {
*5697Smcpowers    MP_CHECKOK( mp_init_size(&qtmp, MP_USED(a), FLAG(a)) );
*5697Smcpowers    pQ = &qtmp;
*5697Smcpowers  } else {
*5697Smcpowers    MP_CHECKOK( s_mp_pad(q, MP_USED(a)) );
*5697Smcpowers    pQ = q;
*5697Smcpowers    mp_zero(pQ);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /*
*5697Smcpowers    If |a| <= |b|, we can compute the solution without division;
*5697Smcpowers    otherwise, we actually do the work required.
*5697Smcpowers   */
*5697Smcpowers  if ((cmp = s_mp_cmp(a, b)) <= 0) {
*5697Smcpowers    if (cmp) {
*5697Smcpowers      /* r was set to a above. */
*5697Smcpowers      mp_zero(pQ);
*5697Smcpowers    } else {
*5697Smcpowers      mp_set(pQ, 1);
*5697Smcpowers      mp_zero(pR);
*5697Smcpowers    }
*5697Smcpowers  } else {
*5697Smcpowers    MP_CHECKOK( mp_init_copy(&btmp, b) );
*5697Smcpowers    MP_CHECKOK( s_mp_div(pR, &btmp, pQ) );
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Compute the signs for the output  */
*5697Smcpowers  MP_SIGN(pR) = signA;   /* Sr = Sa              */
*5697Smcpowers  /* Sq = ZPOS if Sa == Sb */ /* Sq = NEG if Sa != Sb */
*5697Smcpowers  MP_SIGN(pQ) = (signA == signB) ? ZPOS : NEG;
*5697Smcpowers
*5697Smcpowers  if(s_mp_cmp_d(pQ, 0) == MP_EQ)
*5697Smcpowers    SIGN(pQ) = ZPOS;
*5697Smcpowers  if(s_mp_cmp_d(pR, 0) == MP_EQ)
*5697Smcpowers    SIGN(pR) = ZPOS;
*5697Smcpowers
*5697Smcpowers  /* Copy output, if it is needed      */
*5697Smcpowers  if(q && q != pQ)
*5697Smcpowers    s_mp_exch(pQ, q);
*5697Smcpowers
*5697Smcpowers  if(r && r != pR)
*5697Smcpowers    s_mp_exch(pR, r);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&btmp);
*5697Smcpowers  mp_clear(&rtmp);
*5697Smcpowers  mp_clear(&qtmp);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_div() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_div_2d(a, d, q, r) */
*5697Smcpowers
*5697Smcpowersmp_err mp_div_2d(const mp_int *a, mp_digit d, mp_int *q, mp_int *r)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(q) {
*5697Smcpowers    if((res = mp_copy(a, q)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers  }
*5697Smcpowers  if(r) {
*5697Smcpowers    if((res = mp_copy(a, r)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers  }
*5697Smcpowers  if(q) {
*5697Smcpowers    s_mp_div_2d(q, d);
*5697Smcpowers  }
*5697Smcpowers  if(r) {
*5697Smcpowers    s_mp_mod_2d(r, d);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_div_2d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_expt(a, b, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_expt(a, b, c)
*5697Smcpowers
*5697Smcpowers  Compute c = a ** b, that is, raise a to the b power.  Uses a
*5697Smcpowers  standard iterative square-and-multiply technique.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_expt(mp_int *a, mp_int *b, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_int   s, x;
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_digit d;
*5697Smcpowers  int      dig, bit;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(b) < 0)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  if((res = mp_init(&s, FLAG(a))) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  mp_set(&s, 1);
*5697Smcpowers
*5697Smcpowers  if((res = mp_init_copy(&x, a)) != MP_OKAY)
*5697Smcpowers    goto X;
*5697Smcpowers
*5697Smcpowers  /* Loop over low-order digits in ascending order */
*5697Smcpowers  for(dig = 0; dig < (USED(b) - 1); dig++) {
*5697Smcpowers    d = DIGIT(b, dig);
*5697Smcpowers
*5697Smcpowers    /* Loop over bits of each non-maximal digit */
*5697Smcpowers    for(bit = 0; bit < DIGIT_BIT; bit++) {
*5697Smcpowers      if(d & 1) {
*5697Smcpowers	if((res = s_mp_mul(&s, &x)) != MP_OKAY)
*5697Smcpowers	  goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers
*5697Smcpowers      d >>= 1;
*5697Smcpowers
*5697Smcpowers      if((res = s_mp_sqr(&x)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Consider now the last digit... */
*5697Smcpowers  d = DIGIT(b, dig);
*5697Smcpowers
*5697Smcpowers  while(d) {
*5697Smcpowers    if(d & 1) {
*5697Smcpowers      if((res = s_mp_mul(&s, &x)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    d >>= 1;
*5697Smcpowers
*5697Smcpowers    if((res = s_mp_sqr(&x)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if(mp_iseven(b))
*5697Smcpowers    SIGN(&s) = SIGN(a);
*5697Smcpowers
*5697Smcpowers  res = mp_copy(&s, c);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&x);
*5697SmcpowersX:
*5697Smcpowers  mp_clear(&s);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_expt() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_2expt(a, k) */
*5697Smcpowers
*5697Smcpowers/* Compute a = 2^k */
*5697Smcpowers
*5697Smcpowersmp_err mp_2expt(mp_int *a, mp_digit k)
*5697Smcpowers{
*5697Smcpowers  ARGCHK(a != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  return s_mp_2expt(a, k);
*5697Smcpowers
*5697Smcpowers} /* end mp_2expt() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_mod(a, m, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_mod(a, m, c)
*5697Smcpowers
*5697Smcpowers  Compute c = a (mod m).  Result will always be 0 <= c < m.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_mod(const mp_int *a, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers  int     mag;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && m != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(SIGN(m) == NEG)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  /*
*5697Smcpowers     If |a| > m, we need to divide to get the remainder and take the
*5697Smcpowers     absolute value.
*5697Smcpowers
*5697Smcpowers     If |a| < m, we don't need to do any division, just copy and adjust
*5697Smcpowers     the sign (if a is negative).
*5697Smcpowers
*5697Smcpowers     If |a| == m, we can simply set the result to zero.
*5697Smcpowers
*5697Smcpowers     This order is intended to minimize the average path length of the
*5697Smcpowers     comparison chain on common workloads -- the most frequent cases are
*5697Smcpowers     that |a| != m, so we do those first.
*5697Smcpowers   */
*5697Smcpowers  if((mag = s_mp_cmp(a, m)) > 0) {
*5697Smcpowers    if((res = mp_div(a, m, NULL, c)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    if(SIGN(c) == NEG) {
*5697Smcpowers      if((res = mp_add(c, m, c)) != MP_OKAY)
*5697Smcpowers	return res;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers  } else if(mag < 0) {
*5697Smcpowers    if((res = mp_copy(a, c)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    if(mp_cmp_z(a) < 0) {
*5697Smcpowers      if((res = mp_add(c, m, c)) != MP_OKAY)
*5697Smcpowers	return res;
*5697Smcpowers
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers  } else {
*5697Smcpowers    mp_zero(c);
*5697Smcpowers
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_mod() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_mod_d(a, d, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_mod_d(a, d, c)
*5697Smcpowers
*5697Smcpowers  Compute c = a (mod d).  Result will always be 0 <= c < d
*5697Smcpowers */
*5697Smcpowersmp_err mp_mod_d(const mp_int *a, mp_digit d, mp_digit *c)
*5697Smcpowers{
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_digit rem;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(s_mp_cmp_d(a, d) > 0) {
*5697Smcpowers    if((res = mp_div_d(a, d, NULL, &rem)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers  } else {
*5697Smcpowers    if(SIGN(a) == NEG)
*5697Smcpowers      rem = d - DIGIT(a, 0);
*5697Smcpowers    else
*5697Smcpowers      rem = DIGIT(a, 0);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if(c)
*5697Smcpowers    *c = rem;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_mod_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_sqrt(a, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_sqrt(a, b)
*5697Smcpowers
*5697Smcpowers  Compute the integer square root of a, and store the result in b.
*5697Smcpowers  Uses an integer-arithmetic version of Newton's iterative linear
*5697Smcpowers  approximation technique to determine this value; the result has the
*5697Smcpowers  following two properties:
*5697Smcpowers
*5697Smcpowers     b^2 <= a
*5697Smcpowers     (b+1)^2 >= a
*5697Smcpowers
*5697Smcpowers  It is a range error to pass a negative value.
*5697Smcpowers */
*5697Smcpowersmp_err mp_sqrt(const mp_int *a, mp_int *b)
*5697Smcpowers{
*5697Smcpowers  mp_int   x, t;
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_size  used;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  /* Cannot take square root of a negative value */
*5697Smcpowers  if(SIGN(a) == NEG)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  /* Special cases for zero and one, trivial     */
*5697Smcpowers  if(mp_cmp_d(a, 1) <= 0)
*5697Smcpowers    return mp_copy(a, b);
*5697Smcpowers
*5697Smcpowers  /* Initialize the temporaries we'll use below  */
*5697Smcpowers  if((res = mp_init_size(&t, USED(a), FLAG(a))) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  /* Compute an initial guess for the iteration as a itself */
*5697Smcpowers  if((res = mp_init_copy(&x, a)) != MP_OKAY)
*5697Smcpowers    goto X;
*5697Smcpowers
*5697Smcpowers  used = MP_USED(&x);
*5697Smcpowers  if (used > 1) {
*5697Smcpowers    s_mp_rshd(&x, used / 2);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  for(;;) {
*5697Smcpowers    /* t = (x * x) - a */
*5697Smcpowers    mp_copy(&x, &t);      /* can't fail, t is big enough for original x */
*5697Smcpowers    if((res = mp_sqr(&t, &t)) != MP_OKAY ||
*5697Smcpowers       (res = mp_sub(&t, a, &t)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers
*5697Smcpowers    /* t = t / 2x       */
*5697Smcpowers    s_mp_mul_2(&x);
*5697Smcpowers    if((res = mp_div(&t, &x, &t, NULL)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers    s_mp_div_2(&x);
*5697Smcpowers
*5697Smcpowers    /* Terminate the loop, if the quotient is zero */
*5697Smcpowers    if(mp_cmp_z(&t) == MP_EQ)
*5697Smcpowers      break;
*5697Smcpowers
*5697Smcpowers    /* x = x - t       */
*5697Smcpowers    if((res = mp_sub(&x, &t, &x)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Copy result to output parameter */
*5697Smcpowers  mp_sub_d(&x, 1, &x);
*5697Smcpowers  s_mp_exch(&x, b);
*5697Smcpowers
*5697Smcpowers CLEANUP:
*5697Smcpowers  mp_clear(&x);
*5697Smcpowers X:
*5697Smcpowers  mp_clear(&t);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_sqrt() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* {{{ Modular arithmetic */
*5697Smcpowers
*5697Smcpowers#if MP_MODARITH
*5697Smcpowers/* {{{ mp_addmod(a, b, m, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_addmod(a, b, m, c)
*5697Smcpowers
*5697Smcpowers  Compute c = (a + b) mod m
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_addmod(const mp_int *a, const mp_int *b, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && m != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_add(a, b, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers  if((res = mp_mod(c, m, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_submod(a, b, m, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_submod(a, b, m, c)
*5697Smcpowers
*5697Smcpowers  Compute c = (a - b) mod m
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_submod(const mp_int *a, const mp_int *b, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && m != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_sub(a, b, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers  if((res = mp_mod(c, m, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_mulmod(a, b, m, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_mulmod(a, b, m, c)
*5697Smcpowers
*5697Smcpowers  Compute c = (a * b) mod m
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_mulmod(const mp_int *a, const mp_int *b, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && m != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_mul(a, b, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers  if((res = mp_mod(c, m, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_sqrmod(a, m, c) */
*5697Smcpowers
*5697Smcpowers#if MP_SQUARE
*5697Smcpowersmp_err mp_sqrmod(const mp_int *a, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && m != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_sqr(a, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers  if((res = mp_mod(c, m, c)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_sqrmod() */
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_exptmod(a, b, m, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  s_mp_exptmod(a, b, m, c)
*5697Smcpowers
*5697Smcpowers  Compute c = (a ** b) mod m.  Uses a standard square-and-multiply
*5697Smcpowers  method with modular reductions at each step. (This is basically the
*5697Smcpowers  same code as mp_expt(), except for the addition of the reductions)
*5697Smcpowers
*5697Smcpowers  The modular reductions are done using Barrett's algorithm (see
*5697Smcpowers  s_mp_reduce() below for details)
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err s_mp_exptmod(const mp_int *a, const mp_int *b, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_int   s, x, mu;
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_digit d;
*5697Smcpowers  int      dig, bit;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(b) < 0 || mp_cmp_z(m) <= 0)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  if((res = mp_init(&s, FLAG(a))) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers  if((res = mp_init_copy(&x, a)) != MP_OKAY ||
*5697Smcpowers     (res = mp_mod(&x, m, &x)) != MP_OKAY)
*5697Smcpowers    goto X;
*5697Smcpowers  if((res = mp_init(&mu, FLAG(a))) != MP_OKAY)
*5697Smcpowers    goto MU;
*5697Smcpowers
*5697Smcpowers  mp_set(&s, 1);
*5697Smcpowers
*5697Smcpowers  /* mu = b^2k / m */
*5697Smcpowers  s_mp_add_d(&mu, 1);
*5697Smcpowers  s_mp_lshd(&mu, 2 * USED(m));
*5697Smcpowers  if((res = mp_div(&mu, m, &mu, NULL)) != MP_OKAY)
*5697Smcpowers    goto CLEANUP;
*5697Smcpowers
*5697Smcpowers  /* Loop over digits of b in ascending order, except highest order */
*5697Smcpowers  for(dig = 0; dig < (USED(b) - 1); dig++) {
*5697Smcpowers    d = DIGIT(b, dig);
*5697Smcpowers
*5697Smcpowers    /* Loop over the bits of the lower-order digits */
*5697Smcpowers    for(bit = 0; bit < DIGIT_BIT; bit++) {
*5697Smcpowers      if(d & 1) {
*5697Smcpowers	if((res = s_mp_mul(&s, &x)) != MP_OKAY)
*5697Smcpowers	  goto CLEANUP;
*5697Smcpowers	if((res = s_mp_reduce(&s, m, &mu)) != MP_OKAY)
*5697Smcpowers	  goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers
*5697Smcpowers      d >>= 1;
*5697Smcpowers
*5697Smcpowers      if((res = s_mp_sqr(&x)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers      if((res = s_mp_reduce(&x, m, &mu)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Now do the last digit... */
*5697Smcpowers  d = DIGIT(b, dig);
*5697Smcpowers
*5697Smcpowers  while(d) {
*5697Smcpowers    if(d & 1) {
*5697Smcpowers      if((res = s_mp_mul(&s, &x)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers      if((res = s_mp_reduce(&s, m, &mu)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    d >>= 1;
*5697Smcpowers
*5697Smcpowers    if((res = s_mp_sqr(&x)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers    if((res = s_mp_reduce(&x, m, &mu)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  s_mp_exch(&s, c);
*5697Smcpowers
*5697Smcpowers CLEANUP:
*5697Smcpowers  mp_clear(&mu);
*5697Smcpowers MU:
*5697Smcpowers  mp_clear(&x);
*5697Smcpowers X:
*5697Smcpowers  mp_clear(&s);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_exptmod() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_exptmod_d(a, d, m, c) */
*5697Smcpowers
*5697Smcpowersmp_err mp_exptmod_d(const mp_int *a, mp_digit d, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_int   s, x;
*5697Smcpowers  mp_err   res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if((res = mp_init(&s, FLAG(a))) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers  if((res = mp_init_copy(&x, a)) != MP_OKAY)
*5697Smcpowers    goto X;
*5697Smcpowers
*5697Smcpowers  mp_set(&s, 1);
*5697Smcpowers
*5697Smcpowers  while(d != 0) {
*5697Smcpowers    if(d & 1) {
*5697Smcpowers      if((res = s_mp_mul(&s, &x)) != MP_OKAY ||
*5697Smcpowers	 (res = mp_mod(&s, m, &s)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    d /= 2;
*5697Smcpowers
*5697Smcpowers    if((res = s_mp_sqr(&x)) != MP_OKAY ||
*5697Smcpowers       (res = mp_mod(&x, m, &x)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  s_mp_exch(&s, c);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&x);
*5697SmcpowersX:
*5697Smcpowers  mp_clear(&s);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_exptmod_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers#endif /* if MP_MODARITH */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* {{{ Comparison functions */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_cmp_z(a) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_cmp_z(a)
*5697Smcpowers
*5697Smcpowers  Compare a <=> 0.  Returns <0 if a<0, 0 if a=0, >0 if a>0.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersint    mp_cmp_z(const mp_int *a)
*5697Smcpowers{
*5697Smcpowers  if(SIGN(a) == NEG)
*5697Smcpowers    return MP_LT;
*5697Smcpowers  else if(USED(a) == 1 && DIGIT(a, 0) == 0)
*5697Smcpowers    return MP_EQ;
*5697Smcpowers  else
*5697Smcpowers    return MP_GT;
*5697Smcpowers
*5697Smcpowers} /* end mp_cmp_z() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_cmp_d(a, d) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_cmp_d(a, d)
*5697Smcpowers
*5697Smcpowers  Compare a <=> d.  Returns <0 if a<d, 0 if a=d, >0 if a>d
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersint    mp_cmp_d(const mp_int *a, mp_digit d)
*5697Smcpowers{
*5697Smcpowers  ARGCHK(a != NULL, MP_EQ);
*5697Smcpowers
*5697Smcpowers  if(SIGN(a) == NEG)
*5697Smcpowers    return MP_LT;
*5697Smcpowers
*5697Smcpowers  return s_mp_cmp_d(a, d);
*5697Smcpowers
*5697Smcpowers} /* end mp_cmp_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_cmp(a, b) */
*5697Smcpowers
*5697Smcpowersint    mp_cmp(const mp_int *a, const mp_int *b)
*5697Smcpowers{
*5697Smcpowers  ARGCHK(a != NULL && b != NULL, MP_EQ);
*5697Smcpowers
*5697Smcpowers  if(SIGN(a) == SIGN(b)) {
*5697Smcpowers    int  mag;
*5697Smcpowers
*5697Smcpowers    if((mag = s_mp_cmp(a, b)) == MP_EQ)
*5697Smcpowers      return MP_EQ;
*5697Smcpowers
*5697Smcpowers    if(SIGN(a) == ZPOS)
*5697Smcpowers      return mag;
*5697Smcpowers    else
*5697Smcpowers      return -mag;
*5697Smcpowers
*5697Smcpowers  } else if(SIGN(a) == ZPOS) {
*5697Smcpowers    return MP_GT;
*5697Smcpowers  } else {
*5697Smcpowers    return MP_LT;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers} /* end mp_cmp() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_cmp_mag(a, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_cmp_mag(a, b)
*5697Smcpowers
*5697Smcpowers  Compares |a| <=> |b|, and returns an appropriate comparison result
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersint    mp_cmp_mag(mp_int *a, mp_int *b)
*5697Smcpowers{
*5697Smcpowers  ARGCHK(a != NULL && b != NULL, MP_EQ);
*5697Smcpowers
*5697Smcpowers  return s_mp_cmp(a, b);
*5697Smcpowers
*5697Smcpowers} /* end mp_cmp_mag() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_cmp_int(a, z, kmflag) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  This just converts z to an mp_int, and uses the existing comparison
*5697Smcpowers  routines.  This is sort of inefficient, but it's not clear to me how
*5697Smcpowers  frequently this wil get used anyway.  For small positive constants,
*5697Smcpowers  you can always use mp_cmp_d(), and for zero, there is mp_cmp_z().
*5697Smcpowers */
*5697Smcpowersint    mp_cmp_int(const mp_int *a, long z, int kmflag)
*5697Smcpowers{
*5697Smcpowers  mp_int  tmp;
*5697Smcpowers  int     out;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL, MP_EQ);
*5697Smcpowers
*5697Smcpowers  mp_init(&tmp, kmflag); mp_set_int(&tmp, z);
*5697Smcpowers  out = mp_cmp(a, &tmp);
*5697Smcpowers  mp_clear(&tmp);
*5697Smcpowers
*5697Smcpowers  return out;
*5697Smcpowers
*5697Smcpowers} /* end mp_cmp_int() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_isodd(a) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_isodd(a)
*5697Smcpowers
*5697Smcpowers  Returns a true (non-zero) value if a is odd, false (zero) otherwise.
*5697Smcpowers */
*5697Smcpowersint    mp_isodd(const mp_int *a)
*5697Smcpowers{
*5697Smcpowers  ARGCHK(a != NULL, 0);
*5697Smcpowers
*5697Smcpowers  return (int)(DIGIT(a, 0) & 1);
*5697Smcpowers
*5697Smcpowers} /* end mp_isodd() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_iseven(a) */
*5697Smcpowers
*5697Smcpowersint    mp_iseven(const mp_int *a)
*5697Smcpowers{
*5697Smcpowers  return !mp_isodd(a);
*5697Smcpowers
*5697Smcpowers} /* end mp_iseven() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* {{{ Number theoretic functions */
*5697Smcpowers
*5697Smcpowers#if MP_NUMTH
*5697Smcpowers/* {{{ mp_gcd(a, b, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Like the old mp_gcd() function, except computes the GCD using the
*5697Smcpowers  binary algorithm due to Josef Stein in 1961 (via Knuth).
*5697Smcpowers */
*5697Smcpowersmp_err mp_gcd(mp_int *a, mp_int *b, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_int   u, v, t;
*5697Smcpowers  mp_size  k = 0;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(a) == MP_EQ && mp_cmp_z(b) == MP_EQ)
*5697Smcpowers      return MP_RANGE;
*5697Smcpowers  if(mp_cmp_z(a) == MP_EQ) {
*5697Smcpowers    return mp_copy(b, c);
*5697Smcpowers  } else if(mp_cmp_z(b) == MP_EQ) {
*5697Smcpowers    return mp_copy(a, c);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if((res = mp_init(&t, FLAG(a))) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers  if((res = mp_init_copy(&u, a)) != MP_OKAY)
*5697Smcpowers    goto U;
*5697Smcpowers  if((res = mp_init_copy(&v, b)) != MP_OKAY)
*5697Smcpowers    goto V;
*5697Smcpowers
*5697Smcpowers  SIGN(&u) = ZPOS;
*5697Smcpowers  SIGN(&v) = ZPOS;
*5697Smcpowers
*5697Smcpowers  /* Divide out common factors of 2 until at least 1 of a, b is even */
*5697Smcpowers  while(mp_iseven(&u) && mp_iseven(&v)) {
*5697Smcpowers    s_mp_div_2(&u);
*5697Smcpowers    s_mp_div_2(&v);
*5697Smcpowers    ++k;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Initialize t */
*5697Smcpowers  if(mp_isodd(&u)) {
*5697Smcpowers    if((res = mp_copy(&v, &t)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers
*5697Smcpowers    /* t = -v */
*5697Smcpowers    if(SIGN(&v) == ZPOS)
*5697Smcpowers      SIGN(&t) = NEG;
*5697Smcpowers    else
*5697Smcpowers      SIGN(&t) = ZPOS;
*5697Smcpowers
*5697Smcpowers  } else {
*5697Smcpowers    if((res = mp_copy(&u, &t)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  for(;;) {
*5697Smcpowers    while(mp_iseven(&t)) {
*5697Smcpowers      s_mp_div_2(&t);
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    if(mp_cmp_z(&t) == MP_GT) {
*5697Smcpowers      if((res = mp_copy(&t, &u)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers
*5697Smcpowers    } else {
*5697Smcpowers      if((res = mp_copy(&t, &v)) != MP_OKAY)
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers
*5697Smcpowers      /* v = -t */
*5697Smcpowers      if(SIGN(&t) == ZPOS)
*5697Smcpowers	SIGN(&v) = NEG;
*5697Smcpowers      else
*5697Smcpowers	SIGN(&v) = ZPOS;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    if((res = mp_sub(&u, &v, &t)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers
*5697Smcpowers    if(s_mp_cmp_d(&t, 0) == MP_EQ)
*5697Smcpowers      break;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  s_mp_2expt(&v, k);       /* v = 2^k   */
*5697Smcpowers  res = mp_mul(&u, &v, c); /* c = u * v */
*5697Smcpowers
*5697Smcpowers CLEANUP:
*5697Smcpowers  mp_clear(&v);
*5697Smcpowers V:
*5697Smcpowers  mp_clear(&u);
*5697Smcpowers U:
*5697Smcpowers  mp_clear(&t);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_gcd() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_lcm(a, b, c) */
*5697Smcpowers
*5697Smcpowers/* We compute the least common multiple using the rule:
*5697Smcpowers
*5697Smcpowers   ab = [a, b](a, b)
*5697Smcpowers
*5697Smcpowers   ... by computing the product, and dividing out the gcd.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_lcm(mp_int *a, mp_int *b, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_int  gcd, prod;
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a != NULL && b != NULL && c != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  /* Set up temporaries */
*5697Smcpowers  if((res = mp_init(&gcd, FLAG(a))) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers  if((res = mp_init(&prod, FLAG(a))) != MP_OKAY)
*5697Smcpowers    goto GCD;
*5697Smcpowers
*5697Smcpowers  if((res = mp_mul(a, b, &prod)) != MP_OKAY)
*5697Smcpowers    goto CLEANUP;
*5697Smcpowers  if((res = mp_gcd(a, b, &gcd)) != MP_OKAY)
*5697Smcpowers    goto CLEANUP;
*5697Smcpowers
*5697Smcpowers  res = mp_div(&prod, &gcd, c, NULL);
*5697Smcpowers
*5697Smcpowers CLEANUP:
*5697Smcpowers  mp_clear(&prod);
*5697Smcpowers GCD:
*5697Smcpowers  mp_clear(&gcd);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_lcm() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_xgcd(a, b, g, x, y) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_xgcd(a, b, g, x, y)
*5697Smcpowers
*5697Smcpowers  Compute g = (a, b) and values x and y satisfying Bezout's identity
*5697Smcpowers  (that is, ax + by = g).  This uses the binary extended GCD algorithm
*5697Smcpowers  based on the Stein algorithm used for mp_gcd()
*5697Smcpowers  See algorithm 14.61 in Handbook of Applied Cryptogrpahy.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_xgcd(const mp_int *a, const mp_int *b, mp_int *g, mp_int *x, mp_int *y)
*5697Smcpowers{
*5697Smcpowers  mp_int   gx, xc, yc, u, v, A, B, C, D;
*5697Smcpowers  mp_int  *clean[9];
*5697Smcpowers  mp_err   res;
*5697Smcpowers  int      last = -1;
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(b) == 0)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  /* Initialize all these variables we need */
*5697Smcpowers  MP_CHECKOK( mp_init(&u, FLAG(a)) );
*5697Smcpowers  clean[++last] = &u;
*5697Smcpowers  MP_CHECKOK( mp_init(&v, FLAG(a)) );
*5697Smcpowers  clean[++last] = &v;
*5697Smcpowers  MP_CHECKOK( mp_init(&gx, FLAG(a)) );
*5697Smcpowers  clean[++last] = &gx;
*5697Smcpowers  MP_CHECKOK( mp_init(&A, FLAG(a)) );
*5697Smcpowers  clean[++last] = &A;
*5697Smcpowers  MP_CHECKOK( mp_init(&B, FLAG(a)) );
*5697Smcpowers  clean[++last] = &B;
*5697Smcpowers  MP_CHECKOK( mp_init(&C, FLAG(a)) );
*5697Smcpowers  clean[++last] = &C;
*5697Smcpowers  MP_CHECKOK( mp_init(&D, FLAG(a)) );
*5697Smcpowers  clean[++last] = &D;
*5697Smcpowers  MP_CHECKOK( mp_init_copy(&xc, a) );
*5697Smcpowers  clean[++last] = &xc;
*5697Smcpowers  mp_abs(&xc, &xc);
*5697Smcpowers  MP_CHECKOK( mp_init_copy(&yc, b) );
*5697Smcpowers  clean[++last] = &yc;
*5697Smcpowers  mp_abs(&yc, &yc);
*5697Smcpowers
*5697Smcpowers  mp_set(&gx, 1);
*5697Smcpowers
*5697Smcpowers  /* Divide by two until at least one of them is odd */
*5697Smcpowers  while(mp_iseven(&xc) && mp_iseven(&yc)) {
*5697Smcpowers    mp_size nx = mp_trailing_zeros(&xc);
*5697Smcpowers    mp_size ny = mp_trailing_zeros(&yc);
*5697Smcpowers    mp_size n  = MP_MIN(nx, ny);
*5697Smcpowers    s_mp_div_2d(&xc,n);
*5697Smcpowers    s_mp_div_2d(&yc,n);
*5697Smcpowers    MP_CHECKOK( s_mp_mul_2d(&gx,n) );
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  mp_copy(&xc, &u);
*5697Smcpowers  mp_copy(&yc, &v);
*5697Smcpowers  mp_set(&A, 1); mp_set(&D, 1);
*5697Smcpowers
*5697Smcpowers  /* Loop through binary GCD algorithm */
*5697Smcpowers  do {
*5697Smcpowers    while(mp_iseven(&u)) {
*5697Smcpowers      s_mp_div_2(&u);
*5697Smcpowers
*5697Smcpowers      if(mp_iseven(&A) && mp_iseven(&B)) {
*5697Smcpowers	s_mp_div_2(&A); s_mp_div_2(&B);
*5697Smcpowers      } else {
*5697Smcpowers	MP_CHECKOK( mp_add(&A, &yc, &A) );
*5697Smcpowers	s_mp_div_2(&A);
*5697Smcpowers	MP_CHECKOK( mp_sub(&B, &xc, &B) );
*5697Smcpowers	s_mp_div_2(&B);
*5697Smcpowers      }
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    while(mp_iseven(&v)) {
*5697Smcpowers      s_mp_div_2(&v);
*5697Smcpowers
*5697Smcpowers      if(mp_iseven(&C) && mp_iseven(&D)) {
*5697Smcpowers	s_mp_div_2(&C); s_mp_div_2(&D);
*5697Smcpowers      } else {
*5697Smcpowers	MP_CHECKOK( mp_add(&C, &yc, &C) );
*5697Smcpowers	s_mp_div_2(&C);
*5697Smcpowers	MP_CHECKOK( mp_sub(&D, &xc, &D) );
*5697Smcpowers	s_mp_div_2(&D);
*5697Smcpowers      }
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    if(mp_cmp(&u, &v) >= 0) {
*5697Smcpowers      MP_CHECKOK( mp_sub(&u, &v, &u) );
*5697Smcpowers      MP_CHECKOK( mp_sub(&A, &C, &A) );
*5697Smcpowers      MP_CHECKOK( mp_sub(&B, &D, &B) );
*5697Smcpowers    } else {
*5697Smcpowers      MP_CHECKOK( mp_sub(&v, &u, &v) );
*5697Smcpowers      MP_CHECKOK( mp_sub(&C, &A, &C) );
*5697Smcpowers      MP_CHECKOK( mp_sub(&D, &B, &D) );
*5697Smcpowers    }
*5697Smcpowers  } while (mp_cmp_z(&u) != 0);
*5697Smcpowers
*5697Smcpowers  /* copy results to output */
*5697Smcpowers  if(x)
*5697Smcpowers    MP_CHECKOK( mp_copy(&C, x) );
*5697Smcpowers
*5697Smcpowers  if(y)
*5697Smcpowers    MP_CHECKOK( mp_copy(&D, y) );
*5697Smcpowers
*5697Smcpowers  if(g)
*5697Smcpowers    MP_CHECKOK( mp_mul(&gx, &v, g) );
*5697Smcpowers
*5697Smcpowers CLEANUP:
*5697Smcpowers  while(last >= 0)
*5697Smcpowers    mp_clear(clean[last--]);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end mp_xgcd() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowersmp_size mp_trailing_zeros(const mp_int *mp)
*5697Smcpowers{
*5697Smcpowers  mp_digit d;
*5697Smcpowers  mp_size  n = 0;
*5697Smcpowers  int      ix;
*5697Smcpowers
*5697Smcpowers  if (!mp || !MP_DIGITS(mp) || !mp_cmp_z(mp))
*5697Smcpowers    return n;
*5697Smcpowers
*5697Smcpowers  for (ix = 0; !(d = MP_DIGIT(mp,ix)) && (ix < MP_USED(mp)); ++ix)
*5697Smcpowers    n += MP_DIGIT_BIT;
*5697Smcpowers  if (!d)
*5697Smcpowers    return 0;	/* shouldn't happen, but ... */
*5697Smcpowers#if !defined(MP_USE_UINT_DIGIT)
*5697Smcpowers  if (!(d & 0xffffffffU)) {
*5697Smcpowers    d >>= 32;
*5697Smcpowers    n  += 32;
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers  if (!(d & 0xffffU)) {
*5697Smcpowers    d >>= 16;
*5697Smcpowers    n  += 16;
*5697Smcpowers  }
*5697Smcpowers  if (!(d & 0xffU)) {
*5697Smcpowers    d >>= 8;
*5697Smcpowers    n  += 8;
*5697Smcpowers  }
*5697Smcpowers  if (!(d & 0xfU)) {
*5697Smcpowers    d >>= 4;
*5697Smcpowers    n  += 4;
*5697Smcpowers  }
*5697Smcpowers  if (!(d & 0x3U)) {
*5697Smcpowers    d >>= 2;
*5697Smcpowers    n  += 2;
*5697Smcpowers  }
*5697Smcpowers  if (!(d & 0x1U)) {
*5697Smcpowers    d >>= 1;
*5697Smcpowers    n  += 1;
*5697Smcpowers  }
*5697Smcpowers#if MP_ARGCHK == 2
*5697Smcpowers  assert(0 != (d & 1));
*5697Smcpowers#endif
*5697Smcpowers  return n;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* Given a and prime p, computes c and k such that a*c == 2**k (mod p).
*5697Smcpowers** Returns k (positive) or error (negative).
*5697Smcpowers** This technique from the paper "Fast Modular Reciprocals" (unpublished)
*5697Smcpowers** by Richard Schroeppel (a.k.a. Captain Nemo).
*5697Smcpowers*/
*5697Smcpowersmp_err s_mp_almost_inverse(const mp_int *a, const mp_int *p, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err res;
*5697Smcpowers  mp_err k    = 0;
*5697Smcpowers  mp_int d, f, g;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a && p && c, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  MP_DIGITS(&d) = 0;
*5697Smcpowers  MP_DIGITS(&f) = 0;
*5697Smcpowers  MP_DIGITS(&g) = 0;
*5697Smcpowers  MP_CHECKOK( mp_init(&d, FLAG(a)) );
*5697Smcpowers  MP_CHECKOK( mp_init_copy(&f, a) );	/* f = a */
*5697Smcpowers  MP_CHECKOK( mp_init_copy(&g, p) );	/* g = p */
*5697Smcpowers
*5697Smcpowers  mp_set(c, 1);
*5697Smcpowers  mp_zero(&d);
*5697Smcpowers
*5697Smcpowers  if (mp_cmp_z(&f) == 0) {
*5697Smcpowers    res = MP_UNDEF;
*5697Smcpowers  } else
*5697Smcpowers  for (;;) {
*5697Smcpowers    int diff_sign;
*5697Smcpowers    while (mp_iseven(&f)) {
*5697Smcpowers      mp_size n = mp_trailing_zeros(&f);
*5697Smcpowers      if (!n) {
*5697Smcpowers	res = MP_UNDEF;
*5697Smcpowers	goto CLEANUP;
*5697Smcpowers      }
*5697Smcpowers      s_mp_div_2d(&f, n);
*5697Smcpowers      MP_CHECKOK( s_mp_mul_2d(&d, n) );
*5697Smcpowers      k += n;
*5697Smcpowers    }
*5697Smcpowers    if (mp_cmp_d(&f, 1) == MP_EQ) {	/* f == 1 */
*5697Smcpowers      res = k;
*5697Smcpowers      break;
*5697Smcpowers    }
*5697Smcpowers    diff_sign = mp_cmp(&f, &g);
*5697Smcpowers    if (diff_sign < 0) {		/* f < g */
*5697Smcpowers      s_mp_exch(&f, &g);
*5697Smcpowers      s_mp_exch(c, &d);
*5697Smcpowers    } else if (diff_sign == 0) {		/* f == g */
*5697Smcpowers      res = MP_UNDEF;		/* a and p are not relatively prime */
*5697Smcpowers      break;
*5697Smcpowers    }
*5697Smcpowers    if ((MP_DIGIT(&f,0) % 4) == (MP_DIGIT(&g,0) % 4)) {
*5697Smcpowers      MP_CHECKOK( mp_sub(&f, &g, &f) );	/* f = f - g */
*5697Smcpowers      MP_CHECKOK( mp_sub(c,  &d,  c) );	/* c = c - d */
*5697Smcpowers    } else {
*5697Smcpowers      MP_CHECKOK( mp_add(&f, &g, &f) );	/* f = f + g */
*5697Smcpowers      MP_CHECKOK( mp_add(c,  &d,  c) );	/* c = c + d */
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers  if (res >= 0) {
*5697Smcpowers    while (MP_SIGN(c) != MP_ZPOS) {
*5697Smcpowers      MP_CHECKOK( mp_add(c, p, c) );
*5697Smcpowers    }
*5697Smcpowers    res = k;
*5697Smcpowers  }
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&d);
*5697Smcpowers  mp_clear(&f);
*5697Smcpowers  mp_clear(&g);
*5697Smcpowers  return res;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* Compute T = (P ** -1) mod MP_RADIX.  Also works for 16-bit mp_digits.
*5697Smcpowers** This technique from the paper "Fast Modular Reciprocals" (unpublished)
*5697Smcpowers** by Richard Schroeppel (a.k.a. Captain Nemo).
*5697Smcpowers*/
*5697Smcpowersmp_digit  s_mp_invmod_radix(mp_digit P)
*5697Smcpowers{
*5697Smcpowers  mp_digit T = P;
*5697Smcpowers  T *= 2 - (P * T);
*5697Smcpowers  T *= 2 - (P * T);
*5697Smcpowers  T *= 2 - (P * T);
*5697Smcpowers  T *= 2 - (P * T);
*5697Smcpowers#if !defined(MP_USE_UINT_DIGIT)
*5697Smcpowers  T *= 2 - (P * T);
*5697Smcpowers  T *= 2 - (P * T);
*5697Smcpowers#endif
*5697Smcpowers  return T;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* Given c, k, and prime p, where a*c == 2**k (mod p),
*5697Smcpowers** Compute x = (a ** -1) mod p.  This is similar to Montgomery reduction.
*5697Smcpowers** This technique from the paper "Fast Modular Reciprocals" (unpublished)
*5697Smcpowers** by Richard Schroeppel (a.k.a. Captain Nemo).
*5697Smcpowers*/
*5697Smcpowersmp_err  s_mp_fixup_reciprocal(const mp_int *c, const mp_int *p, int k, mp_int *x)
*5697Smcpowers{
*5697Smcpowers  int      k_orig = k;
*5697Smcpowers  mp_digit r;
*5697Smcpowers  mp_size  ix;
*5697Smcpowers  mp_err   res;
*5697Smcpowers
*5697Smcpowers  if (mp_cmp_z(c) < 0) {		/* c < 0 */
*5697Smcpowers    MP_CHECKOK( mp_add(c, p, x) );	/* x = c + p */
*5697Smcpowers  } else {
*5697Smcpowers    MP_CHECKOK( mp_copy(c, x) );	/* x = c */
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* make sure x is large enough */
*5697Smcpowers  ix = MP_HOWMANY(k, MP_DIGIT_BIT) + MP_USED(p) + 1;
*5697Smcpowers  ix = MP_MAX(ix, MP_USED(x));
*5697Smcpowers  MP_CHECKOK( s_mp_pad(x, ix) );
*5697Smcpowers
*5697Smcpowers  r = 0 - s_mp_invmod_radix(MP_DIGIT(p,0));
*5697Smcpowers
*5697Smcpowers  for (ix = 0; k > 0; ix++) {
*5697Smcpowers    int      j = MP_MIN(k, MP_DIGIT_BIT);
*5697Smcpowers    mp_digit v = r * MP_DIGIT(x, ix);
*5697Smcpowers    if (j < MP_DIGIT_BIT) {
*5697Smcpowers      v &= ((mp_digit)1 << j) - 1;	/* v = v mod (2 ** j) */
*5697Smcpowers    }
*5697Smcpowers    s_mp_mul_d_add_offset(p, v, x, ix); /* x += p * v * (RADIX ** ix) */
*5697Smcpowers    k -= j;
*5697Smcpowers  }
*5697Smcpowers  s_mp_clamp(x);
*5697Smcpowers  s_mp_div_2d(x, k_orig);
*5697Smcpowers  res = MP_OKAY;
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  return res;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* compute mod inverse using Schroeppel's method, only if m is odd */
*5697Smcpowersmp_err s_mp_invmod_odd_m(const mp_int *a, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  int k;
*5697Smcpowers  mp_err  res;
*5697Smcpowers  mp_int  x;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a && m && c, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(a) == 0 || mp_cmp_z(m) == 0)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers  if (mp_iseven(m))
*5697Smcpowers    return MP_UNDEF;
*5697Smcpowers
*5697Smcpowers  MP_DIGITS(&x) = 0;
*5697Smcpowers
*5697Smcpowers  if (a == c) {
*5697Smcpowers    if ((res = mp_init_copy(&x, a)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers    if (a == m)
*5697Smcpowers      m = &x;
*5697Smcpowers    a = &x;
*5697Smcpowers  } else if (m == c) {
*5697Smcpowers    if ((res = mp_init_copy(&x, m)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers    m = &x;
*5697Smcpowers  } else {
*5697Smcpowers    MP_DIGITS(&x) = 0;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  MP_CHECKOK( s_mp_almost_inverse(a, m, c) );
*5697Smcpowers  k = res;
*5697Smcpowers  MP_CHECKOK( s_mp_fixup_reciprocal(c, m, k, c) );
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&x);
*5697Smcpowers  return res;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* Known good algorithm for computing modular inverse.  But slow. */
*5697Smcpowersmp_err mp_invmod_xgcd(const mp_int *a, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_int  g, x;
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  ARGCHK(a && m && c, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(a) == 0 || mp_cmp_z(m) == 0)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  MP_DIGITS(&g) = 0;
*5697Smcpowers  MP_DIGITS(&x) = 0;
*5697Smcpowers  MP_CHECKOK( mp_init(&x, FLAG(a)) );
*5697Smcpowers  MP_CHECKOK( mp_init(&g, FLAG(a)) );
*5697Smcpowers
*5697Smcpowers  MP_CHECKOK( mp_xgcd(a, m, &g, &x, NULL) );
*5697Smcpowers
*5697Smcpowers  if (mp_cmp_d(&g, 1) != MP_EQ) {
*5697Smcpowers    res = MP_UNDEF;
*5697Smcpowers    goto CLEANUP;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  res = mp_mod(&x, m, c);
*5697Smcpowers  SIGN(c) = SIGN(a);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&x);
*5697Smcpowers  mp_clear(&g);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* modular inverse where modulus is 2**k. */
*5697Smcpowers/* c = a**-1 mod 2**k */
*5697Smcpowersmp_err s_mp_invmod_2d(const mp_int *a, mp_size k, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err res;
*5697Smcpowers  mp_size ix = k + 4;
*5697Smcpowers  mp_int t0, t1, val, tmp, two2k;
*5697Smcpowers
*5697Smcpowers  static const mp_digit d2 = 2;
*5697Smcpowers  static const mp_int two = { 0, MP_ZPOS, 1, 1, (mp_digit *)&d2 };
*5697Smcpowers
*5697Smcpowers  if (mp_iseven(a))
*5697Smcpowers    return MP_UNDEF;
*5697Smcpowers  if (k <= MP_DIGIT_BIT) {
*5697Smcpowers    mp_digit i = s_mp_invmod_radix(MP_DIGIT(a,0));
*5697Smcpowers    if (k < MP_DIGIT_BIT)
*5697Smcpowers      i &= ((mp_digit)1 << k) - (mp_digit)1;
*5697Smcpowers    mp_set(c, i);
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers  }
*5697Smcpowers  MP_DIGITS(&t0) = 0;
*5697Smcpowers  MP_DIGITS(&t1) = 0;
*5697Smcpowers  MP_DIGITS(&val) = 0;
*5697Smcpowers  MP_DIGITS(&tmp) = 0;
*5697Smcpowers  MP_DIGITS(&two2k) = 0;
*5697Smcpowers  MP_CHECKOK( mp_init_copy(&val, a) );
*5697Smcpowers  s_mp_mod_2d(&val, k);
*5697Smcpowers  MP_CHECKOK( mp_init_copy(&t0, &val) );
*5697Smcpowers  MP_CHECKOK( mp_init_copy(&t1, &t0)  );
*5697Smcpowers  MP_CHECKOK( mp_init(&tmp, FLAG(a)) );
*5697Smcpowers  MP_CHECKOK( mp_init(&two2k, FLAG(a)) );
*5697Smcpowers  MP_CHECKOK( s_mp_2expt(&two2k, k) );
*5697Smcpowers  do {
*5697Smcpowers    MP_CHECKOK( mp_mul(&val, &t1, &tmp)  );
*5697Smcpowers    MP_CHECKOK( mp_sub(&two, &tmp, &tmp) );
*5697Smcpowers    MP_CHECKOK( mp_mul(&t1, &tmp, &t1)   );
*5697Smcpowers    s_mp_mod_2d(&t1, k);
*5697Smcpowers    while (MP_SIGN(&t1) != MP_ZPOS) {
*5697Smcpowers      MP_CHECKOK( mp_add(&t1, &two2k, &t1) );
*5697Smcpowers    }
*5697Smcpowers    if (mp_cmp(&t1, &t0) == MP_EQ)
*5697Smcpowers      break;
*5697Smcpowers    MP_CHECKOK( mp_copy(&t1, &t0) );
*5697Smcpowers  } while (--ix > 0);
*5697Smcpowers  if (!ix) {
*5697Smcpowers    res = MP_UNDEF;
*5697Smcpowers  } else {
*5697Smcpowers    mp_exch(c, &t1);
*5697Smcpowers  }
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&t0);
*5697Smcpowers  mp_clear(&t1);
*5697Smcpowers  mp_clear(&val);
*5697Smcpowers  mp_clear(&tmp);
*5697Smcpowers  mp_clear(&two2k);
*5697Smcpowers  return res;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowersmp_err s_mp_invmod_even_m(const mp_int *a, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_err res;
*5697Smcpowers  mp_size k;
*5697Smcpowers  mp_int oddFactor, evenFactor;	/* factors of the modulus */
*5697Smcpowers  mp_int oddPart, evenPart;	/* parts to combine via CRT. */
*5697Smcpowers  mp_int C2, tmp1, tmp2;
*5697Smcpowers
*5697Smcpowers  /*static const mp_digit d1 = 1; */
*5697Smcpowers  /*static const mp_int one = { MP_ZPOS, 1, 1, (mp_digit *)&d1 }; */
*5697Smcpowers
*5697Smcpowers  if ((res = s_mp_ispow2(m)) >= 0) {
*5697Smcpowers    k = res;
*5697Smcpowers    return s_mp_invmod_2d(a, k, c);
*5697Smcpowers  }
*5697Smcpowers  MP_DIGITS(&oddFactor) = 0;
*5697Smcpowers  MP_DIGITS(&evenFactor) = 0;
*5697Smcpowers  MP_DIGITS(&oddPart) = 0;
*5697Smcpowers  MP_DIGITS(&evenPart) = 0;
*5697Smcpowers  MP_DIGITS(&C2)     = 0;
*5697Smcpowers  MP_DIGITS(&tmp1)   = 0;
*5697Smcpowers  MP_DIGITS(&tmp2)   = 0;
*5697Smcpowers
*5697Smcpowers  MP_CHECKOK( mp_init_copy(&oddFactor, m) );    /* oddFactor = m */
*5697Smcpowers  MP_CHECKOK( mp_init(&evenFactor, FLAG(m)) );
*5697Smcpowers  MP_CHECKOK( mp_init(&oddPart, FLAG(m)) );
*5697Smcpowers  MP_CHECKOK( mp_init(&evenPart, FLAG(m)) );
*5697Smcpowers  MP_CHECKOK( mp_init(&C2, FLAG(m))     );
*5697Smcpowers  MP_CHECKOK( mp_init(&tmp1, FLAG(m))   );
*5697Smcpowers  MP_CHECKOK( mp_init(&tmp2, FLAG(m))   );
*5697Smcpowers
*5697Smcpowers  k = mp_trailing_zeros(m);
*5697Smcpowers  s_mp_div_2d(&oddFactor, k);
*5697Smcpowers  MP_CHECKOK( s_mp_2expt(&evenFactor, k) );
*5697Smcpowers
*5697Smcpowers  /* compute a**-1 mod oddFactor. */
*5697Smcpowers  MP_CHECKOK( s_mp_invmod_odd_m(a, &oddFactor, &oddPart) );
*5697Smcpowers  /* compute a**-1 mod evenFactor, where evenFactor == 2**k. */
*5697Smcpowers  MP_CHECKOK( s_mp_invmod_2d(   a,       k,    &evenPart) );
*5697Smcpowers
*5697Smcpowers  /* Use Chinese Remainer theorem to compute a**-1 mod m. */
*5697Smcpowers  /* let m1 = oddFactor,  v1 = oddPart,
*5697Smcpowers   * let m2 = evenFactor, v2 = evenPart.
*5697Smcpowers   */
*5697Smcpowers
*5697Smcpowers  /* Compute C2 = m1**-1 mod m2. */
*5697Smcpowers  MP_CHECKOK( s_mp_invmod_2d(&oddFactor, k,    &C2) );
*5697Smcpowers
*5697Smcpowers  /* compute u = (v2 - v1)*C2 mod m2 */
*5697Smcpowers  MP_CHECKOK( mp_sub(&evenPart, &oddPart,   &tmp1) );
*5697Smcpowers  MP_CHECKOK( mp_mul(&tmp1,     &C2,        &tmp2) );
*5697Smcpowers  s_mp_mod_2d(&tmp2, k);
*5697Smcpowers  while (MP_SIGN(&tmp2) != MP_ZPOS) {
*5697Smcpowers    MP_CHECKOK( mp_add(&tmp2, &evenFactor, &tmp2) );
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* compute answer = v1 + u*m1 */
*5697Smcpowers  MP_CHECKOK( mp_mul(&tmp2,     &oddFactor, c) );
*5697Smcpowers  MP_CHECKOK( mp_add(&oddPart,  c,          c) );
*5697Smcpowers  /* not sure this is necessary, but it's low cost if not. */
*5697Smcpowers  MP_CHECKOK( mp_mod(c,         m,          c) );
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&oddFactor);
*5697Smcpowers  mp_clear(&evenFactor);
*5697Smcpowers  mp_clear(&oddPart);
*5697Smcpowers  mp_clear(&evenPart);
*5697Smcpowers  mp_clear(&C2);
*5697Smcpowers  mp_clear(&tmp1);
*5697Smcpowers  mp_clear(&tmp2);
*5697Smcpowers  return res;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers
*5697Smcpowers/* {{{ mp_invmod(a, m, c) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_invmod(a, m, c)
*5697Smcpowers
*5697Smcpowers  Compute c = a^-1 (mod m), if there is an inverse for a (mod m).
*5697Smcpowers  This is equivalent to the question of whether (a, m) = 1.  If not,
*5697Smcpowers  MP_UNDEF is returned, and there is no inverse.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err mp_invmod(const mp_int *a, const mp_int *m, mp_int *c)
*5697Smcpowers{
*5697Smcpowers
*5697Smcpowers  ARGCHK(a && m && c, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(a) == 0 || mp_cmp_z(m) == 0)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  if (mp_isodd(m)) {
*5697Smcpowers    return s_mp_invmod_odd_m(a, m, c);
*5697Smcpowers  }
*5697Smcpowers  if (mp_iseven(a))
*5697Smcpowers    return MP_UNDEF;	/* not invertable */
*5697Smcpowers
*5697Smcpowers  return s_mp_invmod_even_m(a, m, c);
*5697Smcpowers
*5697Smcpowers} /* end mp_invmod() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers#endif /* if MP_NUMTH */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* {{{ mp_print(mp, ofp) */
*5697Smcpowers
*5697Smcpowers#if MP_IOFUNC
*5697Smcpowers/*
*5697Smcpowers  mp_print(mp, ofp)
*5697Smcpowers
*5697Smcpowers  Print a textual representation of the given mp_int on the output
*5697Smcpowers  stream 'ofp'.  Output is generated using the internal radix.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersvoid   mp_print(mp_int *mp, FILE *ofp)
*5697Smcpowers{
*5697Smcpowers  int   ix;
*5697Smcpowers
*5697Smcpowers  if(mp == NULL || ofp == NULL)
*5697Smcpowers    return;
*5697Smcpowers
*5697Smcpowers  fputc((SIGN(mp) == NEG) ? '-' : '+', ofp);
*5697Smcpowers
*5697Smcpowers  for(ix = USED(mp) - 1; ix >= 0; ix--) {
*5697Smcpowers    fprintf(ofp, DIGIT_FMT, DIGIT(mp, ix));
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers} /* end mp_print() */
*5697Smcpowers
*5697Smcpowers#endif /* if MP_IOFUNC */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* {{{ More I/O Functions */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_read_raw(mp, str, len) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers   mp_read_raw(mp, str, len)
*5697Smcpowers
*5697Smcpowers   Read in a raw value (base 256) into the given mp_int
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err  mp_read_raw(mp_int *mp, char *str, int len)
*5697Smcpowers{
*5697Smcpowers  int            ix;
*5697Smcpowers  mp_err         res;
*5697Smcpowers  unsigned char *ustr = (unsigned char *)str;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL && str != NULL && len > 0, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  mp_zero(mp);
*5697Smcpowers
*5697Smcpowers  /* Get sign from first byte */
*5697Smcpowers  if(ustr[0])
*5697Smcpowers    SIGN(mp) = NEG;
*5697Smcpowers  else
*5697Smcpowers    SIGN(mp) = ZPOS;
*5697Smcpowers
*5697Smcpowers  /* Read the rest of the digits */
*5697Smcpowers  for(ix = 1; ix < len; ix++) {
*5697Smcpowers    if((res = mp_mul_d(mp, 256, mp)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers    if((res = mp_add_d(mp, ustr[ix], mp)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_read_raw() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_raw_size(mp) */
*5697Smcpowers
*5697Smcpowersint    mp_raw_size(mp_int *mp)
*5697Smcpowers{
*5697Smcpowers  ARGCHK(mp != NULL, 0);
*5697Smcpowers
*5697Smcpowers  return (USED(mp) * sizeof(mp_digit)) + 1;
*5697Smcpowers
*5697Smcpowers} /* end mp_raw_size() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_toraw(mp, str) */
*5697Smcpowers
*5697Smcpowersmp_err mp_toraw(mp_int *mp, char *str)
*5697Smcpowers{
*5697Smcpowers  int  ix, jx, pos = 1;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL && str != NULL, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  str[0] = (char)SIGN(mp);
*5697Smcpowers
*5697Smcpowers  /* Iterate over each digit... */
*5697Smcpowers  for(ix = USED(mp) - 1; ix >= 0; ix--) {
*5697Smcpowers    mp_digit  d = DIGIT(mp, ix);
*5697Smcpowers
*5697Smcpowers    /* Unpack digit bytes, high order first */
*5697Smcpowers    for(jx = sizeof(mp_digit) - 1; jx >= 0; jx--) {
*5697Smcpowers      str[pos++] = (char)(d >> (jx * CHAR_BIT));
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_toraw() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_read_radix(mp, str, radix) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_read_radix(mp, str, radix)
*5697Smcpowers
*5697Smcpowers  Read an integer from the given string, and set mp to the resulting
*5697Smcpowers  value.  The input is presumed to be in base 10.  Leading non-digit
*5697Smcpowers  characters are ignored, and the function reads until a non-digit
*5697Smcpowers  character or the end of the string.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err  mp_read_radix(mp_int *mp, const char *str, int radix)
*5697Smcpowers{
*5697Smcpowers  int     ix = 0, val = 0;
*5697Smcpowers  mp_err  res;
*5697Smcpowers  mp_sign sig = ZPOS;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL && str != NULL && radix >= 2 && radix <= MAX_RADIX,
*5697Smcpowers	 MP_BADARG);
*5697Smcpowers
*5697Smcpowers  mp_zero(mp);
*5697Smcpowers
*5697Smcpowers  /* Skip leading non-digit characters until a digit or '-' or '+' */
*5697Smcpowers  while(str[ix] &&
*5697Smcpowers	(s_mp_tovalue(str[ix], radix) < 0) &&
*5697Smcpowers	str[ix] != '-' &&
*5697Smcpowers	str[ix] != '+') {
*5697Smcpowers    ++ix;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if(str[ix] == '-') {
*5697Smcpowers    sig = NEG;
*5697Smcpowers    ++ix;
*5697Smcpowers  } else if(str[ix] == '+') {
*5697Smcpowers    sig = ZPOS; /* this is the default anyway... */
*5697Smcpowers    ++ix;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  while((val = s_mp_tovalue(str[ix], radix)) >= 0) {
*5697Smcpowers    if((res = s_mp_mul_d(mp, radix)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers    if((res = s_mp_add_d(mp, val)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers    ++ix;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if(s_mp_cmp_d(mp, 0) == MP_EQ)
*5697Smcpowers    SIGN(mp) = ZPOS;
*5697Smcpowers  else
*5697Smcpowers    SIGN(mp) = sig;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_read_radix() */
*5697Smcpowers
*5697Smcpowersmp_err mp_read_variable_radix(mp_int *a, const char * str, int default_radix)
*5697Smcpowers{
*5697Smcpowers  int     radix = default_radix;
*5697Smcpowers  int     cx;
*5697Smcpowers  mp_sign sig   = ZPOS;
*5697Smcpowers  mp_err  res;
*5697Smcpowers
*5697Smcpowers  /* Skip leading non-digit characters until a digit or '-' or '+' */
*5697Smcpowers  while ((cx = *str) != 0 &&
*5697Smcpowers	(s_mp_tovalue(cx, radix) < 0) &&
*5697Smcpowers	cx != '-' &&
*5697Smcpowers	cx != '+') {
*5697Smcpowers    ++str;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if (cx == '-') {
*5697Smcpowers    sig = NEG;
*5697Smcpowers    ++str;
*5697Smcpowers  } else if (cx == '+') {
*5697Smcpowers    sig = ZPOS; /* this is the default anyway... */
*5697Smcpowers    ++str;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if (str[0] == '0') {
*5697Smcpowers    if ((str[1] | 0x20) == 'x') {
*5697Smcpowers      radix = 16;
*5697Smcpowers      str += 2;
*5697Smcpowers    } else {
*5697Smcpowers      radix = 8;
*5697Smcpowers      str++;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers  res = mp_read_radix(a, str, radix);
*5697Smcpowers  if (res == MP_OKAY) {
*5697Smcpowers    MP_SIGN(a) = (s_mp_cmp_d(a, 0) == MP_EQ) ? ZPOS : sig;
*5697Smcpowers  }
*5697Smcpowers  return res;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_radix_size(mp, radix) */
*5697Smcpowers
*5697Smcpowersint    mp_radix_size(mp_int *mp, int radix)
*5697Smcpowers{
*5697Smcpowers  int  bits;
*5697Smcpowers
*5697Smcpowers  if(!mp || radix < 2 || radix > MAX_RADIX)
*5697Smcpowers    return 0;
*5697Smcpowers
*5697Smcpowers  bits = USED(mp) * DIGIT_BIT - 1;
*5697Smcpowers
*5697Smcpowers  return s_mp_outlen(bits, radix);
*5697Smcpowers
*5697Smcpowers} /* end mp_radix_size() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_toradix(mp, str, radix) */
*5697Smcpowers
*5697Smcpowersmp_err mp_toradix(mp_int *mp, char *str, int radix)
*5697Smcpowers{
*5697Smcpowers  int  ix, pos = 0;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL && str != NULL, MP_BADARG);
*5697Smcpowers  ARGCHK(radix > 1 && radix <= MAX_RADIX, MP_RANGE);
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(mp) == MP_EQ) {
*5697Smcpowers    str[0] = '0';
*5697Smcpowers    str[1] = '\0';
*5697Smcpowers  } else {
*5697Smcpowers    mp_err   res;
*5697Smcpowers    mp_int   tmp;
*5697Smcpowers    mp_sign  sgn;
*5697Smcpowers    mp_digit rem, rdx = (mp_digit)radix;
*5697Smcpowers    char     ch;
*5697Smcpowers
*5697Smcpowers    if((res = mp_init_copy(&tmp, mp)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    /* Save sign for later, and take absolute value */
*5697Smcpowers    sgn = SIGN(&tmp); SIGN(&tmp) = ZPOS;
*5697Smcpowers
*5697Smcpowers    /* Generate output digits in reverse order      */
*5697Smcpowers    while(mp_cmp_z(&tmp) != 0) {
*5697Smcpowers      if((res = mp_div_d(&tmp, rdx, &tmp, &rem)) != MP_OKAY) {
*5697Smcpowers	mp_clear(&tmp);
*5697Smcpowers	return res;
*5697Smcpowers      }
*5697Smcpowers
*5697Smcpowers      /* Generate digits, use capital letters */
*5697Smcpowers      ch = s_mp_todigit(rem, radix, 0);
*5697Smcpowers
*5697Smcpowers      str[pos++] = ch;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    /* Add - sign if original value was negative */
*5697Smcpowers    if(sgn == NEG)
*5697Smcpowers      str[pos++] = '-';
*5697Smcpowers
*5697Smcpowers    /* Add trailing NUL to end the string        */
*5697Smcpowers    str[pos--] = '\0';
*5697Smcpowers
*5697Smcpowers    /* Reverse the digits and sign indicator     */
*5697Smcpowers    ix = 0;
*5697Smcpowers    while(ix < pos) {
*5697Smcpowers      char tmp = str[ix];
*5697Smcpowers
*5697Smcpowers      str[ix] = str[pos];
*5697Smcpowers      str[pos] = tmp;
*5697Smcpowers      ++ix;
*5697Smcpowers      --pos;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    mp_clear(&tmp);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end mp_toradix() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_tovalue(ch, r) */
*5697Smcpowers
/* Public wrapper: returns whatever s_mp_tovalue() yields for character
   ch in radix r. */
int    mp_tovalue(char ch, int r)
{
  int  value = s_mp_tovalue(ch, r);

  return value;

} /* end mp_tovalue() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_strerror(ec) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  mp_strerror(ec)
*5697Smcpowers
*5697Smcpowers  Return a string describing the meaning of error code 'ec'.  The
*5697Smcpowers  string returned is allocated in static memory, so the caller should
*5697Smcpowers  not attempt to modify or free the memory associated with this
*5697Smcpowers  string.
*5697Smcpowers */
*5697Smcpowersconst char  *mp_strerror(mp_err ec)
*5697Smcpowers{
*5697Smcpowers  int   aec = (ec < 0) ? -ec : ec;
*5697Smcpowers
*5697Smcpowers  /* Code values are negative, so the senses of these comparisons
*5697Smcpowers     are accurate */
*5697Smcpowers  if(ec < MP_LAST_CODE || ec > MP_OKAY) {
*5697Smcpowers    return mp_err_string[0];  /* unknown error code */
*5697Smcpowers  } else {
*5697Smcpowers    return mp_err_string[aec + 1];
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers} /* end mp_strerror() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*========================================================================*/
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* Static function definitions (internal use only)                        */
*5697Smcpowers
*5697Smcpowers/* {{{ Memory management */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_grow(mp, min) */
*5697Smcpowers
*5697Smcpowers/* Make sure there are at least 'min' digits allocated to mp              */
*5697Smcpowersmp_err   s_mp_grow(mp_int *mp, mp_size min)
*5697Smcpowers{
*5697Smcpowers  if(min > ALLOC(mp)) {
*5697Smcpowers    mp_digit   *tmp;
*5697Smcpowers
*5697Smcpowers    /* Set min to next nearest default precision block size */
*5697Smcpowers    min = MP_ROUNDUP(min, s_mp_defprec);
*5697Smcpowers
*5697Smcpowers    if((tmp = s_mp_alloc(min, sizeof(mp_digit), FLAG(mp))) == NULL)
*5697Smcpowers      return MP_MEM;
*5697Smcpowers
*5697Smcpowers    s_mp_copy(DIGITS(mp), tmp, USED(mp));
*5697Smcpowers
*5697Smcpowers#if MP_CRYPTO
*5697Smcpowers    s_mp_setz(DIGITS(mp), ALLOC(mp));
*5697Smcpowers#endif
*5697Smcpowers    s_mp_free(DIGITS(mp), ALLOC(mp));
*5697Smcpowers    DIGITS(mp) = tmp;
*5697Smcpowers    ALLOC(mp) = min;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_grow() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_pad(mp, min) */
*5697Smcpowers
*5697Smcpowers/* Make sure the used size of mp is at least 'min', growing if needed     */
*5697Smcpowersmp_err   s_mp_pad(mp_int *mp, mp_size min)
*5697Smcpowers{
*5697Smcpowers  if(min > USED(mp)) {
*5697Smcpowers    mp_err  res;
*5697Smcpowers
*5697Smcpowers    /* Make sure there is room to increase precision  */
*5697Smcpowers    if (min > ALLOC(mp)) {
*5697Smcpowers      if ((res = s_mp_grow(mp, min)) != MP_OKAY)
*5697Smcpowers	return res;
*5697Smcpowers    } else {
*5697Smcpowers      s_mp_setz(DIGITS(mp) + USED(mp), min - USED(mp));
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    /* Increase precision; should already be 0-filled */
*5697Smcpowers    USED(mp) = min;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_pad() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_setz(dp, count) */
*5697Smcpowers
*5697Smcpowers#if MP_MACRO == 0
*5697Smcpowers/* Set 'count' digits pointed to by dp to be zeroes                       */
*5697Smcpowersvoid s_mp_setz(mp_digit *dp, mp_size count)
*5697Smcpowers{
*5697Smcpowers#if MP_MEMSET == 0
*5697Smcpowers  int  ix;
*5697Smcpowers
*5697Smcpowers  for(ix = 0; ix < count; ix++)
*5697Smcpowers    dp[ix] = 0;
*5697Smcpowers#else
*5697Smcpowers  memset(dp, 0, count * sizeof(mp_digit));
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers} /* end s_mp_setz() */
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_copy(sp, dp, count) */
*5697Smcpowers
*5697Smcpowers#if MP_MACRO == 0
*5697Smcpowers/* Copy 'count' digits from sp to dp                                      */
*5697Smcpowersvoid s_mp_copy(const mp_digit *sp, mp_digit *dp, mp_size count)
*5697Smcpowers{
*5697Smcpowers#if MP_MEMCPY == 0
*5697Smcpowers  int  ix;
*5697Smcpowers
*5697Smcpowers  for(ix = 0; ix < count; ix++)
*5697Smcpowers    dp[ix] = sp[ix];
*5697Smcpowers#else
*5697Smcpowers  memcpy(dp, sp, count * sizeof(mp_digit));
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers} /* end s_mp_copy() */
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_alloc(nb, ni, kmflag) */
*5697Smcpowers
*5697Smcpowers#if MP_MACRO == 0
*5697Smcpowers/* Allocate ni records of nb bytes each, and return a pointer to that     */
*5697Smcpowersvoid    *s_mp_alloc(size_t nb, size_t ni, int kmflag)
*5697Smcpowers{
*5697Smcpowers  mp_int *mp;
*5697Smcpowers  ++mp_allocs;
*5697Smcpowers#ifdef _KERNEL
*5697Smcpowers  mp = kmem_zalloc(nb * ni, kmflag);
*5697Smcpowers  if (mp != NULL)
*5697Smcpowers    FLAG(mp) = kmflag;
*5697Smcpowers  return (mp);
*5697Smcpowers#else
*5697Smcpowers  return calloc(nb, ni);
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers} /* end s_mp_alloc() */
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_free(ptr) */
*5697Smcpowers
*5697Smcpowers#if MP_MACRO == 0
*5697Smcpowers/* Free the memory pointed to by ptr                                      */
*5697Smcpowersvoid     s_mp_free(void *ptr, mp_size alloc)
*5697Smcpowers{
*5697Smcpowers  if(ptr) {
*5697Smcpowers    ++mp_frees;
*5697Smcpowers#ifdef _KERNEL
*5697Smcpowers    kmem_free(ptr, alloc * sizeof (mp_digit));
*5697Smcpowers#else
*5697Smcpowers    free(ptr);
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers} /* end s_mp_free() */
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_clamp(mp) */
*5697Smcpowers
*5697Smcpowers#if MP_MACRO == 0
*5697Smcpowers/* Remove leading zeroes from the given value                             */
*5697Smcpowersvoid     s_mp_clamp(mp_int *mp)
*5697Smcpowers{
*5697Smcpowers  mp_size used = MP_USED(mp);
*5697Smcpowers  while (used > 1 && DIGIT(mp, used - 1) == 0)
*5697Smcpowers    --used;
*5697Smcpowers  MP_USED(mp) = used;
*5697Smcpowers} /* end s_mp_clamp() */
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_exch(a, b) */
*5697Smcpowers
*5697Smcpowers/* Exchange the data for a and b; (b, a) = (a, b)                         */
*5697Smcpowersvoid     s_mp_exch(mp_int *a, mp_int *b)
*5697Smcpowers{
*5697Smcpowers  mp_int   tmp;
*5697Smcpowers
*5697Smcpowers  tmp = *a;
*5697Smcpowers  *a = *b;
*5697Smcpowers  *b = tmp;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_exch() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ Arithmetic helpers */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_lshd(mp, p) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers   Shift mp leftward by p digits, growing if needed, and zero-filling
*5697Smcpowers   the in-shifted digits at the right end.  This is a convenient
*5697Smcpowers   alternative to multiplication by powers of the radix
*5697Smcpowers   The value of USED(mp) must already have been set to the value for
*5697Smcpowers   the shifted result.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err   s_mp_lshd(mp_int *mp, mp_size p)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers  mp_size pos;
*5697Smcpowers  int     ix;
*5697Smcpowers
*5697Smcpowers  if(p == 0)
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers
*5697Smcpowers  if (MP_USED(mp) == 1 && MP_DIGIT(mp, 0) == 0)
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers
*5697Smcpowers  if((res = s_mp_pad(mp, USED(mp) + p)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  pos = USED(mp) - 1;
*5697Smcpowers
*5697Smcpowers  /* Shift all the significant figures over as needed */
*5697Smcpowers  for(ix = pos - p; ix >= 0; ix--)
*5697Smcpowers    DIGIT(mp, ix + p) = DIGIT(mp, ix);
*5697Smcpowers
*5697Smcpowers  /* Fill the bottom digits with zeroes */
*5697Smcpowers  for(ix = 0; ix < p; ix++)
*5697Smcpowers    DIGIT(mp, ix) = 0;
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_lshd() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_mul_2d(mp, d) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Multiply the integer by 2^d, where d is a number of bits.  This
*5697Smcpowers  amounts to a bitwise shift of the value.
*5697Smcpowers */
*5697Smcpowersmp_err   s_mp_mul_2d(mp_int *mp, mp_digit d)
*5697Smcpowers{
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_digit dshift, bshift;
*5697Smcpowers  mp_digit mask;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL,  MP_BADARG);
*5697Smcpowers
*5697Smcpowers  dshift = d / MP_DIGIT_BIT;
*5697Smcpowers  bshift = d % MP_DIGIT_BIT;
*5697Smcpowers  /* bits to be shifted out of the top word */
*5697Smcpowers  mask   = ((mp_digit)~0 << (MP_DIGIT_BIT - bshift));
*5697Smcpowers  mask  &= MP_DIGIT(mp, MP_USED(mp) - 1);
*5697Smcpowers
*5697Smcpowers  if (MP_OKAY != (res = s_mp_pad(mp, MP_USED(mp) + dshift + (mask != 0) )))
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  if (dshift && MP_OKAY != (res = s_mp_lshd(mp, dshift)))
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  if (bshift) {
*5697Smcpowers    mp_digit *pa = MP_DIGITS(mp);
*5697Smcpowers    mp_digit *alim = pa + MP_USED(mp);
*5697Smcpowers    mp_digit  prev = 0;
*5697Smcpowers
*5697Smcpowers    for (pa += dshift; pa < alim; ) {
*5697Smcpowers      mp_digit x = *pa;
*5697Smcpowers      *pa++ = (x << bshift) | prev;
*5697Smcpowers      prev = x >> (DIGIT_BIT - bshift);
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  s_mp_clamp(mp);
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers} /* end s_mp_mul_2d() */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_rshd(mp, p) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers   Shift mp rightward by p digits.  Maintains the invariant that
*5697Smcpowers   digits above the precision are all zero.  Digits shifted off the
*5697Smcpowers   end are lost.  Cannot fail.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersvoid     s_mp_rshd(mp_int *mp, mp_size p)
*5697Smcpowers{
*5697Smcpowers  mp_size  ix;
*5697Smcpowers  mp_digit *src, *dst;
*5697Smcpowers
*5697Smcpowers  if(p == 0)
*5697Smcpowers    return;
*5697Smcpowers
*5697Smcpowers  /* Shortcut when all digits are to be shifted off */
*5697Smcpowers  if(p >= USED(mp)) {
*5697Smcpowers    s_mp_setz(DIGITS(mp), ALLOC(mp));
*5697Smcpowers    USED(mp) = 1;
*5697Smcpowers    SIGN(mp) = ZPOS;
*5697Smcpowers    return;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Shift all the significant figures over as needed */
*5697Smcpowers  dst = MP_DIGITS(mp);
*5697Smcpowers  src = dst + p;
*5697Smcpowers  for (ix = USED(mp) - p; ix > 0; ix--)
*5697Smcpowers    *dst++ = *src++;
*5697Smcpowers
*5697Smcpowers  MP_USED(mp) -= p;
*5697Smcpowers  /* Fill the top digits with zeroes */
*5697Smcpowers  while (p-- > 0)
*5697Smcpowers    *dst++ = 0;
*5697Smcpowers
*5697Smcpowers#if 0
*5697Smcpowers  /* Strip off any leading zeroes    */
*5697Smcpowers  s_mp_clamp(mp);
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers} /* end s_mp_rshd() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_div_2(mp) */
*5697Smcpowers
*5697Smcpowers/* Divide by two -- take advantage of radix properties to do it fast      */
*5697Smcpowersvoid     s_mp_div_2(mp_int *mp)
*5697Smcpowers{
*5697Smcpowers  s_mp_div_2d(mp, 1);
*5697Smcpowers
*5697Smcpowers} /* end s_mp_div_2() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_mul_2(mp) */
*5697Smcpowers
*5697Smcpowersmp_err s_mp_mul_2(mp_int *mp)
*5697Smcpowers{
*5697Smcpowers  mp_digit *pd;
*5697Smcpowers  int      ix, used;
*5697Smcpowers  mp_digit kin = 0;
*5697Smcpowers
*5697Smcpowers  /* Shift digits leftward by 1 bit */
*5697Smcpowers  used = MP_USED(mp);
*5697Smcpowers  pd = MP_DIGITS(mp);
*5697Smcpowers  for (ix = 0; ix < used; ix++) {
*5697Smcpowers    mp_digit d = *pd;
*5697Smcpowers    *pd++ = (d << 1) | kin;
*5697Smcpowers    kin = (d >> (DIGIT_BIT - 1));
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Deal with rollover from last digit */
*5697Smcpowers  if (kin) {
*5697Smcpowers    if (ix >= ALLOC(mp)) {
*5697Smcpowers      mp_err res;
*5697Smcpowers      if((res = s_mp_grow(mp, ALLOC(mp) + 1)) != MP_OKAY)
*5697Smcpowers	return res;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    DIGIT(mp, ix) = kin;
*5697Smcpowers    USED(mp) += 1;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_mul_2() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_mod_2d(mp, d) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Remainder the integer by 2^d, where d is a number of bits.  This
*5697Smcpowers  amounts to a bitwise AND of the value, and does not require the full
*5697Smcpowers  division code
*5697Smcpowers */
*5697Smcpowersvoid     s_mp_mod_2d(mp_int *mp, mp_digit d)
*5697Smcpowers{
*5697Smcpowers  mp_size  ndig = (d / DIGIT_BIT), nbit = (d % DIGIT_BIT);
*5697Smcpowers  mp_size  ix;
*5697Smcpowers  mp_digit dmask;
*5697Smcpowers
*5697Smcpowers  if(ndig >= USED(mp))
*5697Smcpowers    return;
*5697Smcpowers
*5697Smcpowers  /* Flush all the bits above 2^d in its digit */
*5697Smcpowers  dmask = ((mp_digit)1 << nbit) - 1;
*5697Smcpowers  DIGIT(mp, ndig) &= dmask;
*5697Smcpowers
*5697Smcpowers  /* Flush all digits above the one with 2^d in it */
*5697Smcpowers  for(ix = ndig + 1; ix < USED(mp); ix++)
*5697Smcpowers    DIGIT(mp, ix) = 0;
*5697Smcpowers
*5697Smcpowers  s_mp_clamp(mp);
*5697Smcpowers
*5697Smcpowers} /* end s_mp_mod_2d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_div_2d(mp, d) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Divide the integer by 2^d, where d is a number of bits.  This
*5697Smcpowers  amounts to a bitwise shift of the value, and does not require the
*5697Smcpowers  full division code (used in Barrett reduction, see below)
*5697Smcpowers */
*5697Smcpowersvoid     s_mp_div_2d(mp_int *mp, mp_digit d)
*5697Smcpowers{
*5697Smcpowers  int       ix;
*5697Smcpowers  mp_digit  save, next, mask;
*5697Smcpowers
*5697Smcpowers  s_mp_rshd(mp, d / DIGIT_BIT);
*5697Smcpowers  d %= DIGIT_BIT;
*5697Smcpowers  if (d) {
*5697Smcpowers    mask = ((mp_digit)1 << d) - 1;
*5697Smcpowers    save = 0;
*5697Smcpowers    for(ix = USED(mp) - 1; ix >= 0; ix--) {
*5697Smcpowers      next = DIGIT(mp, ix) & mask;
*5697Smcpowers      DIGIT(mp, ix) = (DIGIT(mp, ix) >> d) | (save << (DIGIT_BIT - d));
*5697Smcpowers      save = next;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers  s_mp_clamp(mp);
*5697Smcpowers
*5697Smcpowers} /* end s_mp_div_2d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_norm(a, b, *d) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  s_mp_norm(a, b, *d)
*5697Smcpowers
*5697Smcpowers  Normalize a and b for division, where b is the divisor.  In order
*5697Smcpowers  that we might make good guesses for quotient digits, we want the
*5697Smcpowers  leading digit of b to be at least half the radix, which we
*5697Smcpowers  accomplish by multiplying a and b by a power of 2.  The exponent
*5697Smcpowers  (shift count) is placed in *pd, so that the remainder can be shifted
*5697Smcpowers  back at the end of the division process.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err   s_mp_norm(mp_int *a, mp_int *b, mp_digit *pd)
*5697Smcpowers{
*5697Smcpowers  mp_digit  d;
*5697Smcpowers  mp_digit  mask;
*5697Smcpowers  mp_digit  b_msd;
*5697Smcpowers  mp_err    res    = MP_OKAY;
*5697Smcpowers
*5697Smcpowers  d = 0;
*5697Smcpowers  mask  = DIGIT_MAX & ~(DIGIT_MAX >> 1);	/* mask is msb of digit */
*5697Smcpowers  b_msd = DIGIT(b, USED(b) - 1);
*5697Smcpowers  while (!(b_msd & mask)) {
*5697Smcpowers    b_msd <<= 1;
*5697Smcpowers    ++d;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if (d) {
*5697Smcpowers    MP_CHECKOK( s_mp_mul_2d(a, d) );
*5697Smcpowers    MP_CHECKOK( s_mp_mul_2d(b, d) );
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  *pd = d;
*5697SmcpowersCLEANUP:
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_norm() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ Primitive digit arithmetic */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_add_d(mp, d) */
*5697Smcpowers
*5697Smcpowers/* Add d to |mp| in place                                                 */
*5697Smcpowersmp_err   s_mp_add_d(mp_int *mp, mp_digit d)    /* unsigned digit addition */
*5697Smcpowers{
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers  mp_word   w, k = 0;
*5697Smcpowers  mp_size   ix = 1;
*5697Smcpowers
*5697Smcpowers  w = (mp_word)DIGIT(mp, 0) + d;
*5697Smcpowers  DIGIT(mp, 0) = ACCUM(w);
*5697Smcpowers  k = CARRYOUT(w);
*5697Smcpowers
*5697Smcpowers  while(ix < USED(mp) && k) {
*5697Smcpowers    w = (mp_word)DIGIT(mp, ix) + k;
*5697Smcpowers    DIGIT(mp, ix) = ACCUM(w);
*5697Smcpowers    k = CARRYOUT(w);
*5697Smcpowers    ++ix;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  if(k != 0) {
*5697Smcpowers    mp_err  res;
*5697Smcpowers
*5697Smcpowers    if((res = s_mp_pad(mp, USED(mp) + 1)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    DIGIT(mp, ix) = (mp_digit)k;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers#else
*5697Smcpowers  mp_digit * pmp = MP_DIGITS(mp);
*5697Smcpowers  mp_digit sum, mp_i, carry = 0;
*5697Smcpowers  mp_err   res = MP_OKAY;
*5697Smcpowers  int used = (int)MP_USED(mp);
*5697Smcpowers
*5697Smcpowers  mp_i = *pmp;
*5697Smcpowers  *pmp++ = sum = d + mp_i;
*5697Smcpowers  carry = (sum < d);
*5697Smcpowers  while (carry && --used > 0) {
*5697Smcpowers    mp_i = *pmp;
*5697Smcpowers    *pmp++ = sum = carry + mp_i;
*5697Smcpowers    carry = !sum;
*5697Smcpowers  }
*5697Smcpowers  if (carry && !used) {
*5697Smcpowers    /* mp is growing */
*5697Smcpowers    used = MP_USED(mp);
*5697Smcpowers    MP_CHECKOK( s_mp_pad(mp, used + 1) );
*5697Smcpowers    MP_DIGIT(mp, used) = carry;
*5697Smcpowers  }
*5697SmcpowersCLEANUP:
*5697Smcpowers  return res;
*5697Smcpowers#endif
*5697Smcpowers} /* end s_mp_add_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_sub_d(mp, d) */
*5697Smcpowers
*5697Smcpowers/* Subtract d from |mp| in place, assumes |mp| > d                        */
*5697Smcpowersmp_err   s_mp_sub_d(mp_int *mp, mp_digit d)    /* unsigned digit subtract */
*5697Smcpowers{
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_SUB_WORD)
*5697Smcpowers  mp_word   w, b = 0;
*5697Smcpowers  mp_size   ix = 1;
*5697Smcpowers
*5697Smcpowers  /* Compute initial subtraction    */
*5697Smcpowers  w = (RADIX + (mp_word)DIGIT(mp, 0)) - d;
*5697Smcpowers  b = CARRYOUT(w) ? 0 : 1;
*5697Smcpowers  DIGIT(mp, 0) = ACCUM(w);
*5697Smcpowers
*5697Smcpowers  /* Propagate borrows leftward     */
*5697Smcpowers  while(b && ix < USED(mp)) {
*5697Smcpowers    w = (RADIX + (mp_word)DIGIT(mp, ix)) - b;
*5697Smcpowers    b = CARRYOUT(w) ? 0 : 1;
*5697Smcpowers    DIGIT(mp, ix) = ACCUM(w);
*5697Smcpowers    ++ix;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Remove leading zeroes          */
*5697Smcpowers  s_mp_clamp(mp);
*5697Smcpowers
*5697Smcpowers  /* If we have a borrow out, it's a violation of the input invariant */
*5697Smcpowers  if(b)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers  else
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers#else
*5697Smcpowers  mp_digit *pmp = MP_DIGITS(mp);
*5697Smcpowers  mp_digit mp_i, diff, borrow;
*5697Smcpowers  mp_size  used = MP_USED(mp);
*5697Smcpowers
*5697Smcpowers  mp_i = *pmp;
*5697Smcpowers  *pmp++ = diff = mp_i - d;
*5697Smcpowers  borrow = (diff > mp_i);
*5697Smcpowers  while (borrow && --used) {
*5697Smcpowers    mp_i = *pmp;
*5697Smcpowers    *pmp++ = diff = mp_i - borrow;
*5697Smcpowers    borrow = (diff > mp_i);
*5697Smcpowers  }
*5697Smcpowers  s_mp_clamp(mp);
*5697Smcpowers  return (borrow && !used) ? MP_RANGE : MP_OKAY;
*5697Smcpowers#endif
*5697Smcpowers} /* end s_mp_sub_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_mul_d(a, d) */
*5697Smcpowers
*5697Smcpowers/* Compute a = a * d, single digit multiplication                         */
*5697Smcpowersmp_err   s_mp_mul_d(mp_int *a, mp_digit d)
*5697Smcpowers{
*5697Smcpowers  mp_err  res;
*5697Smcpowers  mp_size used;
*5697Smcpowers  int     pow;
*5697Smcpowers
*5697Smcpowers  if (!d) {
*5697Smcpowers    mp_zero(a);
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers  }
*5697Smcpowers  if (d == 1)
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers  if (0 <= (pow = s_mp_ispow2d(d))) {
*5697Smcpowers    return s_mp_mul_2d(a, (mp_digit)pow);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  used = MP_USED(a);
*5697Smcpowers  MP_CHECKOK( s_mp_pad(a, used + 1) );
*5697Smcpowers
*5697Smcpowers  s_mpv_mul_d(MP_DIGITS(a), used, d, MP_DIGITS(a));
*5697Smcpowers
*5697Smcpowers  s_mp_clamp(a);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_mul_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_div_d(mp, d, r) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  s_mp_div_d(mp, d, r)
*5697Smcpowers
*5697Smcpowers  Compute the quotient mp = mp / d and remainder r = mp mod d, for a
*5697Smcpowers  single digit d.  If r is null, the remainder will be discarded.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err   s_mp_div_d(mp_int *mp, mp_digit d, mp_digit *r)
*5697Smcpowers{
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_DIV_WORD)
*5697Smcpowers  mp_word   w = 0, q;
*5697Smcpowers#else
*5697Smcpowers  mp_digit  w, q;
*5697Smcpowers#endif
*5697Smcpowers  int       ix;
*5697Smcpowers  mp_err    res;
*5697Smcpowers  mp_int    quot;
*5697Smcpowers  mp_int    rem;
*5697Smcpowers
*5697Smcpowers  if(d == 0)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers  if (d == 1) {
*5697Smcpowers    if (r)
*5697Smcpowers      *r = 0;
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers  }
*5697Smcpowers  /* could check for power of 2 here, but mp_div_d does that. */
*5697Smcpowers  if (MP_USED(mp) == 1) {
*5697Smcpowers    mp_digit n   = MP_DIGIT(mp,0);
*5697Smcpowers    mp_digit rem;
*5697Smcpowers
*5697Smcpowers    q   = n / d;
*5697Smcpowers    rem = n % d;
*5697Smcpowers    MP_DIGIT(mp,0) = q;
*5697Smcpowers    if (r)
*5697Smcpowers      *r = rem;
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  MP_DIGITS(&rem)  = 0;
*5697Smcpowers  MP_DIGITS(&quot) = 0;
*5697Smcpowers  /* Make room for the quotient */
*5697Smcpowers  MP_CHECKOK( mp_init_size(&quot, USED(mp), FLAG(mp)) );
*5697Smcpowers
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_DIV_WORD)
*5697Smcpowers  for(ix = USED(mp) - 1; ix >= 0; ix--) {
*5697Smcpowers    w = (w << DIGIT_BIT) | DIGIT(mp, ix);
*5697Smcpowers
*5697Smcpowers    if(w >= d) {
*5697Smcpowers      q = w / d;
*5697Smcpowers      w = w % d;
*5697Smcpowers    } else {
*5697Smcpowers      q = 0;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    s_mp_lshd(&quot, 1);
*5697Smcpowers    DIGIT(&quot, 0) = (mp_digit)q;
*5697Smcpowers  }
*5697Smcpowers#else
*5697Smcpowers  {
*5697Smcpowers    mp_digit p;
*5697Smcpowers#if !defined(MP_ASSEMBLY_DIV_2DX1D)
*5697Smcpowers    mp_digit norm;
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers    MP_CHECKOK( mp_init_copy(&rem, mp) );
*5697Smcpowers
*5697Smcpowers#if !defined(MP_ASSEMBLY_DIV_2DX1D)
*5697Smcpowers    MP_DIGIT(&quot, 0) = d;
*5697Smcpowers    MP_CHECKOK( s_mp_norm(&rem, &quot, &norm) );
*5697Smcpowers    if (norm)
*5697Smcpowers      d <<= norm;
*5697Smcpowers    MP_DIGIT(&quot, 0) = 0;
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers    p = 0;
*5697Smcpowers    for (ix = USED(&rem) - 1; ix >= 0; ix--) {
*5697Smcpowers      w = DIGIT(&rem, ix);
*5697Smcpowers
*5697Smcpowers      if (p) {
*5697Smcpowers        MP_CHECKOK( s_mpv_div_2dx1d(p, w, d, &q, &w) );
*5697Smcpowers      } else if (w >= d) {
*5697Smcpowers	q = w / d;
*5697Smcpowers	w = w % d;
*5697Smcpowers      } else {
*5697Smcpowers	q = 0;
*5697Smcpowers      }
*5697Smcpowers
*5697Smcpowers      MP_CHECKOK( s_mp_lshd(&quot, 1) );
*5697Smcpowers      DIGIT(&quot, 0) = q;
*5697Smcpowers      p = w;
*5697Smcpowers    }
*5697Smcpowers#if !defined(MP_ASSEMBLY_DIV_2DX1D)
*5697Smcpowers    if (norm)
*5697Smcpowers      w >>= norm;
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers  /* Deliver the remainder, if desired */
*5697Smcpowers  if(r)
*5697Smcpowers    *r = (mp_digit)w;
*5697Smcpowers
*5697Smcpowers  s_mp_clamp(&quot);
*5697Smcpowers  mp_exch(&quot, mp);
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&quot);
*5697Smcpowers  mp_clear(&rem);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers} /* end s_mp_div_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ Primitive full arithmetic */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_add(a, b) */
*5697Smcpowers
*5697Smcpowers/* Compute a = |a| + |b|                                                  */
*5697Smcpowersmp_err   s_mp_add(mp_int *a, const mp_int *b)  /* magnitude addition      */
*5697Smcpowers{
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers  mp_word   w = 0;
*5697Smcpowers#else
*5697Smcpowers  mp_digit  d, sum, carry = 0;
*5697Smcpowers#endif
*5697Smcpowers  mp_digit *pa, *pb;
*5697Smcpowers  mp_size   ix;
*5697Smcpowers  mp_size   used;
*5697Smcpowers  mp_err    res;
*5697Smcpowers
*5697Smcpowers  /* Make sure a has enough precision for the output value */
*5697Smcpowers  if((USED(b) > USED(a)) && (res = s_mp_pad(a, USED(b))) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  /*
*5697Smcpowers    Add up all digits up to the precision of b.  If b had initially
*5697Smcpowers    the same precision as a, or greater, we took care of it by the
*5697Smcpowers    padding step above, so there is no problem.  If b had initially
*5697Smcpowers    less precision, we'll have to make sure the carry out is duly
*5697Smcpowers    propagated upward among the higher-order digits of the sum.
*5697Smcpowers   */
*5697Smcpowers  pa = MP_DIGITS(a);
*5697Smcpowers  pb = MP_DIGITS(b);
*5697Smcpowers  used = MP_USED(b);
*5697Smcpowers  for(ix = 0; ix < used; ix++) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers    w = w + *pa + *pb++;
*5697Smcpowers    *pa++ = ACCUM(w);
*5697Smcpowers    w = CARRYOUT(w);
*5697Smcpowers#else
*5697Smcpowers    d = *pa;
*5697Smcpowers    sum = d + *pb++;
*5697Smcpowers    d = (sum < d);			/* detect overflow */
*5697Smcpowers    *pa++ = sum += carry;
*5697Smcpowers    carry = d + (sum < carry);		/* detect overflow */
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* If we run out of 'b' digits before we're actually done, make
*5697Smcpowers     sure the carries get propagated upward...
*5697Smcpowers   */
*5697Smcpowers  used = MP_USED(a);
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers  while (w && ix < used) {
*5697Smcpowers    w = w + *pa;
*5697Smcpowers    *pa++ = ACCUM(w);
*5697Smcpowers    w = CARRYOUT(w);
*5697Smcpowers    ++ix;
*5697Smcpowers  }
*5697Smcpowers#else
*5697Smcpowers  while (carry && ix < used) {
*5697Smcpowers    sum = carry + *pa;
*5697Smcpowers    *pa++ = sum;
*5697Smcpowers    carry = !sum;
*5697Smcpowers    ++ix;
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers  /* If there's an overall carry out, increase precision and include
*5697Smcpowers     it.  We could have done this initially, but why touch the memory
*5697Smcpowers     allocator unless we're sure we have to?
*5697Smcpowers   */
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers  if (w) {
*5697Smcpowers    if((res = s_mp_pad(a, used + 1)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    DIGIT(a, ix) = (mp_digit)w;
*5697Smcpowers  }
*5697Smcpowers#else
*5697Smcpowers  if (carry) {
*5697Smcpowers    if((res = s_mp_pad(a, used + 1)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    DIGIT(a, used) = carry;
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers} /* end s_mp_add() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* Compute c = |a| + |b|         */ /* magnitude addition      */
*5697Smcpowersmp_err   s_mp_add_3arg(const mp_int *a, const mp_int *b, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_digit *pa, *pb, *pc;
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers  mp_word   w = 0;
*5697Smcpowers#else
*5697Smcpowers  mp_digit  sum, carry = 0, d;
*5697Smcpowers#endif
*5697Smcpowers  mp_size   ix;
*5697Smcpowers  mp_size   used;
*5697Smcpowers  mp_err    res;
*5697Smcpowers
*5697Smcpowers  MP_SIGN(c) = MP_SIGN(a);
*5697Smcpowers  if (MP_USED(a) < MP_USED(b)) {
*5697Smcpowers    const mp_int *xch = a;
*5697Smcpowers    a = b;
*5697Smcpowers    b = xch;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Make sure a has enough precision for the output value */
*5697Smcpowers  if (MP_OKAY != (res = s_mp_pad(c, MP_USED(a))))
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  /*
*5697Smcpowers    Add up all digits up to the precision of b.  If b had initially
*5697Smcpowers    the same precision as a, or greater, we took care of it by the
*5697Smcpowers    exchange step above, so there is no problem.  If b had initially
*5697Smcpowers    less precision, we'll have to make sure the carry out is duly
*5697Smcpowers    propagated upward among the higher-order digits of the sum.
*5697Smcpowers   */
*5697Smcpowers  pa = MP_DIGITS(a);
*5697Smcpowers  pb = MP_DIGITS(b);
*5697Smcpowers  pc = MP_DIGITS(c);
*5697Smcpowers  used = MP_USED(b);
*5697Smcpowers  for (ix = 0; ix < used; ix++) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers    w = w + *pa++ + *pb++;
*5697Smcpowers    *pc++ = ACCUM(w);
*5697Smcpowers    w = CARRYOUT(w);
*5697Smcpowers#else
*5697Smcpowers    d = *pa++;
*5697Smcpowers    sum = d + *pb++;
*5697Smcpowers    d = (sum < d);			/* detect overflow */
*5697Smcpowers    *pc++ = sum += carry;
*5697Smcpowers    carry = d + (sum < carry);		/* detect overflow */
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* If we run out of 'b' digits before we're actually done, make
*5697Smcpowers     sure the carries get propagated upward...
*5697Smcpowers   */
*5697Smcpowers  for (used = MP_USED(a); ix < used; ++ix) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers    w = w + *pa++;
*5697Smcpowers    *pc++ = ACCUM(w);
*5697Smcpowers    w = CARRYOUT(w);
*5697Smcpowers#else
*5697Smcpowers    *pc++ = sum = carry + *pa++;
*5697Smcpowers    carry = (sum < carry);
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* If there's an overall carry out, increase precision and include
*5697Smcpowers     it.  We could have done this initially, but why touch the memory
*5697Smcpowers     allocator unless we're sure we have to?
*5697Smcpowers   */
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers  if (w) {
*5697Smcpowers    if((res = s_mp_pad(c, used + 1)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    DIGIT(c, used) = (mp_digit)w;
*5697Smcpowers    ++used;
*5697Smcpowers  }
*5697Smcpowers#else
*5697Smcpowers  if (carry) {
*5697Smcpowers    if((res = s_mp_pad(c, used + 1)) != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    DIGIT(c, used) = carry;
*5697Smcpowers    ++used;
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers  MP_USED(c) = used;
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers}
*5697Smcpowers/* {{{ s_mp_add_offset(a, b, offset) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Magnitude add with a digit shift:  a = |a| + |b| * RADIX**offset.
*5697Smcpowers
*5697Smcpowers  a is grown with s_mp_pad() when it is too short, and once more if a
*5697Smcpowers  carry falls off its top digit.  A failing s_mp_pad() result is
*5697Smcpowers  returned unchanged; otherwise a is clamped and MP_OKAY is returned.
*5697Smcpowers */
*5697Smcpowersmp_err   s_mp_add_offset(mp_int *a, mp_int *b, mp_size offset)
*5697Smcpowers{
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers  mp_word   acc, carry = 0;
*5697Smcpowers#else
*5697Smcpowers  mp_digit  a_i, s, c1, carry = 0;
*5697Smcpowers#endif
*5697Smcpowers  mp_size   src;     /* index into b                     */
*5697Smcpowers  mp_size   dst;     /* index into a (src + offset)      */
*5697Smcpowers  mp_size   need;    /* digits a must hold for the sum   */
*5697Smcpowers  mp_size   b_used;
*5697Smcpowers  mp_size   a_used;
*5697Smcpowers  mp_err    res;
*5697Smcpowers
*5697Smcpowers  /* Grow a so that every shifted digit of b has a partner digit */
*5697Smcpowers  need = MP_USED(b) + offset;
*5697Smcpowers  if (need > USED(a)) {
*5697Smcpowers    res = s_mp_pad(a, need);
*5697Smcpowers    if (res != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Phase 1: add each digit of b into a, starting at digit 'offset' */
*5697Smcpowers  b_used = USED(b);
*5697Smcpowers  dst = offset;
*5697Smcpowers  for (src = 0; src < b_used; ++src) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers    acc = (mp_word)DIGIT(a, dst) + DIGIT(b, src) + carry;
*5697Smcpowers    DIGIT(a, dst) = ACCUM(acc);
*5697Smcpowers    carry = CARRYOUT(acc);
*5697Smcpowers#else
*5697Smcpowers    a_i = MP_DIGIT(a, dst);
*5697Smcpowers    s = a_i + MP_DIGIT(b, src);
*5697Smcpowers    c1 = (s < a_i);              /* wrapped while adding b's digit   */
*5697Smcpowers    s += carry;
*5697Smcpowers    MP_DIGIT(a, dst) = s;
*5697Smcpowers    carry = c1 + (s < carry);    /* plus wrap from the incoming carry */
*5697Smcpowers#endif
*5697Smcpowers    ++dst;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Phase 2: b is exhausted; ripple any carry through the rest of a */
*5697Smcpowers  a_used = MP_USED(a);
*5697Smcpowers  while (carry && (dst < a_used)) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers    acc = (mp_word)DIGIT(a, dst) + carry;
*5697Smcpowers    DIGIT(a, dst) = ACCUM(acc);
*5697Smcpowers    carry = CARRYOUT(acc);
*5697Smcpowers#else
*5697Smcpowers    a_i = MP_DIGIT(a, dst);
*5697Smcpowers    s = a_i + carry;
*5697Smcpowers    MP_DIGIT(a, dst) = s;
*5697Smcpowers    carry = (s < a_i);
*5697Smcpowers#endif
*5697Smcpowers    ++dst;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Phase 3: a carry out of the top digit needs one more digit.  The
*5697Smcpowers     allocator is only touched here, when it is known to be needed.
*5697Smcpowers   */
*5697Smcpowers  if (carry) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_ADD_WORD)
*5697Smcpowers    res = s_mp_pad(a, USED(a) + 1);
*5697Smcpowers    if (res != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    DIGIT(a, dst) = (mp_digit)carry;
*5697Smcpowers#else
*5697Smcpowers    res = s_mp_pad(a, a_used + 1);
*5697Smcpowers    if (res != MP_OKAY)
*5697Smcpowers      return res;
*5697Smcpowers
*5697Smcpowers    DIGIT(a, a_used) = carry;
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers  s_mp_clamp(a);
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_add_offset() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_sub(a, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  In-place magnitude subtract:  a = |a| - |b|.  The caller must ensure
*5697Smcpowers  |a| >= |b|.  If a borrow is still pending after the last digit of a,
*5697Smcpowers  the (wrapped) digits have already been stored and MP_RANGE is
*5697Smcpowers  returned; otherwise MP_OKAY.
*5697Smcpowers */
*5697Smcpowersmp_err   s_mp_sub(mp_int *a, const mp_int *b)  /* magnitude subtract      */
*5697Smcpowers{
*5697Smcpowers  mp_digit *pa, *pb, *b_end, *a_end;
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_SUB_WORD)
*5697Smcpowers  mp_sword  w = 0;
*5697Smcpowers#else
*5697Smcpowers  mp_digit  a_i, diff, out, borrow = 0;
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers  pa = MP_DIGITS(a);
*5697Smcpowers  pb = MP_DIGITS(b);
*5697Smcpowers  b_end = pb + MP_USED(b);
*5697Smcpowers
*5697Smcpowers  /* Digits covered by b: subtract b's digit and the running borrow.
*5697Smcpowers     b is never padded out to a's length; the second loop below only
*5697Smcpowers     has to carry the borrow upward.
*5697Smcpowers   */
*5697Smcpowers  for (; pb < b_end; ++pa, ++pb) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_SUB_WORD)
*5697Smcpowers    w = w + *pa - *pb;
*5697Smcpowers    *pa = ACCUM(w);
*5697Smcpowers    w >>= MP_DIGIT_BIT;
*5697Smcpowers#else
*5697Smcpowers    a_i = *pa;
*5697Smcpowers    diff = a_i - *pb;
*5697Smcpowers    out = (diff > a_i);          /* wrapped => borrow from next digit */
*5697Smcpowers    if (borrow) {
*5697Smcpowers      --diff;
*5697Smcpowers      if (diff == MP_DIGIT_MAX)  /* the incoming borrow wrapped too   */
*5697Smcpowers        ++out;
*5697Smcpowers    }
*5697Smcpowers    *pa = diff;
*5697Smcpowers    borrow = out;
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Remaining digits of a: only the borrow is left to propagate */
*5697Smcpowers  a_end = MP_DIGITS(a) + MP_USED(a);
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_SUB_WORD)
*5697Smcpowers  for (; w && pa < a_end; ++pa) {
*5697Smcpowers    w = w + *pa;
*5697Smcpowers    *pa = ACCUM(w);
*5697Smcpowers    w >>= MP_DIGIT_BIT;
*5697Smcpowers  }
*5697Smcpowers#else
*5697Smcpowers  for (; borrow && pa < a_end; ++pa) {
*5697Smcpowers    a_i = *pa;
*5697Smcpowers    diff = a_i - borrow;
*5697Smcpowers    *pa = diff;
*5697Smcpowers    borrow = (diff > a_i);
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers  /* Drop leading zero digits produced by the subtraction */
*5697Smcpowers  s_mp_clamp(a);
*5697Smcpowers
*5697Smcpowers  /* A borrow that survives means |b| > |a|: report the broken
*5697Smcpowers     precondition even though the digits were already written.
*5697Smcpowers   */
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_SUB_WORD)
*5697Smcpowers  if (w)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers#else
*5697Smcpowers  if (borrow)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers#endif
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers} /* end s_mp_sub() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Three-operand magnitude subtract:  c = |a| - |b|, for |a| >= |b|.
*5697Smcpowers  c receives a's sign and is padded to a's digit count before the
*5697Smcpowers  digits are written.  Returns the s_mp_pad() error if padding fails,
*5697Smcpowers  MP_RANGE if a borrow is left over (i.e. |b| > |a|), else MP_OKAY.
*5697Smcpowers */
*5697Smcpowersmp_err   s_mp_sub_3arg(const mp_int *a, const mp_int *b, mp_int *c)
*5697Smcpowers{
*5697Smcpowers  mp_digit *pa, *pb, *pc;
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_SUB_WORD)
*5697Smcpowers  mp_sword  w = 0;
*5697Smcpowers#else
*5697Smcpowers  mp_digit  a_i, diff, out, borrow = 0;
*5697Smcpowers#endif
*5697Smcpowers  int       i, b_len, a_len;
*5697Smcpowers  mp_err    res;
*5697Smcpowers
*5697Smcpowers  MP_SIGN(c) = MP_SIGN(a);
*5697Smcpowers
*5697Smcpowers  /* Make sure c has enough precision for the output value */
*5697Smcpowers  res = s_mp_pad(c, MP_USED(a));
*5697Smcpowers  if (res != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  /* Digit pointers are fetched only after the pad above */
*5697Smcpowers  pa = MP_DIGITS(a);
*5697Smcpowers  pb = MP_DIGITS(b);
*5697Smcpowers  pc = MP_DIGITS(c);
*5697Smcpowers
*5697Smcpowers  /* Digits covered by b: subtract b's digit and the running borrow */
*5697Smcpowers  b_len = MP_USED(b);
*5697Smcpowers  for (i = 0; i < b_len; ++i) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_SUB_WORD)
*5697Smcpowers    w = w + pa[i] - pb[i];
*5697Smcpowers    pc[i] = ACCUM(w);
*5697Smcpowers    w >>= MP_DIGIT_BIT;
*5697Smcpowers#else
*5697Smcpowers    a_i = pa[i];
*5697Smcpowers    diff = a_i - pb[i];
*5697Smcpowers    out = (diff > a_i);
*5697Smcpowers    if (borrow) {
*5697Smcpowers      --diff;
*5697Smcpowers      if (diff == MP_DIGIT_MAX)
*5697Smcpowers        ++out;
*5697Smcpowers    }
*5697Smcpowers    pc[i] = diff;
*5697Smcpowers    borrow = out;
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Remaining digits of a: copy across while applying the borrow */
*5697Smcpowers  a_len = MP_USED(a);
*5697Smcpowers  for (; i < a_len; ++i) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_SUB_WORD)
*5697Smcpowers    w = w + pa[i];
*5697Smcpowers    pc[i] = ACCUM(w);
*5697Smcpowers    w >>= MP_DIGIT_BIT;
*5697Smcpowers#else
*5697Smcpowers    a_i = pa[i];
*5697Smcpowers    diff = a_i - borrow;
*5697Smcpowers    pc[i] = diff;
*5697Smcpowers    borrow = (diff > a_i);
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Record how many digits were written, then trim leading zeroes */
*5697Smcpowers  MP_USED(c) = i;
*5697Smcpowers  s_mp_clamp(c);
*5697Smcpowers
*5697Smcpowers  /* A surviving borrow means |b| > |a|; the result is already stored,
*5697Smcpowers     so all that is left is to report it.
*5697Smcpowers   */
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_SUB_WORD)
*5697Smcpowers  if (w)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers#else
*5697Smcpowers  if (borrow)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers#endif
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers}
*5697Smcpowers/* {{{ s_mp_mul(a, b) */
*5697Smcpowers
*5697Smcpowers/* In-place multiply: forwards to mp_mul() with a as both the left     */
*5697Smcpowers/* operand and the destination, and returns mp_mul()'s status.         */
*5697Smcpowersmp_err   s_mp_mul(mp_int *a, const mp_int *b)
*5697Smcpowers{
*5697Smcpowers  mp_err res;
*5697Smcpowers
*5697Smcpowers  res = mp_mul(a, b, a);
*5697Smcpowers  return res;
*5697Smcpowers} /* end s_mp_mul() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers#if defined(MP_USE_UINT_DIGIT) && defined(MP_USE_LONG_LONG_MULTIPLY)
*5697Smcpowers/* This trick works on Sparc V8 CPUs with the Workshop compilers.
*5697Smcpowers *
*5697Smcpowers * MP_MUL_DxD(a, b, Phi, Plo) multiplies the digits a and b and stores
*5697Smcpowers * the high half of the double-width product in Phi and the low half in
*5697Smcpowers * Plo.  The arguments are substituted without parentheses, and the
*5697Smcpowers * portable variant expands a and b several times, so pass plain
*5697Smcpowers * variables.  Phi and Plo must be assignable mp_digit lvalues.
*5697Smcpowers *
*5697Smcpowers * This first variant forms the whole product in an unsigned long long
*5697Smcpowers * and splits it. */
*5697Smcpowers#define MP_MUL_DxD(a, b, Phi, Plo) \
*5697Smcpowers  { unsigned long long product = (unsigned long long)a * b; \
*5697Smcpowers    Plo = (mp_digit)product; \
*5697Smcpowers    Phi = (mp_digit)(product >> MP_DIGIT_BIT); }
*5697Smcpowers#elif defined(OSF1) /* two asm multiplies: mulq result -> Plo, umulh result -> Phi */
*5697Smcpowers#define MP_MUL_DxD(a, b, Phi, Plo) \
*5697Smcpowers  { Plo = asm ("mulq %a0, %a1, %v0", a, b);\
*5697Smcpowers    Phi = asm ("umulh %a0, %a1, %v0", a, b); }
*5697Smcpowers#else /* portable: combine four half-digit partial products, carrying by hand */
*5697Smcpowers#define MP_MUL_DxD(a, b, Phi, Plo) \
*5697Smcpowers  { mp_digit a0b1, a1b0; \
*5697Smcpowers    Plo = (a & MP_HALF_DIGIT_MAX) * (b & MP_HALF_DIGIT_MAX); \
*5697Smcpowers    Phi = (a >> MP_HALF_DIGIT_BIT) * (b >> MP_HALF_DIGIT_BIT); \
*5697Smcpowers    a0b1 = (a & MP_HALF_DIGIT_MAX) * (b >> MP_HALF_DIGIT_BIT); \
*5697Smcpowers    a1b0 = (a >> MP_HALF_DIGIT_BIT) * (b & MP_HALF_DIGIT_MAX); \
*5697Smcpowers    a1b0 += a0b1; \
*5697Smcpowers    Phi += a1b0 >> MP_HALF_DIGIT_BIT; \
*5697Smcpowers    if (a1b0 < a0b1)  \
*5697Smcpowers      Phi += MP_HALF_RADIX; \
*5697Smcpowers    a1b0 <<= MP_HALF_DIGIT_BIT; \
*5697Smcpowers    Plo += a1b0; \
*5697Smcpowers    if (Plo < a1b0) \
*5697Smcpowers      ++Phi; \
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers#if !defined(MP_ASSEMBLY_MULTIPLY)
*5697Smcpowers/*
*5697Smcpowers  Digit-vector times single digit:  c[0..a_len] = a[0..a_len-1] * b.
*5697Smcpowers  Writes a_len + 1 digits to c; the extra top digit is the final carry.
*5697Smcpowers */
*5697Smcpowersvoid s_mpv_mul_d(const mp_digit *a, mp_size a_len, mp_digit b, mp_digit *c)
*5697Smcpowers{
*5697Smcpowers  mp_digit carry = 0;
*5697Smcpowers  mp_size  i;
*5697Smcpowers
*5697Smcpowers  for (i = 0; i < a_len; ++i) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_MUL_WORD)
*5697Smcpowers    /* A double-width word holds digit * digit + carry */
*5697Smcpowers    mp_word w = ((mp_word)b * a[i]) + carry;
*5697Smcpowers    c[i] = ACCUM(w);
*5697Smcpowers    carry = CARRYOUT(w);
*5697Smcpowers#else
*5697Smcpowers    mp_digit a_i = a[i];
*5697Smcpowers    mp_digit lo, hi;
*5697Smcpowers
*5697Smcpowers    MP_MUL_DxD(a_i, b, hi, lo);
*5697Smcpowers
*5697Smcpowers    lo += carry;
*5697Smcpowers    if (lo < carry)     /* low half wrapped: bump the high half */
*5697Smcpowers      ++hi;
*5697Smcpowers    c[i] = lo;
*5697Smcpowers    carry = hi;
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers  c[a_len] = carry;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Multiply-accumulate:  c[0..a_len-1] += a[0..a_len-1] * b.
*5697Smcpowers  The final carry is stored into (not added to) c[a_len].
*5697Smcpowers */
*5697Smcpowersvoid s_mpv_mul_d_add(const mp_digit *a, mp_size a_len, mp_digit b,
*5697Smcpowers                     mp_digit *c)
*5697Smcpowers{
*5697Smcpowers  mp_digit carry = 0;
*5697Smcpowers  mp_size  i;
*5697Smcpowers
*5697Smcpowers  for (i = 0; i < a_len; ++i) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_MUL_WORD)
*5697Smcpowers    mp_word w = ((mp_word)b * a[i]) + c[i] + carry;
*5697Smcpowers    c[i] = ACCUM(w);
*5697Smcpowers    carry = CARRYOUT(w);
*5697Smcpowers#else
*5697Smcpowers    mp_digit a_i = a[i];
*5697Smcpowers    mp_digit c_i;
*5697Smcpowers    mp_digit lo, hi;
*5697Smcpowers
*5697Smcpowers    MP_MUL_DxD(a_i, b, hi, lo);
*5697Smcpowers
*5697Smcpowers    /* fold in the carry from the previous digit */
*5697Smcpowers    lo += carry;
*5697Smcpowers    if (lo < carry)
*5697Smcpowers      ++hi;
*5697Smcpowers    /* fold in the digit already present in c */
*5697Smcpowers    c_i = c[i];
*5697Smcpowers    lo += c_i;
*5697Smcpowers    if (lo < c_i)
*5697Smcpowers      ++hi;
*5697Smcpowers    c[i] = lo;
*5697Smcpowers    carry = hi;
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers  c[a_len] = carry;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* Presently, this is only used by the Montgomery arithmetic code. */
*5697Smcpowers/*
*5697Smcpowers  Multiply-accumulate with carry propagation:  c += a * b.
*5697Smcpowers  After the a_len digits are processed, the remaining carry is added
*5697Smcpowers  into c[a_len], c[a_len+1], ... until it dies out.  No upper bound on
*5697Smcpowers  c is checked here; the caller has to provide enough digits.
*5697Smcpowers */
*5697Smcpowersvoid s_mpv_mul_d_add_prop(const mp_digit *a, mp_size a_len, mp_digit b, mp_digit *c)
*5697Smcpowers{
*5697Smcpowers  mp_digit carry = 0;
*5697Smcpowers  mp_size  i;
*5697Smcpowers
*5697Smcpowers  for (i = 0; i < a_len; ++i) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_MUL_WORD)
*5697Smcpowers    mp_word w = ((mp_word)b * a[i]) + c[i] + carry;
*5697Smcpowers    c[i] = ACCUM(w);
*5697Smcpowers    carry = CARRYOUT(w);
*5697Smcpowers#else
*5697Smcpowers    mp_digit a_i = a[i];
*5697Smcpowers    mp_digit c_i;
*5697Smcpowers    mp_digit lo, hi;
*5697Smcpowers
*5697Smcpowers    MP_MUL_DxD(a_i, b, hi, lo);
*5697Smcpowers
*5697Smcpowers    lo += carry;
*5697Smcpowers    if (lo < carry)
*5697Smcpowers      ++hi;
*5697Smcpowers
*5697Smcpowers    c_i = c[i];
*5697Smcpowers    lo += c_i;
*5697Smcpowers    if (lo < c_i)
*5697Smcpowers      ++hi;
*5697Smcpowers
*5697Smcpowers    c[i] = lo;
*5697Smcpowers    carry = hi;
*5697Smcpowers#endif
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* i == a_len here: keep rippling the carry into higher digits of c */
*5697Smcpowers  while (carry) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_MUL_WORD)
*5697Smcpowers    mp_word w = (mp_word)c[i] + carry;
*5697Smcpowers    c[i] = ACCUM(w);
*5697Smcpowers    carry = CARRYOUT(w);
*5697Smcpowers#else
*5697Smcpowers    mp_digit c_i = c[i];
*5697Smcpowers    carry += c_i;
*5697Smcpowers    c[i] = carry;
*5697Smcpowers    carry = carry < c_i;
*5697Smcpowers#endif
*5697Smcpowers    ++i;
*5697Smcpowers  }
*5697Smcpowers}
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers#if defined(MP_USE_UINT_DIGIT) && defined(MP_USE_LONG_LONG_MULTIPLY)
*5697Smcpowers/* This trick works on Sparc V8 CPUs with the Workshop compilers.
*5697Smcpowers *
*5697Smcpowers * MP_SQR_D(a, Phi, Plo) squares the digit a and stores the high half of
*5697Smcpowers * the double-width result in Phi and the low half in Plo.  The argument
*5697Smcpowers * a is substituted without parentheses and expanded more than once, so
*5697Smcpowers * pass a plain variable.
*5697Smcpowers *
*5697Smcpowers * This first variant forms the square in an unsigned long long and
*5697Smcpowers * splits it. */
*5697Smcpowers#define MP_SQR_D(a, Phi, Plo) \
*5697Smcpowers  { unsigned long long square = (unsigned long long)a * a; \
*5697Smcpowers    Plo = (mp_digit)square; \
*5697Smcpowers    Phi = (mp_digit)(square >> MP_DIGIT_BIT); }
*5697Smcpowers#elif defined(OSF1) /* two asm multiplies: mulq result -> Plo, umulh result -> Phi */
*5697Smcpowers#define MP_SQR_D(a, Phi, Plo) \
*5697Smcpowers  { Plo = asm ("mulq  %a0, %a0, %v0", a);\
*5697Smcpowers    Phi = asm ("umulh %a0, %a0, %v0", a); }
*5697Smcpowers#else /* portable: lo*lo, hi*hi and the cross product lo*hi counted twice (shifts are off by one bit) */
*5697Smcpowers#define MP_SQR_D(a, Phi, Plo) \
*5697Smcpowers  { mp_digit Pmid; \
*5697Smcpowers    Plo  = (a  & MP_HALF_DIGIT_MAX) * (a  & MP_HALF_DIGIT_MAX); \
*5697Smcpowers    Phi  = (a >> MP_HALF_DIGIT_BIT) * (a >> MP_HALF_DIGIT_BIT); \
*5697Smcpowers    Pmid = (a  & MP_HALF_DIGIT_MAX) * (a >> MP_HALF_DIGIT_BIT); \
*5697Smcpowers    Phi += Pmid >> (MP_HALF_DIGIT_BIT - 1);  \
*5697Smcpowers    Pmid <<= (MP_HALF_DIGIT_BIT + 1);  \
*5697Smcpowers    Plo += Pmid;  \
*5697Smcpowers    if (Plo < Pmid)  \
*5697Smcpowers      ++Phi;  \
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers#if !defined(MP_ASSEMBLY_SQUARE)
*5697Smcpowers/* Add the squares of the digits of pa to the digits of ps.
*5697Smcpowers *
*5697Smcpowers * The square of pa[i] is added into the digit pair ps[2*i], ps[2*i+1],
*5697Smcpowers * with the carry chained from one pair to the next.  Whatever carry is
*5697Smcpowers * left after the a_len-th digit keeps rippling into higher digits of ps
*5697Smcpowers * until it is absorbed; no bound on ps is checked here, so the caller
*5697Smcpowers * has to provide room for it.
*5697Smcpowers *
*5697Smcpowers * NOTE: the ADD_SQUARE helper macro defined inside the word-based branch
*5697Smcpowers * is not #undef'd and so stays defined for the rest of the file. */
*5697Smcpowersvoid s_mpv_sqr_add_prop(const mp_digit *pa, mp_size a_len, mp_digit *ps)
*5697Smcpowers{
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_MUL_WORD)
*5697Smcpowers  mp_word  w;
*5697Smcpowers  mp_digit d;
*5697Smcpowers  mp_size  ix;
*5697Smcpowers
*5697Smcpowers  w  = 0; /* running carry between digit pairs */
*5697Smcpowers#define ADD_SQUARE(n) \
*5697Smcpowers    d = pa[n]; \
*5697Smcpowers    w += (d * (mp_word)d) + ps[2*n]; \
*5697Smcpowers    ps[2*n] = ACCUM(w); \
*5697Smcpowers    w = (w >> DIGIT_BIT) + ps[2*n+1]; \
*5697Smcpowers    ps[2*n+1] = ACCUM(w); \
*5697Smcpowers    w = (w >> DIGIT_BIT)
*5697Smcpowers
*5697Smcpowers  for (ix = a_len; ix >= 4; ix -= 4) { /* unrolled: four digits of pa per pass */
*5697Smcpowers    ADD_SQUARE(0);
*5697Smcpowers    ADD_SQUARE(1);
*5697Smcpowers    ADD_SQUARE(2);
*5697Smcpowers    ADD_SQUARE(3);
*5697Smcpowers    pa += 4;
*5697Smcpowers    ps += 8;
*5697Smcpowers  }
*5697Smcpowers  if (ix) { /* 1..3 digits left: step past them, then address them with negative indices */
*5697Smcpowers    ps += 2*ix;
*5697Smcpowers    pa += ix;
*5697Smcpowers    switch (ix) {
*5697Smcpowers    case 3: ADD_SQUARE(-3); /* FALLTHRU */
*5697Smcpowers    case 2: ADD_SQUARE(-2); /* FALLTHRU */
*5697Smcpowers    case 1: ADD_SQUARE(-1); /* FALLTHRU */
*5697Smcpowers    case 0: break;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers  while (w) { /* ps now points just past the last pair: ripple the leftover carry */
*5697Smcpowers    w += *ps;
*5697Smcpowers    *ps++ = ACCUM(w);
*5697Smcpowers    w = (w >> DIGIT_BIT);
*5697Smcpowers  }
*5697Smcpowers#else
*5697Smcpowers  mp_digit carry = 0;
*5697Smcpowers  while (a_len--) {
*5697Smcpowers    mp_digit a_i = *pa++;
*5697Smcpowers    mp_digit a0a0, a1a1;
*5697Smcpowers
*5697Smcpowers    MP_SQR_D(a_i, a1a1, a0a0);
*5697Smcpowers
*5697Smcpowers    /* here a1a1 and a0a0 constitute a_i ** 2 */
*5697Smcpowers    a0a0 += carry;
*5697Smcpowers    if (a0a0 < carry)
*5697Smcpowers      ++a1a1;
*5697Smcpowers
*5697Smcpowers    /* now add to ps */
*5697Smcpowers    a0a0 += a_i = *ps; /* a_i is reused as scratch for the current ps digit */
*5697Smcpowers    if (a0a0 < a_i)
*5697Smcpowers      ++a1a1;
*5697Smcpowers    *ps++ = a0a0;
*5697Smcpowers    a1a1 += a_i = *ps;
*5697Smcpowers    carry = (a1a1 < a_i); /* wrap of the high half becomes the next carry */
*5697Smcpowers    *ps++ = a1a1;
*5697Smcpowers  }
*5697Smcpowers  while (carry) { /* ripple the leftover carry into higher digits of ps */
*5697Smcpowers    mp_digit s_i = *ps;
*5697Smcpowers    carry += s_i;
*5697Smcpowers    *ps++ = carry;
*5697Smcpowers    carry = carry < s_i;
*5697Smcpowers  }
*5697Smcpowers#endif
*5697Smcpowers}
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers#if (defined(MP_NO_MP_WORD) || defined(MP_NO_DIV_WORD)) \
*5697Smcpowers&& !defined(MP_ASSEMBLY_DIV_2DX1D)
*5697Smcpowers/*
*5697Smcpowers** Divide 64-bit (Nhi,Nlo) by 32-bit divisor, which must be normalized
*5697Smcpowers** so its high bit is 1.   This code is from NSPR.
*5697Smcpowers**
*5697Smcpowers** In terms of this file's types: (Nhi,Nlo) is a two-digit dividend and
*5697Smcpowers** divisor a single mp_digit; the quotient is built in two half-digit
*5697Smcpowers** steps (q1, then q0).  The quotient is stored through qp and the
*5697Smcpowers** remainder through rp; either pointer may be NULL to skip that
*5697Smcpowers** output.  The function always returns MP_OKAY.
*5697Smcpowers**
*5697Smcpowers** A divisor whose upper half is zero makes d1 zero, and the "% d1" and
*5697Smcpowers** "/ d1" operations below would then divide by zero.
*5697Smcpowers*/
*5697Smcpowersmp_err s_mpv_div_2dx1d(mp_digit Nhi, mp_digit Nlo, mp_digit divisor,
*5697Smcpowers		       mp_digit *qp, mp_digit *rp)
*5697Smcpowers{
*5697Smcpowers    mp_digit d1, d0, q1, q0;
*5697Smcpowers    mp_digit r1, r0, m;
*5697Smcpowers
*5697Smcpowers    d1 = divisor >> MP_HALF_DIGIT_BIT; /* upper half of the divisor */
*5697Smcpowers    d0 = divisor & MP_HALF_DIGIT_MAX; /* lower half of the divisor */
*5697Smcpowers    r1 = Nhi % d1;
*5697Smcpowers    q1 = Nhi / d1; /* estimate of the upper quotient half, from d1 alone */
*5697Smcpowers    m = q1 * d0; /* part of q1 * divisor not yet accounted for */
*5697Smcpowers    r1 = (r1 << MP_HALF_DIGIT_BIT) | (Nlo >> MP_HALF_DIGIT_BIT);
*5697Smcpowers    if (r1 < m) { /* estimate too large: step q1 down, at most twice */
*5697Smcpowers        q1--, r1 += divisor;
*5697Smcpowers        if (r1 >= divisor && r1 < m) { /* r1 >= divisor: the addition above did not wrap */
*5697Smcpowers	    q1--, r1 += divisor;
*5697Smcpowers	}
*5697Smcpowers    }
*5697Smcpowers    r1 -= m;
*5697Smcpowers    r0 = r1 % d1;
*5697Smcpowers    q0 = r1 / d1; /* same estimate/correct step for the lower quotient half */
*5697Smcpowers    m = q0 * d0;
*5697Smcpowers    r0 = (r0 << MP_HALF_DIGIT_BIT) | (Nlo & MP_HALF_DIGIT_MAX);
*5697Smcpowers    if (r0 < m) {
*5697Smcpowers        q0--, r0 += divisor;
*5697Smcpowers        if (r0 >= divisor && r0 < m) {
*5697Smcpowers	    q0--, r0 += divisor;
*5697Smcpowers	}
*5697Smcpowers    }
*5697Smcpowers    if (qp)
*5697Smcpowers	*qp = (q1 << MP_HALF_DIGIT_BIT) | q0;
*5697Smcpowers    if (rp)
*5697Smcpowers	*rp = r0 - m;
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers}
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers#if MP_SQUARE
*5697Smcpowers/* {{{ s_mp_sqr(a) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  In-place square:  a = a * a.  The square is computed by mp_sqr() into
*5697Smcpowers  a scratch value sized for 2 * USED(a) digits and swapped into a only
*5697Smcpowers  on success, so a is left untouched when an error is returned.
*5697Smcpowers */
*5697Smcpowersmp_err   s_mp_sqr(mp_int *a)
*5697Smcpowers{
*5697Smcpowers  mp_int   scratch;
*5697Smcpowers  mp_err   res;
*5697Smcpowers
*5697Smcpowers  res = mp_init_size(&scratch, 2 * USED(a), FLAG(a));
*5697Smcpowers  if (res != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  res = mp_sqr(a, &scratch);
*5697Smcpowers  if (res == MP_OKAY)
*5697Smcpowers    s_mp_exch(&scratch, a);   /* a takes the result; scratch takes a's old storage */
*5697Smcpowers
*5697Smcpowers  /* Releases either the unused scratch or a's previous digits */
*5697Smcpowers  mp_clear(&scratch);
*5697Smcpowers  return res;
*5697Smcpowers}
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers#endif
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_div(a, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  s_mp_div(a, b)
*5697Smcpowers
*5697Smcpowers  Compute a = a / b and b = a mod b.  Assumes b > a.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err   s_mp_div(mp_int *rem, 	/* i: dividend, o: remainder */
*5697Smcpowers                  mp_int *div, 	/* i: divisor                */
*5697Smcpowers		  mp_int *quot)	/* i: 0;        o: quotient  */
*5697Smcpowers{
*5697Smcpowers  mp_int   part, t;
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_DIV_WORD)
*5697Smcpowers  mp_word  q_msd;
*5697Smcpowers#else
*5697Smcpowers  mp_digit q_msd;
*5697Smcpowers#endif
*5697Smcpowers  mp_err   res;
*5697Smcpowers  mp_digit d;
*5697Smcpowers  mp_digit div_msd;
*5697Smcpowers  int      ix;
*5697Smcpowers
*5697Smcpowers  if(mp_cmp_z(div) == 0)
*5697Smcpowers    return MP_RANGE;
*5697Smcpowers
*5697Smcpowers  /* Shortcut if divisor is power of two */
*5697Smcpowers  if((ix = s_mp_ispow2(div)) >= 0) {
*5697Smcpowers    MP_CHECKOK( mp_copy(rem, quot) );
*5697Smcpowers    s_mp_div_2d(quot, (mp_digit)ix);
*5697Smcpowers    s_mp_mod_2d(rem,  (mp_digit)ix);
*5697Smcpowers
*5697Smcpowers    return MP_OKAY;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  DIGITS(&t) = 0;
*5697Smcpowers  MP_SIGN(rem) = ZPOS;
*5697Smcpowers  MP_SIGN(div) = ZPOS;
*5697Smcpowers
*5697Smcpowers  /* A working temporary for division     */
*5697Smcpowers  MP_CHECKOK( mp_init_size(&t, MP_ALLOC(rem), FLAG(rem)));
*5697Smcpowers
*5697Smcpowers  /* Normalize to optimize guessing       */
*5697Smcpowers  MP_CHECKOK( s_mp_norm(rem, div, &d) );
*5697Smcpowers
*5697Smcpowers  part = *rem;
*5697Smcpowers
*5697Smcpowers  /* Perform the division itself...woo!   */
*5697Smcpowers  MP_USED(quot) = MP_ALLOC(quot);
*5697Smcpowers
*5697Smcpowers  /* Find a partial substring of rem which is at least div */
*5697Smcpowers  /* If we didn't find one, we're finished dividing    */
*5697Smcpowers  while (MP_USED(rem) > MP_USED(div) || s_mp_cmp(rem, div) >= 0) {
*5697Smcpowers    int i;
*5697Smcpowers    int unusedRem;
*5697Smcpowers
*5697Smcpowers    unusedRem = MP_USED(rem) - MP_USED(div);
*5697Smcpowers    MP_DIGITS(&part) = MP_DIGITS(rem) + unusedRem;
*5697Smcpowers    MP_ALLOC(&part)  = MP_ALLOC(rem)  - unusedRem;
*5697Smcpowers    MP_USED(&part)   = MP_USED(div);
*5697Smcpowers    if (s_mp_cmp(&part, div) < 0) {
*5697Smcpowers      -- unusedRem;
*5697Smcpowers#if MP_ARGCHK == 2
*5697Smcpowers      assert(unusedRem >= 0);
*5697Smcpowers#endif
*5697Smcpowers      -- MP_DIGITS(&part);
*5697Smcpowers      ++ MP_USED(&part);
*5697Smcpowers      ++ MP_ALLOC(&part);
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    /* Compute a guess for the next quotient digit       */
*5697Smcpowers    q_msd = MP_DIGIT(&part, MP_USED(&part) - 1);
*5697Smcpowers    div_msd = MP_DIGIT(div, MP_USED(div) - 1);
*5697Smcpowers    if (q_msd >= div_msd) {
*5697Smcpowers      q_msd = 1;
*5697Smcpowers    } else if (MP_USED(&part) > 1) {
*5697Smcpowers#if !defined(MP_NO_MP_WORD) && !defined(MP_NO_DIV_WORD)
*5697Smcpowers      q_msd = (q_msd << MP_DIGIT_BIT) | MP_DIGIT(&part, MP_USED(&part) - 2);
*5697Smcpowers      q_msd /= div_msd;
*5697Smcpowers      if (q_msd == RADIX)
*5697Smcpowers        --q_msd;
*5697Smcpowers#else
*5697Smcpowers      mp_digit r;
*5697Smcpowers      MP_CHECKOK( s_mpv_div_2dx1d(q_msd, MP_DIGIT(&part, MP_USED(&part) - 2),
*5697Smcpowers				  div_msd, &q_msd, &r) );
*5697Smcpowers#endif
*5697Smcpowers    } else {
*5697Smcpowers      q_msd = 0;
*5697Smcpowers    }
*5697Smcpowers#if MP_ARGCHK == 2
*5697Smcpowers    assert(q_msd > 0); /* This case should never occur any more. */
*5697Smcpowers#endif
*5697Smcpowers    if (q_msd <= 0)
*5697Smcpowers      break;
*5697Smcpowers
*5697Smcpowers    /* See what that multiplies out to                   */
*5697Smcpowers    mp_copy(div, &t);
*5697Smcpowers    MP_CHECKOK( s_mp_mul_d(&t, (mp_digit)q_msd) );
*5697Smcpowers
*5697Smcpowers    /*
*5697Smcpowers       If it's too big, back it off.  We should not have to do this
*5697Smcpowers       more than once, or, in rare cases, twice.  Knuth describes a
*5697Smcpowers       method by which this could be reduced to a maximum of once, but
*5697Smcpowers       I didn't implement that here.
*5697Smcpowers     * When using s_mpv_div_2dx1d, we may have to do this 3 times.
*5697Smcpowers     */
*5697Smcpowers    for (i = 4; s_mp_cmp(&t, &part) > 0 && i > 0; --i) {
*5697Smcpowers      --q_msd;
*5697Smcpowers      s_mp_sub(&t, div);	/* t -= div */
*5697Smcpowers    }
*5697Smcpowers    if (i < 0) {
*5697Smcpowers      res = MP_RANGE;
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers    }
*5697Smcpowers
*5697Smcpowers    /* At this point, q_msd should be the right next digit   */
*5697Smcpowers    MP_CHECKOK( s_mp_sub(&part, &t) );	/* part -= t */
*5697Smcpowers    s_mp_clamp(rem);
*5697Smcpowers
*5697Smcpowers    /*
*5697Smcpowers      Include the digit in the quotient.  We allocated enough memory
*5697Smcpowers      for any quotient we could ever possibly get, so we should not
*5697Smcpowers      have to check for failures here
*5697Smcpowers     */
*5697Smcpowers    MP_DIGIT(quot, unusedRem) = (mp_digit)q_msd;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Denormalize remainder                */
*5697Smcpowers  if (d) {
*5697Smcpowers    s_mp_div_2d(rem, d);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  s_mp_clamp(quot);
*5697Smcpowers
*5697SmcpowersCLEANUP:
*5697Smcpowers  mp_clear(&t);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_div() */
*5697Smcpowers
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_2expt(a, k) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Set a = 2**k: zero a, pad it to reach digit k / DIGIT_BIT, then set
*5697Smcpowers  bit k % DIGIT_BIT in that digit.  Returns the s_mp_pad() error if the
*5697Smcpowers  padding fails (a has already been zeroed then), else MP_OKAY.
*5697Smcpowers */
*5697Smcpowersmp_err   s_mp_2expt(mp_int *a, mp_digit k)
*5697Smcpowers{
*5697Smcpowers  mp_size   digit_ix = k / DIGIT_BIT;   /* which digit holds the bit   */
*5697Smcpowers  mp_size   bit_ix   = k % DIGIT_BIT;   /* position inside that digit  */
*5697Smcpowers  mp_err    res;
*5697Smcpowers
*5697Smcpowers  mp_zero(a);
*5697Smcpowers
*5697Smcpowers  res = s_mp_pad(a, digit_ix + 1);
*5697Smcpowers  if (res != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  DIGIT(a, digit_ix) |= ((mp_digit)1 << bit_ix);
*5697Smcpowers
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_2expt() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_reduce(x, m, mu) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Compute Barrett reduction, x (mod m), given a precomputed value for
*5697Smcpowers  mu = b^2k / m, where b = RADIX and k = #digits(m).  This should be
*5697Smcpowers  faster than straight division, when many reductions by the same
*5697Smcpowers  value of m are required (such as in modular exponentiation).  This
*5697Smcpowers  can nearly halve the time required to do modular exponentiation,
*5697Smcpowers  as compared to using the full integer divide to reduce.
*5697Smcpowers
*5697Smcpowers  This algorithm was derived from the _Handbook of Applied
*5697Smcpowers  Cryptography_ by Menezes, Oorschot and VanStone, Ch. 14,
*5697Smcpowers  pp. 603-604.
*5697Smcpowers
*5697Smcpowers  x is reduced in place.  Returns MP_OKAY on success, otherwise the
*5697Smcpowers  status of the first helper that failed (including the two
*5697Smcpowers  multiplications, which can fail and whose results are therefore
*5697Smcpowers  checked); x may then hold an intermediate value.  The temporary q is
*5697Smcpowers  released on every path after it has been created.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err   s_mp_reduce(mp_int *x, const mp_int *m, const mp_int *mu)
*5697Smcpowers{
*5697Smcpowers  mp_int   q;
*5697Smcpowers  mp_err   res;
*5697Smcpowers
*5697Smcpowers  if((res = mp_init_copy(&q, x)) != MP_OKAY)
*5697Smcpowers    return res;
*5697Smcpowers
*5697Smcpowers  s_mp_rshd(&q, USED(m) - 1);  /* q1 = x / b^(k-1)  */
*5697Smcpowers  if((res = s_mp_mul(&q, mu)) != MP_OKAY)  /* q2 = q1 * mu      */
*5697Smcpowers    goto CLEANUP;
*5697Smcpowers  s_mp_rshd(&q, USED(m) + 1);  /* q3 = q2 / b^(k+1) */
*5697Smcpowers
*5697Smcpowers  /* x = x mod b^(k+1), quick (no division) */
*5697Smcpowers  s_mp_mod_2d(x, DIGIT_BIT * (USED(m) + 1));
*5697Smcpowers
*5697Smcpowers  /* q = q * m mod b^(k+1), quick (no division) */
*5697Smcpowers  if((res = s_mp_mul(&q, m)) != MP_OKAY)
*5697Smcpowers    goto CLEANUP;
*5697Smcpowers  s_mp_mod_2d(&q, DIGIT_BIT * (USED(m) + 1));
*5697Smcpowers
*5697Smcpowers  /* x = x - q */
*5697Smcpowers  if((res = mp_sub(x, &q, x)) != MP_OKAY)
*5697Smcpowers    goto CLEANUP;
*5697Smcpowers
*5697Smcpowers  /* If x < 0, add b^(k+1) to it */
*5697Smcpowers  if(mp_cmp_z(x) < 0) {
*5697Smcpowers    mp_set(&q, 1);
*5697Smcpowers    if((res = s_mp_lshd(&q, USED(m) + 1)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers    if((res = mp_add(x, &q, x)) != MP_OKAY)
*5697Smcpowers      goto CLEANUP;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Back off if it's too big */
*5697Smcpowers  while(mp_cmp(x, m) >= 0) {
*5697Smcpowers    if((res = s_mp_sub(x, m)) != MP_OKAY)
*5697Smcpowers      break;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers CLEANUP:
*5697Smcpowers  mp_clear(&q);
*5697Smcpowers
*5697Smcpowers  return res;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_reduce() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ Primitive comparisons */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_cmp(a, b) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Magnitude compare of |a| and |b|.  Returns MP_GT, MP_LT or MP_EQ.
*5697Smcpowers  The operand with more used digits is the larger; with equal counts
*5697Smcpowers  the digits are compared from the most significant end downward.
*5697Smcpowers */
*5697Smcpowersint      s_mp_cmp(const mp_int *a, const mp_int *b)
*5697Smcpowers{
*5697Smcpowers  mp_size   len   = MP_USED(a);
*5697Smcpowers  mp_size   len_b = MP_USED(b);
*5697Smcpowers  mp_digit *pa, *pb;
*5697Smcpowers  mp_digit  da = 0, db = 0;
*5697Smcpowers
*5697Smcpowers  if (len > len_b)
*5697Smcpowers    return MP_GT;
*5697Smcpowers  if (len < len_b)
*5697Smcpowers    return MP_LT;
*5697Smcpowers
*5697Smcpowers#define CMP_AB(n) if ((da = pa[n]) != (db = pb[n])) goto done
*5697Smcpowers
*5697Smcpowers  /* Start one past the top digit and walk downward */
*5697Smcpowers  pa = MP_DIGITS(a) + len;
*5697Smcpowers  pb = MP_DIGITS(b) + len;
*5697Smcpowers
*5697Smcpowers  /* Four digits per pass, most significant first */
*5697Smcpowers  for (; len >= 4; ) {
*5697Smcpowers    pa  -= 4;
*5697Smcpowers    pb  -= 4;
*5697Smcpowers    len -= 4;
*5697Smcpowers    CMP_AB(3);
*5697Smcpowers    CMP_AB(2);
*5697Smcpowers    CMP_AB(1);
*5697Smcpowers    CMP_AB(0);
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Up to three digits left over */
*5697Smcpowers  while (len > 0) {
*5697Smcpowers    --len;
*5697Smcpowers    da = *--pa;
*5697Smcpowers    db = *--pb;
*5697Smcpowers    if (da != db)
*5697Smcpowers      break;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowersdone:
*5697Smcpowers  /* da/db hold the first differing pair, or an equal pair (or the
*5697Smcpowers     initial zeroes) when every digit matched
*5697Smcpowers   */
*5697Smcpowers  if (da > db)
*5697Smcpowers    return MP_GT;
*5697Smcpowers  if (da < db)
*5697Smcpowers    return MP_LT;
*5697Smcpowers  return MP_EQ;
*5697Smcpowers} /* end s_mp_cmp() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_cmp_d(a, d) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Compare |a| with the single digit d.  Returns MP_GT, MP_LT or MP_EQ.
*5697Smcpowers  Any a with more than one used digit is reported as greater; otherwise
*5697Smcpowers  only digit 0 of a is compared with d.
*5697Smcpowers */
*5697Smcpowersint      s_mp_cmp_d(const mp_int *a, mp_digit d)
*5697Smcpowers{
*5697Smcpowers  mp_digit low;
*5697Smcpowers
*5697Smcpowers  if (USED(a) > 1)
*5697Smcpowers    return MP_GT;
*5697Smcpowers
*5697Smcpowers  low = DIGIT(a, 0);
*5697Smcpowers  if (low == d)
*5697Smcpowers    return MP_EQ;
*5697Smcpowers
*5697Smcpowers  return (low < d) ? MP_LT : MP_GT;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_cmp_d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_ispow2(v) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  If v is an exact power of two, return k with v = 2^k; otherwise
*5697Smcpowers  return -1.  The most significant digit must itself be a power of two
*5697Smcpowers  (checked with s_mp_ispow2d) and every lower digit must be zero; each
*5697Smcpowers  zero digit adds MP_DIGIT_BIT to the exponent.
*5697Smcpowers */
*5697Smcpowersint      s_mp_ispow2(const mp_int *v)
*5697Smcpowers{
*5697Smcpowers  int      top   = MP_USED(v) - 1;                  /* index of the top digit */
*5697Smcpowers  int      power = s_mp_ispow2d(MP_DIGIT(v, top));  /* lg of the top digit    */
*5697Smcpowers  int      i;
*5697Smcpowers
*5697Smcpowers  if (power < 0 || top == 0)
*5697Smcpowers    return power;
*5697Smcpowers
*5697Smcpowers  for (i = top - 1; i >= 0; --i) {
*5697Smcpowers    if (DIGIT(v, i) != 0)
*5697Smcpowers      return -1; /* not a power of two */
*5697Smcpowers    power += MP_DIGIT_BIT;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  return power;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_ispow2() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_ispow2d(d) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Single-digit version of s_mp_ispow2: returns the bit index of the one
*5697Smcpowers  set bit when d is a power of two, -1 otherwise (including d == 0).
*5697Smcpowers  The index is assembled one binary place at a time: each mask selects
*5697Smcpowers  the bit positions whose index has that place set.
*5697Smcpowers */
*5697Smcpowersint      s_mp_ispow2d(mp_digit d)
*5697Smcpowers{
*5697Smcpowers  int shift = 0;
*5697Smcpowers
*5697Smcpowers  /* Zero, or more than one bit set: not a power of two */
*5697Smcpowers  if ((d == 0) || ((d & (d-1)) != 0))
*5697Smcpowers    return -1;
*5697Smcpowers
*5697Smcpowers#if defined (MP_USE_UINT_DIGIT)
*5697Smcpowers  if ((d & 0xffff0000U) != 0)
*5697Smcpowers    shift += 16;
*5697Smcpowers  if ((d & 0xff00ff00U) != 0)
*5697Smcpowers    shift += 8;
*5697Smcpowers  if ((d & 0xf0f0f0f0U) != 0)
*5697Smcpowers    shift += 4;
*5697Smcpowers  if ((d & 0xccccccccU) != 0)
*5697Smcpowers    shift += 2;
*5697Smcpowers  if ((d & 0xaaaaaaaaU) != 0)
*5697Smcpowers    shift += 1;
*5697Smcpowers#elif defined(MP_USE_LONG_LONG_DIGIT)
*5697Smcpowers  if ((d & 0xffffffff00000000ULL) != 0)
*5697Smcpowers    shift += 32;
*5697Smcpowers  if ((d & 0xffff0000ffff0000ULL) != 0)
*5697Smcpowers    shift += 16;
*5697Smcpowers  if ((d & 0xff00ff00ff00ff00ULL) != 0)
*5697Smcpowers    shift += 8;
*5697Smcpowers  if ((d & 0xf0f0f0f0f0f0f0f0ULL) != 0)
*5697Smcpowers    shift += 4;
*5697Smcpowers  if ((d & 0xccccccccccccccccULL) != 0)
*5697Smcpowers    shift += 2;
*5697Smcpowers  if ((d & 0xaaaaaaaaaaaaaaaaULL) != 0)
*5697Smcpowers    shift += 1;
*5697Smcpowers#elif defined(MP_USE_LONG_DIGIT)
*5697Smcpowers  if ((d & 0xffffffff00000000UL) != 0)
*5697Smcpowers    shift += 32;
*5697Smcpowers  if ((d & 0xffff0000ffff0000UL) != 0)
*5697Smcpowers    shift += 16;
*5697Smcpowers  if ((d & 0xff00ff00ff00ff00UL) != 0)
*5697Smcpowers    shift += 8;
*5697Smcpowers  if ((d & 0xf0f0f0f0f0f0f0f0UL) != 0)
*5697Smcpowers    shift += 4;
*5697Smcpowers  if ((d & 0xccccccccccccccccUL) != 0)
*5697Smcpowers    shift += 2;
*5697Smcpowers  if ((d & 0xaaaaaaaaaaaaaaaaUL) != 0)
*5697Smcpowers    shift += 1;
*5697Smcpowers#else
*5697Smcpowers#error "unknown type for mp_digit"
*5697Smcpowers#endif
*5697Smcpowers  return shift;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_ispow2d() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ Primitive I/O helpers */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_tovalue(ch, r) */
*5697Smcpowers
/*
  Convert the given character to its digit value, in the given radix.
  If the given character is not understood in the given radix, -1 is
  returned.  Otherwise the digit's numeric value is returned.

  Digits '0'-'9' map to 0-9 and upper-case letters to 10-35.  For
  radix <= 36 the character is folded to upper case first, so letters
  are case-insensitive; for larger radixes lower-case letters map to
  36-61, '+' to 62 and '/' to 63.

  The results will be odd if you use a radix < 2 or > 64, you are
  expected to know what you're up to.
 */
int      s_mp_tovalue(char ch, int r)
{
  int    val, xch;

  /* The <ctype.h> functions are only defined for values representable
     as unsigned char (or EOF).  Plain char may be signed, so convert
     first to keep high-bit bytes from becoming negative arguments. */
  xch = (unsigned char)ch;

  if(r <= 36)
    xch = toupper(xch);

  if(isdigit(xch))
    val = xch - '0';
  else if(isupper(xch))
    val = xch - 'A' + 10;
  else if(islower(xch))
    val = xch - 'a' + 36;
  else if(xch == '+')
    val = 62;
  else if(xch == '/')
    val = 63;
  else
    return -1;

  /* Reject characters that are digits in some radix but not in this one. */
  if(val < 0 || val >= r)
    return -1;

  return val;

} /* end s_mp_tovalue() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_todigit(val, r, low) */
*5697Smcpowers
*5697Smcpowers/*
*5697Smcpowers  Convert val to a radix-r digit, if possible.  If val is out of range
*5697Smcpowers  for r, returns zero.  Otherwise, returns an ASCII character denoting
*5697Smcpowers  the value in the given radix.
*5697Smcpowers
*5697Smcpowers  The results may be odd if you use a radix < 2 or > 64, you are
*5697Smcpowers  expected to know what you're doing.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowerschar     s_mp_todigit(mp_digit val, int r, int low)
*5697Smcpowers{
*5697Smcpowers  char   ch;
*5697Smcpowers
*5697Smcpowers  if(val >= r)
*5697Smcpowers    return 0;
*5697Smcpowers
*5697Smcpowers  ch = s_dmap_1[val];
*5697Smcpowers
*5697Smcpowers  if(r <= 36 && low)
*5697Smcpowers    ch = tolower(ch);
*5697Smcpowers
*5697Smcpowers  return ch;
*5697Smcpowers
*5697Smcpowers} /* end s_mp_todigit() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ s_mp_outlen(bits, radix) */
*5697Smcpowers
/*
   Estimate the buffer length needed for the radix-r text form of a
   number with 'bits' significant bits.  The result includes one extra
   character for a zero terminator (assuming C style strings here).
 */
int      s_mp_outlen(int bits, int r)
{
  /* Scale the bit count by LOG_V_2(r) and add 1.5 before truncating. */
  int ndigits = (int)((double)bits * LOG_V_2(r) + 1.5);

  return ndigits + 1;  /* room for the terminator */

} /* end s_mp_outlen() */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_read_unsigned_octets(mp, str, len) */
*5697Smcpowers/* mp_read_unsigned_octets(mp, str, len)
*5697Smcpowers   Read in a raw value (base 256) into the given mp_int
*5697Smcpowers   No sign bit, number is positive.  Leading zeros ignored.
*5697Smcpowers */
*5697Smcpowers
*5697Smcpowersmp_err
*5697Smcpowersmp_read_unsigned_octets(mp_int *mp, const unsigned char *str, mp_size len)
*5697Smcpowers{
*5697Smcpowers  int            count;
*5697Smcpowers  mp_err         res;
*5697Smcpowers  mp_digit       d;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL && str != NULL && len > 0, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  mp_zero(mp);
*5697Smcpowers
*5697Smcpowers  count = len % sizeof(mp_digit);
*5697Smcpowers  if (count) {
*5697Smcpowers    for (d = 0; count-- > 0; --len) {
*5697Smcpowers      d = (d << 8) | *str++;
*5697Smcpowers    }
*5697Smcpowers    MP_DIGIT(mp, 0) = d;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Read the rest of the digits */
*5697Smcpowers  for(; len > 0; len -= sizeof(mp_digit)) {
*5697Smcpowers    for (d = 0, count = sizeof(mp_digit); count > 0; --count) {
*5697Smcpowers      d = (d << 8) | *str++;
*5697Smcpowers    }
*5697Smcpowers    if (MP_EQ == mp_cmp_z(mp)) {
*5697Smcpowers      if (!d)
*5697Smcpowers	continue;
*5697Smcpowers    } else {
*5697Smcpowers      if((res = s_mp_lshd(mp, 1)) != MP_OKAY)
*5697Smcpowers	return res;
*5697Smcpowers    }
*5697Smcpowers    MP_DIGIT(mp, 0) = d;
*5697Smcpowers  }
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers} /* end mp_read_unsigned_octets() */
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_unsigned_octet_size(mp) */
*5697Smcpowersint
*5697Smcpowersmp_unsigned_octet_size(const mp_int *mp)
*5697Smcpowers{
*5697Smcpowers  int  bytes;
*5697Smcpowers  int  ix;
*5697Smcpowers  mp_digit  d = 0;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL, MP_BADARG);
*5697Smcpowers  ARGCHK(MP_ZPOS == SIGN(mp), MP_BADARG);
*5697Smcpowers
*5697Smcpowers  bytes = (USED(mp) * sizeof(mp_digit));
*5697Smcpowers
*5697Smcpowers  /* subtract leading zeros. */
*5697Smcpowers  /* Iterate over each digit... */
*5697Smcpowers  for(ix = USED(mp) - 1; ix >= 0; ix--) {
*5697Smcpowers    d = DIGIT(mp, ix);
*5697Smcpowers    if (d)
*5697Smcpowers	break;
*5697Smcpowers    bytes -= sizeof(d);
*5697Smcpowers  }
*5697Smcpowers  if (!bytes)
*5697Smcpowers    return 1;
*5697Smcpowers
*5697Smcpowers  /* Have MSD, check digit bytes, high order first */
*5697Smcpowers  for(ix = sizeof(mp_digit) - 1; ix >= 0; ix--) {
*5697Smcpowers    unsigned char x = (unsigned char)(d >> (ix * CHAR_BIT));
*5697Smcpowers    if (x)
*5697Smcpowers	break;
*5697Smcpowers    --bytes;
*5697Smcpowers  }
*5697Smcpowers  return bytes;
*5697Smcpowers} /* end mp_unsigned_octet_size() */
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_to_unsigned_octets(mp, str) */
*5697Smcpowers/* output a buffer of big endian octets no longer than specified. */
*5697Smcpowersmp_err
*5697Smcpowersmp_to_unsigned_octets(const mp_int *mp, unsigned char *str, mp_size maxlen)
*5697Smcpowers{
*5697Smcpowers  int  ix, pos = 0;
*5697Smcpowers  int  bytes;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL && str != NULL && !SIGN(mp), MP_BADARG);
*5697Smcpowers
*5697Smcpowers  bytes = mp_unsigned_octet_size(mp);
*5697Smcpowers  ARGCHK(bytes <= maxlen, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  /* Iterate over each digit... */
*5697Smcpowers  for(ix = USED(mp) - 1; ix >= 0; ix--) {
*5697Smcpowers    mp_digit  d = DIGIT(mp, ix);
*5697Smcpowers    int       jx;
*5697Smcpowers
*5697Smcpowers    /* Unpack digit bytes, high order first */
*5697Smcpowers    for(jx = sizeof(mp_digit) - 1; jx >= 0; jx--) {
*5697Smcpowers      unsigned char x = (unsigned char)(d >> (jx * CHAR_BIT));
*5697Smcpowers      if (!pos && !x)	/* suppress leading zeros */
*5697Smcpowers	continue;
*5697Smcpowers      str[pos++] = x;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers  if (!pos)
*5697Smcpowers    str[pos++] = 0;
*5697Smcpowers  return pos;
*5697Smcpowers} /* end mp_to_unsigned_octets() */
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_to_signed_octets(mp, str) */
*5697Smcpowers/* output a buffer of big endian octets no longer than specified. */
*5697Smcpowersmp_err
*5697Smcpowersmp_to_signed_octets(const mp_int *mp, unsigned char *str, mp_size maxlen)
*5697Smcpowers{
*5697Smcpowers  int  ix, pos = 0;
*5697Smcpowers  int  bytes;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL && str != NULL && !SIGN(mp), MP_BADARG);
*5697Smcpowers
*5697Smcpowers  bytes = mp_unsigned_octet_size(mp);
*5697Smcpowers  ARGCHK(bytes <= maxlen, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  /* Iterate over each digit... */
*5697Smcpowers  for(ix = USED(mp) - 1; ix >= 0; ix--) {
*5697Smcpowers    mp_digit  d = DIGIT(mp, ix);
*5697Smcpowers    int       jx;
*5697Smcpowers
*5697Smcpowers    /* Unpack digit bytes, high order first */
*5697Smcpowers    for(jx = sizeof(mp_digit) - 1; jx >= 0; jx--) {
*5697Smcpowers      unsigned char x = (unsigned char)(d >> (jx * CHAR_BIT));
*5697Smcpowers      if (!pos) {
*5697Smcpowers	if (!x)		/* suppress leading zeros */
*5697Smcpowers	  continue;
*5697Smcpowers	if (x & 0x80) { /* add one leading zero to make output positive.  */
*5697Smcpowers	  ARGCHK(bytes + 1 <= maxlen, MP_BADARG);
*5697Smcpowers	  if (bytes + 1 > maxlen)
*5697Smcpowers	    return MP_BADARG;
*5697Smcpowers	  str[pos++] = 0;
*5697Smcpowers	}
*5697Smcpowers      }
*5697Smcpowers      str[pos++] = x;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers  if (!pos)
*5697Smcpowers    str[pos++] = 0;
*5697Smcpowers  return pos;
*5697Smcpowers} /* end mp_to_signed_octets() */
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers/* {{{ mp_to_fixlen_octets(mp, str) */
*5697Smcpowers/* output a buffer of big endian octets exactly as long as requested. */
*5697Smcpowersmp_err
*5697Smcpowersmp_to_fixlen_octets(const mp_int *mp, unsigned char *str, mp_size length)
*5697Smcpowers{
*5697Smcpowers  int  ix, pos = 0;
*5697Smcpowers  int  bytes;
*5697Smcpowers
*5697Smcpowers  ARGCHK(mp != NULL && str != NULL && !SIGN(mp), MP_BADARG);
*5697Smcpowers
*5697Smcpowers  bytes = mp_unsigned_octet_size(mp);
*5697Smcpowers  ARGCHK(bytes <= length, MP_BADARG);
*5697Smcpowers
*5697Smcpowers  /* place any needed leading zeros */
*5697Smcpowers  for (;length > bytes; --length) {
*5697Smcpowers	*str++ = 0;
*5697Smcpowers  }
*5697Smcpowers
*5697Smcpowers  /* Iterate over each digit... */
*5697Smcpowers  for(ix = USED(mp) - 1; ix >= 0; ix--) {
*5697Smcpowers    mp_digit  d = DIGIT(mp, ix);
*5697Smcpowers    int       jx;
*5697Smcpowers
*5697Smcpowers    /* Unpack digit bytes, high order first */
*5697Smcpowers    for(jx = sizeof(mp_digit) - 1; jx >= 0; jx--) {
*5697Smcpowers      unsigned char x = (unsigned char)(d >> (jx * CHAR_BIT));
*5697Smcpowers      if (!pos && !x)	/* suppress leading zeros */
*5697Smcpowers	continue;
*5697Smcpowers      str[pos++] = x;
*5697Smcpowers    }
*5697Smcpowers  }
*5697Smcpowers  if (!pos)
*5697Smcpowers    str[pos++] = 0;
*5697Smcpowers  return MP_OKAY;
*5697Smcpowers} /* end mp_to_fixlen_octets() */
*5697Smcpowers/* }}} */
*5697Smcpowers
*5697Smcpowers
*5697Smcpowers/*------------------------------------------------------------------------*/
*5697Smcpowers/* HERE THERE BE DRAGONS                                                  */