[catacomb] / math / exp.h

/* -*-c-*-
 *
 * Generalized exponentiation
 *
 * (c) 2001 Straylight/Edgeware
 */

/*----- Licensing notice --------------------------------------------------*
 *
 * This file is part of Catacomb.
 *
 * Catacomb is free software; you can redistribute it and/or modify
 * it under the terms of the GNU Library General Public License as
 * published by the Free Software Foundation; either version 2 of the
 * License, or (at your option) any later version.
 *
 * Catacomb is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Library General Public License for more details.
 *
 * You should have received a copy of the GNU Library General Public
 * License along with Catacomb; if not, write to the Free
 * Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
 * MA 02111-1307, USA.
 */

#ifdef CATACOMB_EXP_H
#  error "Multiple inclusion of <catacomb/exp.h>"
#endif

#define CATACOMB_EXP_H

#ifdef __cplusplus
  extern "C" {
#endif

/*----- Header files ------------------------------------------------------*/

#include <stddef.h>

#include <mLib/alloc.h>

#ifndef CATACOMB_MP_H
#  include "mp.h"
#endif

/*----- Data structures ---------------------------------------------------*/

typedef struct exp_simulscan {
  mpw w;
  size_t len;
  const mpw *v;
} exp_simulscan;

typedef struct exp_simul {
  unsigned b;
  size_t o, n;
  exp_simulscan *s;
} exp_simul;

/*----- Macros provided ---------------------------------------------------*/

/* --- Parameters --- */

#ifndef EXP_WINSZ			/* Sliding window size */
#  define EXP_WINSZ 4			/* Predefine if you need to */
#endif

/* --- These are determined from the window size --- *
 *
 * Given a %$k$%-bit exponent, I expect to do %$k/2$% multiplies if I use the
 * simple way.  If I use an n-bit sliding window, then I do %$2^n$%
 * multiplies up front, but I only do %$(2^n - 1)/2^n k/n$% multiplies for
 * the exponentiation.  This is a win when
 *
 *   %$k \ge \frac{n 2^{n+1}}{n - 2}$%
 */

#define EXP_TABSZ (1 << EXP_WINSZ)
#define EXP_THRESH							\
    ((EXP_WINSZ * (2 << EXP_WINSZ))/((EXP_WINSZ - 2) * MPW_BITS))

/* --- Required operations --- *
 *
 * The macros here are independent of the underlying group elements.  You
 * must provide the necessary group operations and other definitions.  The
 * group operation is assumed to be written multiplicatively.
 *
 * @EXP_TYPE@			The type of a group element, e.g., @mp *@.
 *
 * @EXP_COPY(d, x)@		Makes @d@ be a copy of @x@.
 *
 * @EXP_DROP(x)@		Discards the element @x@, reclaiming any
 *				memory it used.
 *
 * @EXP_MUL(a, x)@		Multiplies @a@ by @x@ (writing the result
 *				back to @a@).
 *
 * @EXP_FIX(x)@			Makes @x@ be a canonical representation of
 *				its value.  All multiplications have the
 *				right argument canonical.
 *
 * @EXP_SQR(a)@			Multiplies @a@ by itself.
 *
 * @EXP_SETMUL(d, x, y)@	Sets @d@ to be the product of @x@ and @y@.
 *				The value @d@ has not been initialized.
 *
 * @EXP_SETSQR(d, x)@		Sets @d@ to be the square of @x@.
 *
 * Only @EXP_TYPE@, @EXP_MUL@ and @EXP_SQR@ are required for simple
 * exponentation.  Sliding window and simultaneous exponentation require all
 * of the operations.
 */

#ifndef EXP_TYPE
#  error "EXP_TYPE not defined for <catacomb/exp.h>"
#endif

/* --- @EXP_SIMPLE@ --- *
 *
 * Arguments:	@a@ = the result object, initially a multiplicative identity
 *		@g@ = the object to exponentiate
 *		@x@ = the exponent, as a multiprecision integer
 *
 * Use:		Performs a simple left-to-right exponentiation.  At the end
 *		of the code, the answer is left in @a@; @g@ and @x@ are
 *		unchanged.
 */

#define EXP_SIMPLE(a, g, x) do {					\
  mpscan sc;								\
  unsigned sq = 0;							\
									\
  /* --- Begin scanning --- */						\
									\
  mp_rscan(&sc, x);							\
  if (!MP_RSTEP(&sc))							\
    goto exp_simple_exit;						\
  while (!MP_RBIT(&sc))							\
    MP_RSTEP(&sc);							\
									\
  /* --- Do the main body of the work --- */				\
									\
  EXP_FIX(g);								\
  for (;;) {								\
    EXP_MUL(a, g);							\
    sq = 0;								\
    for (;;) {								\
      if (!MP_RSTEP(&sc))						\
	goto exp_simple_done;						\
      sq++;								\
      if (MP_RBIT(&sc))							\
	break;								\
    }									\
    while (sq--) EXP_SQR(a);						\
  }									\
									\
  /* --- Do a final round of squaring --- */				\
									\
exp_simple_done:							\
  while (sq--) EXP_SQR(a);						\
exp_simple_exit:;							\
} while (0)

/* --- @EXP_WINDOW@ --- *
 *
 * Arguments:	@a@ = the result object, initially a multiplicative identity
 *		@g@ = the object to exponentiate
 *		@x@ = the exponent, as a multiprecision integer
 *
 * Use:		Performs a sliding-window exponentiation.  At the end of the
 *		code, the answer is left in @a@; @g@ and @x@ are unchanged.
 */

#define EXP_WINDOW(a, g, x) do {					\
  EXP_TYPE *v;								\
  EXP_TYPE g2;								\
  unsigned i, sq = 0;							\
  mpscan sc;								\
									\
  /* --- Get going --- */						\
									\
  mp_rscan(&sc, x);							\
  if (!MP_RSTEP(&sc))							\
    goto exp_window_exit;						\
									\
  /* --- Do the precomputation --- */					\
									\
  EXP_FIX(g);								\
  EXP_SETSQR(g2, g);							\
  EXP_FIX(g2);								\
  v = xmalloc(EXP_TABSZ * sizeof(EXP_TYPE));				\
  EXP_COPY(v[0], g);							\
  for (i = 1; i < EXP_TABSZ; i++) {					\
    EXP_SETMUL(v[i], v[i - 1], g2);					\
    EXP_FIX(v[i]);							\
  }									\
  EXP_DROP(g2);								\
									\
  /* --- Skip top-end zero bits --- *					\
   *									\
   * If the initial step worked, there must be a set bit somewhere, so	\
   * keep stepping until I find it.					\
   */									\
									\
  while (!MP_RBIT(&sc))							\
    MP_RSTEP(&sc);							\
									\
  /* --- Now for the main work --- */					\
									\
  for (;;) {								\
    unsigned l = 1;							\
    unsigned z = 0;							\
									\
    /* --- The next bit is set, so read a window index --- *		\
     *									\
     * Reset @i@ to zero and increment @sq@.  Then, until either I read	\
     * @WINSZ@ bits or I run out of bits, scan in a bit: if it's clear,	\
     * bump the @z@ counter; if it's set, push a set bit into @i@,	\
     * shift it over by @z@ bits, bump @sq@ by @z + 1@ and clear @z@.	\
     * By the end of this palaver, @i@ is an index to the precomputed	\
     * value in @v@.							\
     */									\
									\
    i = 0;								\
    sq++;								\
    while (l < EXP_WINSZ && MP_RSTEP(&sc)) {				\
      l++;								\
      if (!MP_RBIT(&sc))						\
	z++;								\
      else {								\
	i = ((i << 1) | 1) << z;					\
	sq += z + 1;							\
	z = 0;								\
      }									\
    }									\
									\
    /* --- Do the squaring --- *					\
     *									\
     * Remember that @sq@ carries over from the zero-skipping stuff	\
     * below.								\
     */									\
									\
    while (sq--) EXP_SQR(a);						\
									\
    /* --- Do the multiply --- */					\
									\
    EXP_MUL(a, v[i]);							\
									\
    /* --- Now grind along through the rest of the bits --- */		\
									\
    sq = z;								\
    for (;;) {								\
      if (!MP_RSTEP(&sc))						\
	goto exp_window_done;						\
      if (MP_RBIT(&sc))							\
	break;								\
      sq++;								\
    }									\
  }									\
									\
  /* --- Do a final round of squaring --- */				\
									\
exp_window_done:							\
  while (sq--) EXP_SQR(a);						\
  for (i = 0; i < EXP_TABSZ; i++)					\
    EXP_DROP(v[i]);							\
  xfree(v);								\
exp_window_exit:;							\
} while (0)

/* --- @EXP_SIMUL@ --- *
 *
 * Arguments:	@a@ = the result object, initially a multiplicative identity
 *		@f@ = pointer to a vector of base/exp pairs
 *		@n@ = the number of base/exp pairs
 *
 * Use:		Performs a simultaneous sliding-window exponentiation.  The
 *		@f@ table is an array of structures containing members @base@
 *		of type @EXP_TYPE@, and @exp@ of type @mp *@.
 */

#define EXP_SIMUL(a, f, n) do {						\
  size_t i, j, jj, k;							\
  size_t vn = 1 << (EXP_WINSZ * n), m = (1 << n) - 1;			\
  EXP_TYPE *v = xmalloc(vn * sizeof(EXP_TYPE));				\
  exp_simul e;								\
  unsigned sq = 0;							\
									\
  /* --- Fill in the precomputed table --- */				\
									\
  j = 1;								\
  for (i = 0; i < n; i++) {						\
    EXP_COPY(v[j], f[n - 1 - i].base);					\
    EXP_FIX(v[j]);							\
    j <<= 1;								\
  }									\
  k = n * EXP_WINSZ;							\
  jj = 1;								\
  for (; i < k; i++) {							\
    EXP_SETSQR(v[j], v[jj]);						\
    EXP_FIX(v[j]);							\
    j <<= 1; jj <<= 1;							\
  }									\
  for (i = 1; i < vn; i <<= 1) {					\
    for (j = 1; j < i; j++) {						\
      EXP_SETMUL(v[j + i], v[j], v[i]);					\
      EXP_FIX(v[j + i]);						\
    }									\
  }									\
									\
  /* --- Set up the bitscanners --- *					\
   *									\
   * Got to use custom scanners, to keep them all in sync.		\
   */									\
									\
  e.n = n;								\
  e.b = 0;								\
  e.s = xmalloc(n * sizeof(*e.s));					\
  e.o = 0;								\
  for (i = 0; i < n; i++) {						\
    MP_SHRINK(f[i].exp);						\
    e.s[i].len = MP_LEN(f[i].exp);					\
    e.s[i].v = f[i].exp->v;						\
    if (e.s[i].len > e.o)						\
      e.o = e.s[i].len;							\
  }									\
									\
  /* --- Skip as far as a nonzero column in the exponent matrix --- */	\
									\
  do {									\
    if (!e.o && !e.b)							\
      goto exp_simul_done;						\
    i = exp_simulnext(&e, 0);						\
  } while (!(i & m));							\
									\
  /* --- Now for the main work --- */					\
									\
  for (;;) {								\
    unsigned l = 1;							\
    unsigned z = 0;							\
									\
    /* --- Just read a nonzero column, so read a window index --- *	\
     *									\
     * Clear high bits of @i@ and increment @sq@.  Then, until either I	\
     * read @WINSZ@ columns or I run out, scan in a column and append	\
     * it to @i@.  If it's zero, bump the @z@ counter; if it's nonzero,	\
     * bump @sq@ by @z + 1@ and clear @z@.  By the end of this palaver,	\
     * @i@ is an index to the precomputed value in @v@, followed by	\
     * @n * z@ zero bits.						\
     */									\
									\
    sq++;								\
    while (l < EXP_WINSZ && (e.o || e.b)) {				\
      l++;								\
      i = exp_simulnext(&e, i);						\
      if (!(i & m))							\
	z++;								\
      else {								\
	sq += z + 1;							\
	z = 0;								\
      }									\
    }									\
									\
    /* --- Do the squaring --- *					\
     *									\
     * Remember that @sq@ carries over from the zero-skipping stuff	\
     * below.								\
     */									\
									\
    while (sq--) EXP_SQR(a);						\
									\
    /* --- Do the multiply --- */					\
									\
    i >>= (z * n);							\
    EXP_MUL(a, v[i]);							\
									\
    /* --- Now grind along through the rest of the bits --- */		\
									\
    sq = z;								\
    for (;;) {								\
      if (!e.o && !e.b)							\
	goto exp_simul_done;						\
      if ((i = exp_simulnext(&e, 0)) != 0)				\
	break;								\
      sq++;								\
    }									\
  }									\
									\
  /* --- Do a final round of squaring --- */				\
									\
exp_simul_done:								\
  while (sq--) EXP_SQR(a);						\
  for (i = 1; i < vn; i++)						\
    EXP_DROP(v[i]);							\
  xfree(v);								\
  xfree(e.s);								\
} while (0)

/*----- Functions provided ------------------------------------------------*/

/* --- @exp_simulnext@ --- *
 *
 * Arguments:	@exp_simul *e@ = pointer to state structure
 *		@size_t x@ = a current accumulator
 *
 * Returns:	The next column of bits.
 *
 * Use:		Scans the next column of bits for a simultaneous
 *		exponentiation.
 */

extern size_t exp_simulnext(exp_simul */*e*/, size_t /*x*/);

/*----- That's all, folks -------------------------------------------------*/

#ifdef __cplusplus
  }
#endif
Commit	Line	Data
7765e926	1	/* --c--
7765e926	2	*
	3	* Generalized exponentiation
	4	*
	5	* (c) 2001 Straylight/Edgeware
	6	*/
	7
45c0fd36	8	/----- Licensing notice --------------------------------------------------
7765e926	9	*
	10	* This file is part of Catacomb.
	11	*
	12	* Catacomb is free software; you can redistribute it and/or modify
	13	* it under the terms of the GNU Library General Public License as
	14	* published by the Free Software Foundation; either version 2 of the
	15	* License, or (at your option) any later version.
45c0fd36	16	*
7765e926	17	* Catacomb is distributed in the hope that it will be useful,
	18	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	19	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	20	* GNU Library General Public License for more details.
45c0fd36	21	*
7765e926	22	* You should have received a copy of the GNU Library General Public
	23	* License along with Catacomb; if not, write to the Free
	24	* Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
	25	* MA 02111-1307, USA.
	26	*/
	27
7765e926	28	#ifdef CATACOMB_EXP_H
	29	# error "Multiple inclusion of <catacomb/exp.h>"
	30	#endif
	31
	32	#define CATACOMB_EXP_H
	33
	34	#ifdef __cplusplus
	35	extern "C" {
	36	#endif
	37
	38	/----- Header files ------------------------------------------------------/
	39
	40	#include <stddef.h>
	41
	42	#include <mLib/alloc.h>
	43
	44	#ifndef CATACOMB_MP_H
	45	# include "mp.h"
	46	#endif
	47
	48	/----- Data structures ---------------------------------------------------/
	49
	50	typedef struct exp_simulscan {
	51	mpw w;
	52	size_t len;
	53	const mpw *v;
45c0fd36	54	} exp_simulscan;
7765e926	55
	56	typedef struct exp_simul {
	57	unsigned b;
	58	size_t o, n;
	59	exp_simulscan *s;
	60	} exp_simul;
	61
	62	/----- Macros provided ---------------------------------------------------/
	63
	64	/* --- Parameters --- */
	65
	66	#ifndef EXP_WINSZ /* Sliding window size */
	67	# define EXP_WINSZ 4 /* Predefine if you need to */
	68	#endif
	69
391faf42	70	/* --- These are determined from the window size --- *
	71	*
	72	* Given a %$k$%-bit exponent, I expect to do %$k/2$% multiplies if I use the
	73	* simple way. If I use an n-bit sliding window, then I do %$2^n$%
	74	* multiplies up front, but I only do %$(2^n - 1)/2^n k/n$% multiplies for
	75	* the exponentiation. This is a win when
	76	*
	77	* %$k \ge \frac{n 2^{n+1}}{n - 2}$%
	78	*/
7765e926	79
7765e926	80	#define EXP_TABSZ (1 << EXP_WINSZ)
391faf42	81	#define EXP_THRESH \
391faf42	82	((EXP_WINSZ * (2 << EXP_WINSZ))/((EXP_WINSZ - 2) * MPW_BITS))
7765e926	83
	84	/* --- Required operations --- *
	85	*
	86	* The macros here are independent of the underlying group elements. You
	87	* must provide the necessary group operations and other definitions. The
	88	* group operation is assumed to be written multiplicatively.
	89	*
	90	* @EXP_TYPE@ The type of a group element, e.g., @mp *@.
	91	*
	92	* @EXP_COPY(d, x)@ Makes @d@ be a copy of @x@.
	93	*
	94	* @EXP_DROP(x)@ Discards the element @x@, reclaiming any
	95	* memory it used.
	96	*
	97	* @EXP_MUL(a, x)@ Multiplies @a@ by @x@ (writing the result
	98	* back to @a@).
	99	*
8823192f	100	* @EXP_FIX(x)@ Makes @x@ be a canonical representation of
	101	* its value. All multiplications have the
	102	* right argument canonical.
	103	*
7765e926	104	* @EXP_SQR(a)@ Multiplies @a@ by itself.
	105	*
	106	* @EXP_SETMUL(d, x, y)@ Sets @d@ to be the product of @x@ and @y@.
	107	* The value @d@ has not been initialized.
	108	*
	109	* @EXP_SETSQR(d, x)@ Sets @d@ to be the square of @x@.
	110	*
	111	* Only @EXP_TYPE@, @EXP_MUL@ and @EXP_SQR@ are required for simple
	112	* exponentation. Sliding window and simultaneous exponentation require all
	113	* of the operations.
	114	*/
	115
	116	#ifndef EXP_TYPE
	117	# error "EXP_TYPE not defined for <catacomb/exp.h>"
	118	#endif
	119
	120	/* --- @EXP_SIMPLE@ --- *
	121	*
	122	* Arguments: @a@ = the result object, initially a multiplicative identity
	123	* @g@ = the object to exponentiate
	124	* @x@ = the exponent, as a multiprecision integer
	125	*
	126	* Use: Performs a simple left-to-right exponentiation. At the end
	127	* of the code, the answer is left in @a@; @g@ and @x@ are
	128	* unchanged.
	129	*/
	130
	131	#define EXP_SIMPLE(a, g, x) do { \
	132	mpscan sc; \
	133	unsigned sq = 0; \
	134	\
	135	/* --- Begin scanning --- */ \
	136	\
	137	mp_rscan(&sc, x); \
	138	if (!MP_RSTEP(&sc)) \
	139	goto exp_simple_exit; \
	140	while (!MP_RBIT(&sc)) \
	141	MP_RSTEP(&sc); \
	142	\
	143	/* --- Do the main body of the work --- */ \
	144	\
8823192f	145	EXP_FIX(g); \
7765e926	146	for (;;) { \
	147	EXP_MUL(a, g); \
	148	sq = 0; \
	149	for (;;) { \
	150	if (!MP_RSTEP(&sc)) \
	151	goto exp_simple_done; \
	152	sq++; \
	153	if (MP_RBIT(&sc)) \
	154	break; \
	155	} \
	156	while (sq--) EXP_SQR(a); \
	157	} \
	158	\
	159	/* --- Do a final round of squaring --- */ \
	160	\
	161	exp_simple_done: \
	162	while (sq--) EXP_SQR(a); \
	163	exp_simple_exit:; \
	164	} while (0)
	165
	166	/* --- @EXP_WINDOW@ --- *
	167	*
	168	* Arguments: @a@ = the result object, initially a multiplicative identity
	169	* @g@ = the object to exponentiate
	170	* @x@ = the exponent, as a multiprecision integer
	171	*
	172	* Use: Performs a sliding-window exponentiation. At the end of the
	173	* code, the answer is left in @a@; @g@ and @x@ are unchanged.
	174	*/
	175
	176	#define EXP_WINDOW(a, g, x) do { \
	177	EXP_TYPE *v; \
	178	EXP_TYPE g2; \
	179	unsigned i, sq = 0; \
	180	mpscan sc; \
	181	\
	182	/* --- Get going --- */ \
	183	\
	184	mp_rscan(&sc, x); \
	185	if (!MP_RSTEP(&sc)) \
	186	goto exp_window_exit; \
	187	\
	188	/* --- Do the precomputation --- */ \
	189	\
8823192f	190	EXP_FIX(g); \
7765e926	191	EXP_SETSQR(g2, g); \
8823192f	192	EXP_FIX(g2); \
7765e926	193	v = xmalloc(EXP_TABSZ * sizeof(EXP_TYPE)); \
7765e926	194	EXP_COPY(v[0], g); \
8823192f	195	for (i = 1; i < EXP_TABSZ; i++) { \
7765e926	196	EXP_SETMUL(v[i], v[i - 1], g2); \
8823192f	197	EXP_FIX(v[i]); \
8823192f	198	} \
7765e926	199	EXP_DROP(g2); \
	200	\
	201	/* --- Skip top-end zero bits --- * \
	202	* \
	203	* If the initial step worked, there must be a set bit somewhere, so \
	204	* keep stepping until I find it. \
	205	*/ \
	206	\
	207	while (!MP_RBIT(&sc)) \
	208	MP_RSTEP(&sc); \
	209	\
	210	/* --- Now for the main work --- */ \
	211	\
	212	for (;;) { \
	213	unsigned l = 1; \
	214	unsigned z = 0; \
	215	\
	216	/* --- The next bit is set, so read a window index --- * \
	217	* \
	218	* Reset @i@ to zero and increment @sq@. Then, until either I read \
	219	* @WINSZ@ bits or I run out of bits, scan in a bit: if it's clear, \
	220	* bump the @z@ counter; if it's set, push a set bit into @i@, \
	221	* shift it over by @z@ bits, bump @sq@ by @z + 1@ and clear @z@. \
	222	* By the end of this palaver, @i@ is an index to the precomputed \
	223	* value in @v@. \
	224	*/ \
	225	\
	226	i = 0; \
	227	sq++; \
	228	while (l < EXP_WINSZ && MP_RSTEP(&sc)) { \
	229	l++; \
	230	if (!MP_RBIT(&sc)) \
	231	z++; \
	232	else { \
	233	i = ((i << 1) \| 1) << z; \
	234	sq += z + 1; \
	235	z = 0; \
	236	} \
	237	} \
	238	\
	239	/* --- Do the squaring --- * \
	240	* \
	241	* Remember that @sq@ carries over from the zero-skipping stuff \
	242	* below. \
	243	*/ \
	244	\
	245	while (sq--) EXP_SQR(a); \
	246	\
	247	/* --- Do the multiply --- */ \
	248	\
	249	EXP_MUL(a, v[i]); \
	250	\
	251	/* --- Now grind along through the rest of the bits --- */ \
	252	\
	253	sq = z; \
	254	for (;;) { \
	255	if (!MP_RSTEP(&sc)) \
	256	goto exp_window_done; \
	257	if (MP_RBIT(&sc)) \
	258	break; \
	259	sq++; \
	260	} \
	261	} \
	262	\
263	/* --- Do a final round of squaring --- */ \
264	\
265	exp_window_done: \
266	while (sq--) EXP_SQR(a); \
267	for (i = 0; i < EXP_TABSZ; i++) \
268	EXP_DROP(v[i]); \
269	xfree(v); \
270	exp_window_exit:; \
271	} while (0)
272
273	/* --- @EXP_SIMUL@ --- *
274	*
275	* Arguments: @a@ = the result object, initially a multiplicative identity
276	* @f@ = pointer to a vector of base/exp pairs
277	* @n@ = the number of base/exp pairs
278	*
279	* Use: Performs a simultaneous sliding-window exponentiation. The
280	* @f@ table is an array of structures containing members @base@
281	* of type @EXP_TYPE@, and @exp@ of type @mp *@.
282	*/
283
284	#define EXP_SIMUL(a, f, n) do { \
285	size_t i, j, jj, k; \
286	size_t vn = 1 << (EXP_WINSZ * n), m = (1 << n) - 1; \
287	EXP_TYPE v = xmalloc(vn sizeof(EXP_TYPE)); \
288	exp_simul e; \
289	unsigned sq = 0; \
290	\
291	/* --- Fill in the precomputed table --- */ \
292	\
293	j = 1; \
294	for (i = 0; i < n; i++) { \
295	EXP_COPY(v[j], f[n - 1 - i].base); \
8823192f	296	EXP_FIX(v[j]); \
7765e926	297	j <<= 1; \
	298	} \
	299	k = n * EXP_WINSZ; \
	300	jj = 1; \
	301	for (; i < k; i++) { \
	302	EXP_SETSQR(v[j], v[jj]); \
8823192f	303	EXP_FIX(v[j]); \
7765e926	304	j <<= 1; jj <<= 1; \
	305	} \
	306	for (i = 1; i < vn; i <<= 1) { \
8823192f	307	for (j = 1; j < i; j++) { \
7765e926	308	EXP_SETMUL(v[j + i], v[j], v[i]); \
8823192f	309	EXP_FIX(v[j + i]); \
8823192f	310	} \
7765e926	311	} \
	312	\
	313	/* --- Set up the bitscanners --- * \
	314	* \
	315	* Got to use custom scanners, to keep them all in sync. \
	316	*/ \
	317	\
	318	e.n = n; \
	319	e.b = 0; \
	320	e.s = xmalloc(n * sizeof(*e.s)); \
	321	e.o = 0; \
	322	for (i = 0; i < n; i++) { \
	323	MP_SHRINK(f[i].exp); \
	324	e.s[i].len = MP_LEN(f[i].exp); \
	325	e.s[i].v = f[i].exp->v; \
	326	if (e.s[i].len > e.o) \
	327	e.o = e.s[i].len; \
	328	} \
	329	\
	330	/* --- Skip as far as a nonzero column in the exponent matrix --- */ \
	331	\
	332	do { \
	333	if (!e.o && !e.b) \
	334	goto exp_simul_done; \
	335	i = exp_simulnext(&e, 0); \
	336	} while (!(i & m)); \
	337	\
	338	/* --- Now for the main work --- */ \
	339	\
	340	for (;;) { \
	341	unsigned l = 1; \
	342	unsigned z = 0; \
	343	\
	344	/* --- Just read a nonzero column, so read a window index --- * \
	345	* \
	346	* Clear high bits of @i@ and increment @sq@. Then, until either I \
	347	* read @WINSZ@ columns or I run out, scan in a column and append \
	348	* it to @i@. If it's zero, bump the @z@ counter; if it's nonzero, \
	349	* bump @sq@ by @z + 1@ and clear @z@. By the end of this palaver, \
	350	* @i@ is an index to the precomputed value in @v@, followed by \
	351	* @n * z@ zero bits. \
	352	*/ \
	353	\
	354	sq++; \
	355	while (l < EXP_WINSZ && (e.o \|\| e.b)) { \
	356	l++; \
	357	i = exp_simulnext(&e, i); \
	358	if (!(i & m)) \
	359	z++; \
	360	else { \
	361	sq += z + 1; \
	362	z = 0; \
	363	} \
	364	} \
	365	\
	366	/* --- Do the squaring --- * \
	367	* \
	368	* Remember that @sq@ carries over from the zero-skipping stuff \
	369	* below. \
	370	*/ \
	371	\
	372	while (sq--) EXP_SQR(a); \
	373	\
	374	/* --- Do the multiply --- */ \
375	\
376	i >>= (z * n); \
377	EXP_MUL(a, v[i]); \
378	\
379	/* --- Now grind along through the rest of the bits --- */ \
380	\
381	sq = z; \
382	for (;;) { \
383	if (!e.o && !e.b) \
384	goto exp_simul_done; \
385	if ((i = exp_simulnext(&e, 0)) != 0) \
386	break; \
387	sq++; \
388	} \
389	} \
390	\
391	/* --- Do a final round of squaring --- */ \
392	\
393	exp_simul_done: \
394	while (sq--) EXP_SQR(a); \
8823192f	395	for (i = 1; i < vn; i++) \
7765e926	396	EXP_DROP(v[i]); \
7765e926	397	xfree(v); \
ef13e9a4	398	xfree(e.s); \
7765e926	399	} while (0)
	400
	401	/----- Functions provided ------------------------------------------------/
	402
	403	/* --- @exp_simulnext@ --- *
	404	*
	405	* Arguments: @exp_simul *e@ = pointer to state structure
	406	* @size_t x@ = a current accumulator
	407	*
	408	* Returns: The next column of bits.
	409	*
	410	* Use: Scans the next column of bits for a simultaneous
	411	* exponentiation.
	412	*/
	413
	414	extern size_t exp_simulnext(exp_simul /e/, size_t /x*/);
	415
	416	/----- That's all, folks -------------------------------------------------/
	417
	418	#ifdef __cplusplus
	419	}
	420	#endif