pock: New program for generating and verifying primality certificates.

[catacomb-python] / pock
diff --git a/pock b/pock

new file mode 100644 (file)

index 0000000..46cde4d
--- /dev/null
+++ b/pock
@@ -0,0 +1,1065 @@
+#! /usr/bin/python
+### -*- mode: python, coding: utf-8 -*-
+###
+### Tool for generating and verifying primality certificates
+###
+### (c) 2017 Straylight/Edgeware
+###
+
+###----- Licensing notice ---------------------------------------------------
+###
+### This file is part of the Python interface to Catacomb.
+###
+### Catacomb/Python is free software; you can redistribute it and/or modify
+### it under the terms of the GNU General Public License as published by
+### the Free Software Foundation; either version 2 of the License, or
+### (at your option) any later version.
+###
+### Catacomb/Python is distributed in the hope that it will be useful,
+### but WITHOUT ANY WARRANTY; without even the implied warranty of
+### MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+### GNU General Public License for more details.
+###
+### You should have received a copy of the GNU General Public License
+### along with Catacomb/Python; if not, write to the Free Software Foundation,
+### Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
+
+###--------------------------------------------------------------------------
+### Imported modules.
+
+from sys import argv, stdin, stdout, stderr
+import os as OS
+import itertools as I
+import math as M
+import optparse as OP
+
+import catacomb as C
+
+###--------------------------------------------------------------------------
+### Utilities.
+
+class ExpectedError (Exception):
+  """
+  I represent an expected error, which should be reported in a friendly way.
+  """
+  pass
+
+def prod(ff, one = 1):
+  """
+  Return ONE times the product of the elements of FF.
+
+  This is not done very efficiently.
+  """
+  return reduce(lambda prod, f: prod*f, ff, one)
+
+def parse_label(line):
+  """
+  Split LINE at an `=' character and return the left and right halves.
+
+  The returned pieces have leading and trailing whitespace trimmed.
+  """
+  eq = line.find('=')
+  if eq < 0: raise ExpectedError('expected `LABEL = ...\'')
+  return line[:eq].strip(), line[eq + 1:].strip()
+
+def parse_list(s, n):
+  l = s.split(',', n - 1)
+  if n is not None and len(l) != n:
+    raise ExpectedError('expected `,\'-separated list of %d items' % n)
+  return l
+
+def conv_int(s):
+  """Convert S to a integer."""
+  try: return C.MP(s, 0)
+  except TypeError: raise ExpectedError('invalid integer `%s\'' % s)
+
+VERBOSITY = 1
+
+class ProgressReporter (object):
+  """
+  I keep users amused while the program looks for large prime numbers.
+
+  My main strategy is the printing of incomprehensible runes.  I can be
+  muffled by lowering by verbosity level.
+
+  Prime searches are recursive in nature.  When a new recursive level is
+  started, call `push'; and call `pop' when the level is finished.  This must
+  be done around the top level too.
+  """
+  def __init__(me):
+    """Initialize the ProgressReporter."""
+    me._level = -1
+    me._update()
+  def _update(me):
+    """
+    Update our idea of whether we're active.
+
+    We don't write inscrutable runes when inactive.  The current policy is to
+    write nothing if verbosity is zero, to write runes for the top level only
+    if verbosity is 1, and to write runes always if verbosity is higher than
+    that.
+    """
+    me._active = VERBOSITY >= 2 or (VERBOSITY == 1 and me._level == 0)
+  def push(me):
+    """Push a new search level."""
+    me._level += 1
+    me._update()
+    if me._level > 0: me.p('[')
+    else: me.p(';; ')
+  def pop(me):
+    """Pop a search level."""
+    if me._level > 0: me.p(']')
+    else: me.p('\n')
+    me._level -= 1
+    me._update()
+  def p(me, ch):
+    """Print CH as a progress rune."""
+    if me._active: stderr.write(ch); stderr.flush()
+
+def combinations(r, v):
+  """
+  Return an iterator which yields all combinations of R elements from V.
+
+  V must be an indexable sequence.  The each combination is returned as a
+  list, containing elements from V in their original order.
+  """
+
+  ## Set up the selection vector.  C will contain the indices of the items of
+  ## V we've selected for the current combination.  At all times, C contains
+  ## a strictly increasing sequence of integers in the interval [0, N).
+  n = len(v)
+  c = range(r)
+
+  while True:
+
+    ## Yield up the current combination.
+    vv = [v[i] for i in c]
+    yield vv
+
+    ## Now advance to the next one.  Find the last index in C which we can
+    ## increment subject to the rules.  As we iterate downwards, i will
+    ## contain the index into C, and j will be the maximum acceptable value
+    ## for the corresponding item.  We'll step the last index until it
+    ## reaches the limit, and then step the next one down, resetting the last
+    ## index, and so on.
+    i, j = r, n
+    while True:
+
+      ## If i is zero here, then we've advanced everything as far as it will
+      ## go.  We're done.
+      if i == 0: return
+
+      ## Move down to the next index.
+      i -= 1; j -= 1
+
+      ## If this index isn't at its maximum value, then we've found the place
+      ## to step.
+      if c[i] != j: break
+
+    ## Step this index on by one, and set the following indices to the
+    ## immediately following values.
+    j = c[i] + 1
+    while i < r: c[i] = j; i += 1; j += 1
+
+class ArgFetcher (object):
+  """
+  I return arguments from a list, reporting problems when they occur.
+  """
+  def __init__(me, argv, errfn):
+    """
+    Initialize, returning successive arguments from ARGV.
+
+    Errors are reported to ERRFN.
+    """
+    me._argv = argv
+    me._argc = len(argv)
+    me._errfn = errfn
+    me._i = 0
+  def arg(me, default = None, must = True):
+    """
+    Return the next argument.
+
+    If MUST is true, then report an error (to the ERRFN) if there are no more
+    arguments; otherwise, return the DEFAULT.
+    """
+    if me._i >= me._argc:
+      if must: me._errfn('missing argument')
+      return default
+    arg = me._argv[me._i]; me._i += 1
+    return arg
+  def int(me, default = None, must = True, min = None, max = None):
+    """
+    Return the next argument converted to an integer.
+
+    If MUST is true, then report an error (to the ERRFN) if there are no more
+    arguments; otherwise return the DEFAULT.  Report an error if the next
+    argument is not a valid integer, or if the integer is beyond the MIN and
+    MAX bounds.
+    """
+    arg = me.arg(default = None, must = must)
+    if arg is None: return default
+    try: arg = int(arg)
+    except ValueError: me._errfn('bad integer')
+    if (min is not None and arg < min) or (max is not None and arg > max):
+      me._errfn('out of range')
+    return arg
+
+###--------------------------------------------------------------------------
+### Sieving for small primes.
+
+class Sieve (object):
+  """
+  I represent a collection of small primes, up to some chosen limit.
+
+  The limit is available as the `limit' attribute.  Let L be this limit;
+  then, if N < L^2 is some composite, then N has at least one prime factor
+  less than L.
+  """
+
+  ## Figure out the number of bits in a (nonnegative) primitive `int'.  We'll
+  ## use a list of these as our sieve.
+  _NBIT = 15
+  while type(1 << (_NBIT + 1)) == int: _NBIT += 1
+
+  def __init__(me, limit):
+    """
+    Initialize a sieve holding all primes below LIMIT.
+    """
+
+    ## The sieve is maintained in the `_bits' attribute.  This is a list of
+    ## integers, used as a bitmask: let 2 < n < L be an odd integer; then bit
+    ## (n - 3)/2 will be clear iff n is prime.  Let W be the value of
+    ## `_NBIT', above; then bit W i + j in the sieve is stored in bit j of
+    ## `_bits[i]'.
+
+    ## Store the limit for later inspection.
+    me.limit = limit
+
+    ## Calculate the size of sieve we'll need and initialize the bit list.
+    n = (limit - 2)/2
+    sievesz = (n + me._NBIT - 1)/me._NBIT
+    me._sievemax = sievesz*me._NBIT
+    me._bits = n*[0]
+
+    ## This is standard Sieve of Eratosthenes.  For each index i: if
+    ## bit i is clear, then p = 2 i + 3 is prime, so set the bits
+    ## corresponding to each multiple of p, i.e., bits (k p - 3)/2 =
+    ## (2 k i + 3 - 3)/2 = k i for k > 1.
+    for i in xrange(me._sievemax):
+      if me._bitp(i): i += 1; continue
+      p = 2*i + 3
+      if p >= limit: break
+      for j in xrange(i + p, me._sievemax, p): me._setbit(j)
+      i += 1
+
+  def _bitp(me, i): i, j = divmod(i, me._NBIT); return (me._bits[i] >> j)&1
+  def _setbit(me, i): i, j = divmod(i, me._NBIT); me._bits[i] |= 1 << j
+
+  def smallprimes(me):
+    """
+    Return an iterator over the known small primes.
+    """
+    yield 2
+    n = 3
+    for b in me._bits:
+      for j in xrange(me._NBIT):
+        if not (b&1): yield n
+        b >>= 1; n += 2
+
+## We generate the sieve on demand.
+SIEVE = None
+
+def initsieve(sievebits):
+  """
+  Generate the sieve.
+
+  Ensure that it can be used to check the primality of numbers up to (but not
+  including) 2^SIEVEBITS.
+  """
+  global SIEVE
+  if SIEVE is not None: raise ValueError('sieve already defined')
+  if sievebits < 6: sievebits = 6
+  SIEVE = Sieve(1 << (sievebits + 1)/2)
+
+###--------------------------------------------------------------------------
+### Primality checking.
+
+def small_test(p):
+  """
+  Check that P is a small prime.
+
+  If not, raise an `ExpectedError'.  The `SIEVE' variable must have been
+  initialized.
+  """
+  if p < 2: raise ExpectedError('%d too small' % p)
+  if SIEVE.limit*SIEVE.limit < p:
+    raise ExpectedError('%d too large for small prime' % p)
+  for q in SIEVE.smallprimes():
+    if q*q > p: return
+    if p%q == 0: raise ExpectedError('%d divides %d' % (q, p))
+
+def pock_test(p, a, qq):
+  """
+  Check that P is prime using Pocklington's criterion.
+
+  If not, raise an `ExpectedError'.
+
+  Let Q be the product of the elements of the sequence QQ.  The test works as
+  follows.  Suppose p is the smallest prime factor of P.  If A^{P-1} /== 1
+  (mod P) then P is certainly composite (Fermat's test); otherwise, we have
+  established that the order of A in (Z/pZ)^* divides P - 1.  Next, let t =
+  A^{(P-1)/q} for some prime factor q of Q, and let g = gcd(t - 1, P).  If g
+  = P then the proof is inconclusive; if 1 < g < P then g is a nontrivial
+  factor of P, so P is composite; otherwise, t has order q in (Z/pZ)^*, so
+  (Z/pZ)^* contains a subgroup of size q, and therefore q divides p - 1.  If
+  QQ is a sequence of distinct primes, and the preceding criterion holds for
+  all q in QQ, then Q divides p - 1.  If Q^2 < P then the proof is
+  inconclusive; otherwise, let p' be any prime dividing P/p.  Then p' >= p >
+  Q, so p p' > Q^2 > P; but p p' divides P, so this is a contradiction.
+  Therefore P/p has no prime factors, and P is prime.
+  """
+
+  ## We don't actually need the distinctness criterion.  Suppose that q^e
+  ## divides Q.  Then gcd(t - 1, P) = 1 implies that A^{(P-1)/q^{e-1}} has
+  ## order q^e in (Z/pZ)^*, which accounts for the multiplicity.
+
+  Q = prod(qq)
+  if p < 2: raise ExpectedError('%d too small' % p)
+  if Q*Q <= p:
+    raise ExpectedError('too few Pocklington factors for %d' % p)
+  if pow(a, p - 1, p) != 1:
+    raise ExpectedError('%d is Fermat witness for %d' % (a, p))
+  for q in qq:
+    if Q%(q*q) == 0:
+      raise ExpectedError('duplicate Pocklington factor %d for %d' % (q, p))
+    g = p.gcd(pow(a, (p - 1)/q, p) - 1)
+    if g == p:
+      raise ExpectedError('%d order not multiple of %d mod %d' % (a, q, p))
+    elif g != 1:
+      raise ExpectedError('%d divides %d' % (g, p))
+
+def ecpp_test(p, a, b, x, y, qq):
+  """
+  Check that P is prime using Goldwasser and Kilian's ECPP method.
+
+  If not, raise an `ExpectedError'.
+
+  Let Q be the product of the elements of the sequence QQ.  Suppose p is the
+  smallest prime factor of P.  Let g = gcd(4 A^3 + 27 B^2, P).  If g = P then
+  the test is inconclusive; otherwise, if g /= 1 then g is a nontrivial
+  factor of P.  Define E(GF(p)) = { (x, y) | y^2 = x^3 + A x + B } U { inf }
+  to be the elliptic curve over p with short-Weierstraß coefficients A and B;
+  we have just checked that this curve is not singular.  If R = (X, Y) is not
+  a point on this curve, then the test is inconclusive.  If Q R is not the
+  point at infinity, then the test fails; otherwise we deduce that P has
+  Q-torsion in E.  Let S = (Q/q) R for some prime factor q of Q.  If S is the
+  point at infinity then the test is inconclusive; otherwise, q divides the
+  order of S in E.  If QQ is a sequence of distinct primes, and the preceding
+  criterion holds for all q in QQ, then Q divides the order of S.  Therefore
+  #E(p) >= Q.  If Q <= (qrrt(P) + 1)^2 then the test is inconclusive.
+  Otherwise, Hasse's theorem tells us that |p + 1 - #E(p)| <= 2 sqrt(p);
+  hence we must have p + 1 + 2 sqrt(p) = (sqrt(p) + 1)^2 >= #E(p) >= Q >
+  (qrrt(P) + 1)^2; so sqrt(p) + 1 > qrrt(P) + 1, i.e., p^2 > P.  As for
+  Pocklington above, if p' is any prime factor of P/p, then p p' >= p^2 > P,
+  which is a contradiction, and we conclude that P is prime.
+  """
+
+  ## This isn't going to work if gcd(P, 6) /= 1: we're going to use the
+  ## large-characteristic addition formulae.
+  g = p.gcd(6)
+  if g != 1: raise ExpectedError('%d divides %d' % (g, p))
+
+  ## We want to check that Q > (qrrt(P) + 1)^2 iff sqrt(Q) > qrrt(P) + 1; but
+  ## calculating square roots is not enjoyable (partly because we have to
+  ## deal with the imprecision).  Fortunately, some algebra will help: the
+  ## condition holds iff qrrt(P) < sqrt(Q) - 1 iff P < Q^2 - 4 Q sqrt(Q) +
+  ## 6 Q - 4 sqrt(Q) + 1 = Q (Q + 6) + 1 - 4 sqrt(Q) (Q + 1) iff Q (Q + 6) -
+  ## P + 1 > 4 sqrt(Q) (Q + 1) iff (Q (Q + 6) - P + 1)^2 > 16 Q (Q + 1)^2
+  Q = prod(qq)
+  t, u = Q*(Q + 6) - p + 1, 4*(Q + 1)
+  if t*t <= Q*u*u: raise ExpectedError('too few subgroups for ECPP')
+
+  ## Construct the curve.
+  E = C.PrimeField(p).ec(a, b) # careful: may not be a prime!
+
+  ## Find the base point.
+  R = E(x, y)
+  if not R.oncurvep():
+    raise ExpectedError('(%d, %d) is not on the curve' % (x, y))
+
+  ## Check that it has Q-torsion.
+  if Q*R: raise ExpectedError('(%d, %d) not a %d-torsion point' % (x, y, Q))
+
+  ## Now check the individual factors.
+  for q in qq:
+    if Q%(q*q) == 0:
+      raise ExpectedError('duplicate ECPP factor %d for %d' % (q, p))
+    S = (Q/q)*R
+    if not S:
+      raise ExpectedError('(%d, %d) order not a multiple of %d' % (x, y, q))
+    g = p.gcd(S._z)
+    if g != 1:
+      raise ExpectedError('%d divides %d' % (g, p))
+
+###--------------------------------------------------------------------------
+### Proof steps and proofs.
+
+class BaseStep (object):
+  """
+  I'm a step in a primality proof.
+
+  I assert that a particular number is prime, and can check this.
+
+  This class provides basic protocol for proof steps, mostly to do with
+  handling labels.
+
+  The step's label is kept in its `label' attribute.  It can be set by the
+  constructor, and is `None' by default.  Users can modify this attribute if
+  they like.  Labels beginning `$' are assumed to be internal and
+  uninteresting; other labels cause `check' lines to be written to the output
+  listing the actual number of interest.
+
+  Protocol that proof steps should provide:
+
+  label         A string labelling the proof step and the associated prime
+                number.
+
+  p             The prime number which this step proves to be prime.
+
+  check()       Check that the proof step is actually correct, assuming that
+                any previous steps have already been verified.
+
+  out(FILE)     Write an appropriate encoding of the proof step to the output
+                FILE.
+  """
+  def __init__(me, label = None, *arg, **kw):
+    """Initialize a proof step, setting a default label if necessary."""
+    super(BaseStep, me).__init__(*arg, **kw)
+    me.label = label
+  def out(me, file):
+    """
+    Write the proof step to an output FILE.
+
+    Subclasses must implement a method `_out' which actually does the work.
+    Here, we write a `check' line to verify that the proof actually applies
+    to the number we wanted, if the label says that this is an interesting
+    step.
+    """
+    me._out(file)
+    if me.label is not None and not me.label.startswith('$'):
+      file.write('check %s, %d, %d\n' % (me.label, me.p.nbits, me.p))
+
+class SmallStep (BaseStep):
+  """
+  I represent a claim that a number is a small prime.
+
+  Such claims act as the base cases in a complicated primality proof.  When
+  verifying, the claim is checked by trial division using a collection of
+  known small primes.
+  """
+  def __init__(me, pp, p, *arg, **kw):
+    """
+    Initialize a small-prime step.
+
+    PP is the overall PrimeProof object of which this is a step; P is the
+    small number whose primality is asserted.
+    """
+    super(SmallStep, me).__init__(*arg, **kw)
+    me.p = p
+  def check(me):
+    """Check that the number is indeed a small prime."""
+    return small_test(me.p)
+  def _out(me, file):
+    """Write a small-prime step to the FILE."""
+    file.write('small %s = %d\n' % (me.label, me.p))
+  def __repr__(me): return 'SmallStep(%d)' % (me.p)
+  @classmethod
+  def parse(cls, pp, line):
+    """
+    Parse a small-prime step from a LINE in a proof file.
+
+    SMALL-STEP ::= `small' LABEL `=' P
+
+    PP is a PrimeProof object holding the results from the previous steps.
+    """
+    if SIEVE is None: raise ExpectedError('missing `sievebits\' line')
+    label, p = parse_label(line)
+    return cls(pp, conv_int(p), label = label)
+
+class PockStep (BaseStep):
+  """
+  I represent a Pocklington certificate for a number.
+
+  The number is not explicitly represented in a proof file.  See `pock_test'
+  for the underlying mathematics.
+  """
+  def __init__(me, pp, a, R, qqi, *arg, **kw):
+    """
+    Inititialize a Pocklington step.
+
+    PP is the overall PrimeProof object of which this is a step; A is the
+    generator of a substantial subgroup of units; R is a cofactor; and QQI is
+    a sequence of labels for previous proof steps.  If Q is the product of
+    the primes listed in QQI, then the number whose primality is asserted is
+    2 Q R + 1.
+    """
+    super(PockStep, me).__init__(*arg, **kw)
+    me._a = a
+    me._R = R
+    me._qqi = qqi
+    me._qq = [pp.get_step(qi).p for qi in qqi]
+    me.p = prod(me._qq, 2*R) + 1
+  def check(me):
+    """Verify a proof step based on Pocklington's theorem."""
+    return pock_test(me.p, me._a, me._qq)
+  def _out(me, file):
+    """Write a Pocklington step to the FILE."""
+    file.write('pock %s = %d, %d, [%s]\n' % \
+                 (me.label, me._a,
+                  me._R, ', '.join('%s' % qi for qi in me._qqi)))
+  def __repr__(me): return 'PockStep(%d, %d, %s)' % (me._a, me._R, me._qqi)
+  @classmethod
+  def parse(cls, pp, line):
+    """
+    Parse a Pocklington step from a LINE in a proof file.
+
+    POCK-STEP ::= `pock' LABEL `=' A `,' R `,' `[' Q-LIST `]'
+    Q-LIST ::= Q [`,' Q-LIST]
+
+    PP is a PrimeProof object holding the results from the previous steps.
+    """
+    label, rest = parse_label(line)
+    a, R, qq = parse_list(rest, 3)
+    qq = qq.strip()
+    if not qq.startswith('[') or not qq.endswith(']'):
+      raise ExpectedError('missing `[...]\' around Pocklington factors')
+    return cls(pp, conv_int(a), conv_int(R),
+               [q.strip() for q in qq[1:-1].split(',')], label = label)
+
+class ECPPStep (BaseStep):
+  """
+  I represent a Goldwasser--Kilian ECPP certificate for a number.
+  """
+  def __init__(me, pp, p, a, b, x, y, qqi, *arg, **kw):
+    """
+    Inititialize an ECPP step.
+
+    PP is the overall PrimeProof object of which this is a step; P is the
+    number whose primality is asserted; A and B are the short Weierstraß
+    curve coefficients; X and Y are the base point coordinates; and QQI is a
+    sequence of labels for previous proof steps.
+    """
+    super(ECPPStep, me).__init__(*arg, **kw)
+    me._a, me._b = a, b
+    me._x, me._y = x, y
+    me._qqi = qqi
+    me._qq = [pp.get_step(qi).p for qi in qqi]
+    me.p = p
+  def check(me):
+    """Verify a proof step based on Goldwasser and Kilian's theorem."""
+    return ecpp_test(me.p, me._a, me._b, me._x, me._y, me._qq)
+  def _out(me, file):
+    """Write an ECPP step to the FILE."""
+    file.write('ecpp %s = %d, %d, %d, %d, %d, [%s]\n' % \
+                 (me.label, me.p, me._a, me._b, me._x, me._y,
+                  ', '.join('%s' % qi for qi in me._qqi)))
+  def __repr__(me):
+    return 'ECPPstep(%d, %d, %d, %d, %d, %s)' % \
+        (me.p, me._a, me._b, me._x, me._y, me._qqi)
+  @classmethod
+  def parse(cls, pp, line):
+    """
+    Parse an ECPP step from a LINE in a proof file.
+
+    ECPP-STEP ::= `ecpp' LABEL `=' P `,' A `,' B `,' X `,' Y `,'
+        `[' Q-LIST `]'
+    Q-LIST ::= Q [`,' Q-LIST]
+
+    PP is a PrimeProof object holding the results from the previous steps.
+    """
+    label, rest = parse_label(line)
+    p, a, b, x, y, qq = parse_list(rest, 6)
+    qq = qq.strip()
+    if not qq.startswith('[') or not qq.endswith(']'):
+      raise ExpectedError('missing `[...]\' around ECPP factors')
+    return cls(pp, conv_int(p), conv_int(a), conv_int(b),
+               conv_int(x), conv_int(y),
+               [q.strip() for q in qq[1:-1].split(',')], label = label)
+
+def check(pp, line):
+  """
+  Handle a `check' line in a proof file.
+
+  CHECK ::= `check' LABEL, B, N
+
+  Verify that the proof step with the given LABEL asserts the primality of
+  the integer N, and that 2^{B-1} <= N < 2^B.
+  """
+  label, nb, p = parse_list(line, 3)
+  label, nb, p = label.strip(), conv_int(nb), conv_int(p)
+  pi = pp.get_step(label).p
+  if pi != p:
+    raise ExpectedError('check failed: %s = %d /= %d' % (label, pi, p))
+  if p.nbits != nb:
+    raise ExpectedError('check failed: nbits(%s) = %d /= %d' % \
+                        (label, p.nbits, nb))
+  if VERBOSITY: print ';; %s = %d [%d]' % (label, p, nb)
+
+def setsievebits(pp, line):
+  """
+  Handle a `sievebits' line in a proof file.
+
+  SIEVEBITS ::= `sievebits' N
+
+  Ensure that the verifier is willing to accept small primes up to 2^N.
+  """
+  initsieve(int(line))
+
+class PrimeProof (object):
+  """
+  I represent a proof of primality for one or more numbers.
+
+  I can encode my proof as a line-oriented text file, in a simple format, and
+  read such a proof back to check it.
+  """
+
+  ## A table to dispatch on keywords read from a file.
+  STEPMAP = { 'small': SmallStep.parse,
+              'pock': PockStep.parse,
+              'ecpp': ECPPStep.parse,
+              'sievebits': setsievebits,
+              'check': check }
+
+  def __init__(me):
+    """
+    Initialize a proof object.
+    """
+    me._steps = {}                      # Maps labels to steps.
+    me._stepseq = []                    # Sequence of labels, in order.
+    me._pmap = {}                       # Maps primes to steps.
+    me._i = 0
+
+  def addstep(me, step):
+    """
+    Add a new STEP to the proof.
+
+    The STEP may have a label already.  If not, a new internal label is
+    chosen.  The proof step is checked before being added to the proof.  The
+    label is returned.
+    """
+
+    ## If there's already a step for this prime, and the new step doesn't
+    ## have a label, then return the old one instead.
+    if step.label is None:
+      try: return me._pmap[step.p]
+      except KeyError: pass
+
+    ## Make sure the step is actually correct.
+    step.check()
+
+    ## Generate a label if the step doesn't have one already.
+    if step.label is None: step.label = '$t%d' % me._i; me._i += 1
+
+    ## If the label is already taken then we have a problem.
+    if step.label in me._steps:
+      raise ValueError('duplicate label `%s\'' % step.label)
+
+    ## Store the proof step.
+    me._pmap[step.p] = step.label
+    me._steps[step.label] = step
+    me._stepseq.append(step.label)
+    return step.label
+
+  def get_step(me, label):
+    """
+    Check that LABEL labels a known step, and return that step.
+    """
+    try: return me._steps[label]
+    except KeyError: raise ExpectedError('unknown label `%s\'' % label)
+
+  def write(me, file):
+    """
+    Write the proof to the given FILE.
+    """
+
+    ## Prefix the main steps with a `sievebits' line.
+    file.write('sievebits %d\n' % (2*(SIEVE.limit.bit_length() - 1)))
+
+    ## Write the steps out one by one.
+    for label in me._stepseq: me._steps[label].out(file)
+
+  def read(me, file):
+    """
+    Read a proof from a given FILE.
+
+    FILE ::= {STEP | CHECK | SIEVEBITS} [FILE]
+    STEP ::= SMALL-STEP | POCK-STEP
+
+    Comments (beginning `;') and blank lines are ignored.  Other lines begin
+    with a keyword.
+    """
+    lastp = None
+    for lno, line in enumerate(file, 1):
+      line = line.strip()
+      if line.startswith(';'): continue
+      ww = line.split(None, 1)
+      if not ww: continue
+      w = ww[0]
+      if len(ww) > 1: tail = ww[1]
+      else: tail = ''
+      try:
+        try: op = me.STEPMAP[w]
+        except KeyError:
+          raise ExpectedError('unrecognized keyword `%s\'' % w)
+        step = op(me, tail)
+        if step is not None:
+          me.addstep(step)
+          lastp = step.p
+      except ExpectedError, e:
+        raise ExpectedError('%s:%d: %s' % (file.name, lno, e.message))
+    return lastp
+
+###--------------------------------------------------------------------------
+### Finding provable primes.
+
+class BasePrime (object):
+  """
+  I represent a prime number which has been found and can be proven.
+
+  This object can eventually be turned into a sequence of proof steps and
+  added to a PrimeProof.  This isn't done immediately, because some
+  prime-search strategies want to build a pool of provable primes and will
+  then select some subset of them to actually construct the number of final
+  interest.  This way, we avoid cluttering the output proof with proofs of
+  uninteresting numbers.
+
+  Protocol required.
+
+  p             The prime number in question.
+
+  label(LABEL)  Associate LABEL with this prime, and the corresponding proof
+                step.  A label can be set in the constructor, or later using
+                this method.
+
+  register(PP)  Register the prime with a PrimeProof, adding any necessary
+                proof steps.  Returns the label of the proof step for this
+                number.
+
+  _mkstep(PP, **KW)
+                Return a proof step for this prime.
+  """
+  def __init__(me, label = None, *args, **kw):
+    """Initialize a provable prime number object."""
+    super(BasePrime, me).__init__(*args, **kw)
+    me._index = me._pp = None
+    me._label = label
+  def label(me, label):
+    """Set this number's LABEL."""
+    me._label = label
+  def register(me, pp):
+    """
+    Register the prime's proof steps with PrimeProof PP.
+
+    Return the final step's label.
+    """
+    if me._pp is not None:
+      assert me._pp == pp
+    else:
+      me._pp = pp
+      me._index = pp.addstep(me._mkstep(pp, label = me._label))
+      ##try: me._index = pp.addstep(me._mkstep(pp, label = me._label))
+      ##except: raise RuntimeError('generated proof failed sanity check')
+    return me._index
+
+class SmallPrime (BasePrime):
+  """I represent a prime small enough to be checked in isolation."""
+  def __init__(me, p, *args, **kw):
+    super(SmallPrime, me).__init__(*args, **kw)
+    me.p = p
+  def _mkstep(me, pp, **kw):
+    return SmallStep(pp, me.p, **kw)
+
+class PockPrime (BasePrime):
+  """I represent a prime proven using Pocklington's theorem."""
+  def __init__(me, p, a, qq, *args, **kw):
+    super(PockPrime, me).__init__(*args, **kw)
+    me.p = p
+    me._a = a
+    me._qq = qq
+  def _mkstep(me, pp, **kw):
+    return PockStep(pp, me._a, (me.p - 1)/prod((q.p for q in me._qq), 2),
+                    [q.register(pp) for q in me._qq], **kw)
+
+def gen_small(nbits, label = None, p = None):
+  """
+  Return a new small prime.
+
+  The prime will be exactly NBITS bits long.  The proof step will have the
+  given LABEL attached.  Report progress to the ProgressReporter P.
+  """
+  while True:
+
+    ## Pick a random NBITS-bit number.
+    n = C.rand.mp(nbits, 1)
+    assert n.nbits == nbits
+
+    ## If it's probably prime, then check it against the small primes we
+    ## know.  If it passes then we're done.  Otherwise, try again.
+    if n.primep():
+      for q in SIEVE.smallprimes():
+        if q*q > n: return SmallPrime(n, label = label)
+        if n%q == 0: break
+
+def gen_pock(nbits, nsubbits = 0, label = None, p = ProgressReporter()):
+  """
+  Return a new prime provable using Pocklington's theorem.
+
+  The prime N will be exactly NBITS long, of the form N = 2 Q R + 1.  If
+  NSUBBITS is nonzero, then each prime factor of Q will be NSUBBITS bits
+  long; otherwise a suitable default will be chosen.  The proof step will
+  have the given LABEL attached.  Report progress to the ProgressReporter P.
+
+  The prime numbers this function returns are a long way from being uniformly
+  distributed.
+  """
+
+  ## Pick a suitable value for NSUBBITS if we don't have one.
+  if not nsubbits:
+
+    ## This is remarkably tricky.  Picking about 1/3 sqrt(NBITS) factors
+    ## seems about right for large numbers, but there's serious trouble
+    ## lurking for small sizes.
+    nsubbits = int(3*M.sqrt(nbits))
+    if nbits < nsubbits + 3: nsubbits = nbits//2 + 1
+    if nbits == 2*nsubbits: nsubbits += 1
+
+  ## Figure out how many subgroups we'll need.
+  npiece = ((nbits + 1)//2 + nsubbits - 1)//nsubbits
+  p.push()
+
+  ## Keep searching...
+  while True:
+
+    ## Come up with a collection of known prime factors.
+    p.p('!'); qq = [gen(nsubbits, p = p) for i in xrange(npiece)]
+    Q = prod(q.p for q in qq)
+
+    ## Come up with bounds on the cofactor.  If we're to have N = 2 Q R + 1,
+    ## and 2^{B-1} <= N < 2^B, then we must have 2^{B-2}/Q <= R < 2^{B-1}/Q.
+    Rbase = (C.MP(0).setbit(nbits - 2) + Q - 1)//Q
+    Rwd = C.MP(0).setbit(nbits - 2)//Q
+
+    ## Probe the available space of cofactors.  If the space is kind of
+    ## narrow, then we want to give up quickly if we're not finding anything
+    ## suitable.
+    step = 0
+    while step < Rwd:
+      step += 1
+
+      ## Pick a random cofactor and examine the number we ended up with.
+      ## Make sure it really does have the length we expect.
+      R = C.rand.range(Rwd) + Rbase
+      n = 2*Q*R + 1
+      assert n.nbits == nbits
+
+      ## As a complication, if NPIECE is 1, it's just about possible that Q^2
+      ## <= n, in which case this isn't going to work.
+      if Q*Q < n: continue
+
+      ## If n has small factors, then pick another cofactor.
+      if C.PrimeFilter.smallfactor(n) == C.PGEN_FAIL: continue
+
+      ## Work through the small primes to find a suitable generator.  The
+      ## value 2 is almost always acceptable, so don't try too hard here.
+      for a in I.islice(SIEVE.smallprimes(), 16):
+
+        ## First, try the Fermat test.  If that fails, then n is definitely
+        ## composite.
+        if pow(a, n - 1, n) != 1: p.p('.'); break
+        p.p('*')
+
+        ## Work through the subgroup orders, checking that suitable powers of
+        ## a generate the necessary subgroups.
+        for q in qq:
+          if n.gcd(pow(a, (n - 1)/q.p, n) - 1) != 1:
+            p.p('@'); ok = False; break
+        else:
+          ok = True
+
+        ## we're all good.
+        if ok: p.pop(); return PockPrime(n, a, qq, label = label)
+
+def gen(nbits, label = None, p = ProgressReporter()):
+  """
+  Generate a prime number with NBITS bits.
+
+  Give it the LABEL, and report progress to P.
+  """
+  if SIEVE.limit >> (nbits + 1)/2: g = gen_small
+  else: g = gen_pock
+  return g(nbits, label = label, p = p)
+
+def gen_limlee(nbits, nsubbits,
+               label = None, qlfmt = None, p = ProgressReporter()):
+  """
+  Generate a Lim--Lee prime with NBITS bits.
+
+  Let p be the prime.  Then we'll have p = 2 q_0 q_1 ... q_k, with all q_i at
+  least NSUBBITS bits long, and all but q_k exactly that long.
+
+  The prime will be given the LABEL; progress is reported to P.  The factors
+  q_i will be labelled by filling in the `printf'-style format string QLFMT
+  with the argument i.
+  """
+
+  ## Figure out how many factors (p - 1)/2 will have.
+  npiece = nbits//nsubbits
+  if npiece < 2: raise ExpectedError('too few pieces')
+
+  ## Decide how big to make the pool of factors.
+  poolsz = max(3*npiece + 5, 25) # Heuristic from GnuPG
+
+  ## Prepare for the main loop.
+  disp = nstep = 0
+  qbig = None
+  p.push()
+
+  ## Try to make a prime.
+  while True:
+    p.p('!')
+
+    ## Construct a pool of NSUBBITS-size primes.  There's a problem with very
+    ## small sizes: we might not be able to build a pool of distinct primes.
+    pool = []; qmap = {}
+    for i in xrange(poolsz):
+      for j in xrange(64):
+        q = gen(nsubbits, p = p)
+        if q.p not in qmap: break
+      else:
+        raise ExpectedError('insufficient diversity')
+      qmap[q.p] = q
+      pool.append(q)
+
+    ## Work through combinations of factors from the pool.
+    for qq in combinations(npiece - 1, pool):
+
+      ## Construct the product of the selected factors.
+      qsmall = prod(q.p for q in qq)
+
+      ## Maybe we'll need to replace the large factor.  Try not to do this
+      ## too often.  DISP measures the large factor's performance at
+      ## producing candidates with the right length.  If it looks bad then
+      ## we'll have to replace it.
+      if 3*disp*disp > nstep*nstep:
+        qbig = None
+        if disp < 0: p.p('<')
+        else: p.p('>')
+
+      ## If we don't have a large factor, then make one.
+      if qbig is None:
+        qbig = gen(nbits - qsmall.nbits, p = p)
+        disp = 0; nstep = 0
+
+      ## We have a candidate.  Calculate it and make sure it has the right
+      ## length.
+      n = 2*qsmall*qbig.p + 1
+      nstep += 1
+      if n.nbits < nbits: disp -= 1
+      elif n.nbits > nbits: disp += 1
+      elif C.PrimeFilter.smallfactor(n) == C.PGEN_FAIL: pass
+      else:
+
+        ## The candidate has passed the small-primes test.  Now check it
+        ## against Pocklington.
+        for a in I.islice(SIEVE.smallprimes(), 16):
+
+          ## Fermat test.
+          if pow(a, n - 1, n) != 1: p.p('.'); break
+          p.p('*')
+
+          ## Find a generator of a sufficiently large subgroup.
+          if n.gcd(pow(a, (n - 1)/qbig.p, n) - 1) != 1: p.p('@'); continue
+          ok = True
+          for q in qq:
+            if n.gcd(pow(a, (n - 1)/q.p, n) - 1) != 1:
+              p.p('@'); ok = False; break
+
+          ## We're done.
+          if ok:
+
+            ## Label the factors.
+            qq.append(qbig)
+            if qlfmt:
+              for i, q in enumerate(qq): q.label(qlfmt % i)
+
+            ## Return the number we found.
+            p.pop(); return PockPrime(n, a, qq, label = label)
+
+###--------------------------------------------------------------------------
+### Main program.
+
+def __main__():
+  global VERBOSITY
+
+  ## Prepare an option parser.
+  op = OP.OptionParser(
+    usage = '''\
+pock [-qv] CMD ARGS...
+        gen NBITS
+        ll NBITS NSUBBITS
+        [check] [FILE]''',
+    description = 'Generate or verify certified prime numbers.')
+  op.add_option('-v', '--verbose', dest = 'verbosity',
+                action = 'count', default = 1,
+                help = 'Print mysterious runes while looking for prime numbers.')
+  op.add_option('-q', '--quiet', dest = 'quietude',
+                action = 'count', default = 0,
+                help = 'be quiet while looking for prime numbers.')
+  op.add_option('-s', '--sievebits', dest = 'sievebits',
+                type = 'int', default = 32,
+                help = 'Size (in bits) of largest small prime.')
+  opts, argv = op.parse_args()
+  VERBOSITY = opts.verbosity - opts.quietude
+  p = ProgressReporter()
+  a = ArgFetcher(argv, op.error)
+
+  ## Process arguments and do what the user asked.
+  w = a.arg()
+
+  if w == 'gen':
+    ## Generate a prime with no special structure.
+    initsieve(opts.sievebits)
+    nbits = a.int(min = 4)
+    pp = PrimeProof()
+    p = gen(nbits, 'p', p = p)
+    p.register(pp)
+    pp.write(stdout)
+
+  elif w == 'll':
+    ## Generate a Lim--Lee prime.
+    initsieve(opts.sievebits)
+    nbits = a.int(min = 4)
+    nsubbits = a.int(min = 4, max = nbits)
+    pp = PrimeProof()
+    p = gen_limlee(nbits, nsubbits, 'p', 'q_%d', p = p)
+    p.register(pp)
+    pp.write(stdout)
+
+  elif w == 'check':
+    ## Check an existing certificate.
+    fn = a.arg(default = '-', must = False)
+    if fn == '-': f = stdin
+    else: f = open(fn, 'r')
+    pp = PrimeProof()
+    p = pp.read(f)
+
+  else:
+    raise ExpectedError("unknown command `%s'" % w)
+
+if __name__ == '__main__':
+  prog = OS.path.basename(argv[0])
+  try: __main__()
+  except ExpectedError, e: exit('%s: %s' % (prog, e.message))
+  except IOError, e: exit('%s: %s' % (prog, e))
+
+###----- That's all, folks --------------------------------------------------