Ballot-polling risk_levels, multiround sample size #1

Open · wants to merge 6 commits into base: master

6 changes: 5 additions & 1 deletion .gitignore
@@ -1,3 +1,7 @@
*.pyc
.*swp
-db.sqlite3*
+db.sqlite3*
.hypothesis
.cache
.ipynb_checkpoints
.idea
5 changes: 5 additions & 0 deletions audit_cvrs/TODO
@@ -0,0 +1,5 @@
rlacalc ballot-polling branch:
does it work with python 3?
with amazon lambda?
Add a test for OverflowError
add smart_boolean support to make the web form make more sense(?)
35 changes: 24 additions & 11 deletions audit_cvrs/parse_dominion_cvrs.py
@@ -64,14 +64,14 @@ def parse():

contestManifest = json.loads(rawJson)

-contests = collections.OrderedDict()
+all_contests = collections.OrderedDict()

for contest in contestManifest['List']:
-contests[contest['Id']] = contest['Description']
+all_contests[contest['Id']] = contest['Description']

-numContests = len(contests)
+numContests = len(all_contests)

logging.debug("Manifest for %d contests:\n%s" % (numContests, contests.items()))
logging.debug("Manifest for %d contests:\n%s" % (numContests, all_contests.items()))

with zipf.open("CandidateManifest.json") as jsonFile:
rawJson = jsonFile.read()
@@ -82,9 +82,9 @@ def parse():
unordered_candidates = {}

for candidate in candidateManifest['List']:
-unordered_candidates[candidate['Id']] = "%s\t%s" % (contests[candidate['ContestId']], candidate['Description'])
+unordered_candidates[candidate['Id']] = "%s\t%s" % (all_contests[candidate['ContestId']], candidate['Description'])

-logging.debug(sorted(unordered_candidates.items()))
+# same as below logging.debug("Sorted candidate items: %s" % sorted(unordered_candidates.items()))

candidates = collections.OrderedDict(sorted(unordered_candidates.items()))
numCandidates = len(candidates)
@@ -98,15 +98,15 @@ def parse():
i = 0
for id, name in candidates.iteritems():
if "," in name:
print "Error: Found , in name"
pass # print "Error: Found , in name:", name
headers += "%s," % name
candidateIndex[id] = i
i += 1

headers = headers.strip(",")

logging.info("Found %d candidates:\n%s" % (numCandidates, candidates))
logging.info(candidateIndex)
logging.info("Found %d candidates:\n %s" % (numCandidates, candidates))
logging.info("Candidate Index by contest: %s" % candidateIndex)

logging.info("First manifest item: %s" % candidateManifest['List'][1])

@@ -163,7 +163,15 @@ def parse():

voteArray = ["0"] * numCandidates
votes = ""
-for contest in original['Contests']:
+try:
+    # e.g. in Dominion Democracy Suite version 4.21.3.0
+    contests = original['Contests']
+except KeyError:
+    logging.debug("For %s, original doesn't have 'Contests' in it!\n Keys: %s\n Dump: %s" % (zipinfo.filename, original.keys(), original))
+    # e.g. in Dominion Democracy Suite version 5.5.32.4
+    contests = original['Cards'][0]['Contests']
+
+for contest in contests:
contestBallots[contest['Id']] += 1
contestBallotsByBatch = contestBallotsByBatchManager.get(contest['Id'], collections.Counter())
contestBallotsByBatch[session['BatchId']] += 1
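The try/except above covers two CVR export layouts. A minimal sketch of the two record shapes, inferred only from the accesses in this function (hypothetical field subsets, not the full Dominion schema):

    # Democracy Suite 4.21.3.0: contests sit at the top level of the record
    original_v4 = {'Contests': [{'Id': 1}]}
    # Democracy Suite 5.5.32.4: contests are nested under the first card
    original_v55 = {'Cards': [{'Contests': [{'Id': 1}]}]}
    assert original_v55['Cards'][0]['Contests'] == original_v4['Contests']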
@@ -225,11 +233,16 @@ def parse():
print contestBallots.most_common(10)

for contestId in sorted(contestBallots):
-logging.warning("%d Ballots for contest %s" % (contestBallots[contestId], contests[contestId]))
+logging.warning("%d Ballots for contest %s" % (contestBallots[contestId], all_contests[contestId]))

import pandas as pd
df = pd.DataFrame.from_dict(contestBallotsByBatchManager, orient='index').transpose()

# Print descriptive statistics for each contest of the number of ballots by batch
# FIXME: assumes a single tabulator. need to combine tabulator and batch ids....

# hmmm - how to add the contest name (Description) to the mix? df['Contest'] = apply(
# Use option_context to print all rows and columns out, no maximums
with pd.option_context('display.max_rows', None, 'display.max_columns', None):
print df.describe().transpose()

128 changes: 113 additions & 15 deletions audit_cvrs/rlacalc.py
@@ -51,6 +51,14 @@
rlacalc.py --test

TODO:
check hug parameters, test more
check command line calling sequences and printouts
use different names if I change parameter order
update rlacalc.html
make "Note, can be less than nmin" example into test case
more p-value tests
test multi-times thru loop

Model variance for ballot-polling audits, add estimates for quantiles.
Add calculations for DiffSum, ClipAudit etc.
Add pretty API documentation via pydoc3 and json2html
@@ -64,7 +72,7 @@
import sys
import logging
from optparse import OptionParser
-from math import log, ceil, isnan
+from math import log, exp, ceil, isnan
# from numpy import log, ceil

try:
Expand Down Expand Up @@ -101,7 +109,7 @@ def decorator(f):
action="store_true", default=False,
help="Calculate nmin from observed discrepancies, not rates")

parser.add_option("-R", "--rawrates",
parser.add_option("--rawrates",
action="store_true", default=False,
help="Calculate KM_Expected_sample_size value, with no rounding")

@@ -113,13 +121,19 @@ def decorator(f):
action="store_true", default=False,
help="Calculate nminToGo value: calculate rates from o1 o2 u1 u2 / samplesize")

parser.add_option("-l", "--level",
parser.add_option("--level",
action="store_true", default=False,
help="Calculate risk level, the p-value")

parser.add_option("-p", "--polling",
action="store_true", default=False,
help="Ballot polling audit")
help="Ballot polling audit. Add --level for levels")

parser.add_option("-R", "--risk_level",
type="float", default=100.0,
help="risk level based on ballots tallied so far."
"Corresponds to one divided by the test statistic, as a fraction."
"Default: 1.0 (corresponding to no ballots tallied)")

parser.add_option("-r", "--alpha",
type="float", default=10.0,
@@ -133,6 +147,22 @@ def decorator(f):
type="int", default=95,
help="Sample size, for --level option")

parser.add_option("-W", "--winnervotes",
type="int", default=0,
help="Reported votes for the winner -p --level options")

parser.add_option("-L", "--loservotes",
type="int", default=0,
help="Reported votes for the loser -p --level options")

parser.add_option("-w", "--winnersamples",
type="int", default=0,
help="Sampled votes for the winner -p --level options")

parser.add_option("-l", "--losersamples",
type="int", default=0,
help="Sampled votes for the winner -p --level options")

parser.add_option("-b", "--binom",
action="store_true", default=False,
help="Calculate binomial confidence interval")
@@ -494,7 +524,7 @@ def nminEst(alpha=0.1, gamma=1.03905, margin=0.05, or1=0.001, or2=0.0001, ur1=0.
@annotate(dict(alpha=hug.types.float_number, gamma=hug.types.float_number, margin=hug.types.float_number,
or1=hug.types.float_number, or2=hug.types.float_number,
ur1=hug.types.float_number, ur2=hug.types.float_number,
-roundUp1=hug.types.boolean, roundUp2=hug.types.boolean))
+roundUp1=hug.types.boolean, roundUp2=hug.types.boolean)) # smart_boolean when supported
def nminFromRates(alpha=0.1, gamma=1.03905, margin=0.05, or1=0.001, or2=0.0001, ur1=0.001, ur2=0.0001, roundUp1=True, roundUp2=False):
"""Return expected sample size for a ballot-level comparison Risk-Limiting Audit
alpha: maximum risk level (alpha), as a fraction
@@ -562,8 +592,19 @@ def nminFromRates(alpha=0.1, gamma=1.03905, margin=0.05, or1=0.001, or2=0.0001,
return(n0)


def recalculateSamplesToAudit(num_audited, a, gamma, m, o1, o2, u1, u2):
"""Sample size calculation from ColoradoRLA v1.1:
https://github.com/FreeAndFair/ColoradoRLA/issues/695
"""

nm = nmin(a, gamma, m, o1, o2, u1, u2)
return ceil(nm * (1 + ((o1 + o2) * 1.0 / num_audited)))
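A usage sketch with hypothetical audit numbers (argument names as in the signature above):

    # After auditing 95 ballots that turned up one one-vote overstatement,
    # re-estimate the total sample needed for a 5% diluted margin at a
    # 10% risk limit with the default gamma:
    needed = recalculateSamplesToAudit(num_audited=95, a=0.1, gamma=1.03905,
                                       m=0.05, o1=1, o2=0, u1=0, u2=0)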


def KM_P_value(n=95, gamma=1.03905, margin=0.05, o1=0, o2=0, u1=0, u2=0):
"""Return P-values (risk level achieved?) for given sample size n and discrepancy counts.
"""Return P-values (risk level achieved) for a comparison audit with the
given sample size n and discrepancy counts.

n: sample size
margin: diluted margin;
From https://github.com/pbstark/S157F17/blob/master/audit.ipynb
@@ -580,22 +621,68 @@ def KM_P_value(n=95, gamma=1.03905, margin=0.05, o1=0, o2=0, u1=0, u2=0):
(1 + 1/gamma)**(-u2))
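A quick sanity check of the formula (the value below is approximate, computed from the expression above):

    # 95 ballots, no discrepancies, 5% diluted margin, default gamma:
    # lands just under the common 10% risk limit.
    KM_P_value(n=95, margin=0.05)   # ~ 0.099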


-@hug.get(examples='alpha=0.1&margin=0.05')
def ballot_polling_risk_level(winner_votes, loser_votes, winner_obs, loser_obs):
"""
Return the ballot polling risk level for a contest with the given overall
vote totals and observed votes on selected ballots during a ballot polling
risk-limiting audit.

This method should be called for each winner-loser pair (w, l):
calculate s_wl = (number of votes for w) / (number of votes for w + number of votes for l).
For each contest, for each winner-loser pair (w, l), set T_wl = 1.
For each line in `all_contest_audit_details_by_cvr` with consensus = "YES",
change any T_wl values as indicated by the BRAVO algorithm.
The risk level achieved so far is the inverse of the resulting T_wl value.

>>> ballot_polling_risk_level(1410, 1132, 170, 135) # Custer County 2018
0.1342382069344729
>>> ballot_polling_risk_level(2894, 1695, 45, 32) # Las Animas County 2018
0.47002027242290234
>>> ballot_polling_risk_level(0, 0, 2000, 0)
1.0
>>> ballot_polling_risk_level(2894, 0, 1130, 0) # Test overflow
nan
>>> ballot_polling_risk_level(100000, 0, 50000, 0) # Test overflow
nan

The core of the code is equivalent to this, but uses logs to prevent overflow:
T_wl = 1.0
T_wl = T_wl * ((s_wl)/0.5) ** winner_obs
T_wl = T_wl * ((1.0 - s_wl)/0.5) ** loser_obs
"""

try:
s_wl = winner_votes / float(winner_votes + loser_votes)  # float() guards against Python 2 integer division
except ZeroDivisionError:
return 1.0

log_T_wl = log(1.0)
try:
log_T_wl = log_T_wl + ((log(s_wl) - log(0.5)) * winner_obs)
log_T_wl = log_T_wl + ((log(1.0 - s_wl) - log(0.5)) * loser_obs)
log_risk_level = log(1.0) - log_T_wl
risk_level = exp(log_risk_level)
except (ValueError, OverflowError): # TODO: Add test case, reevaluate for OverflowError e.g. Lt Governor
risk_level = float('NaN')

return risk_level
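The per-pair procedure from the docstring, sketched as a driver loop (the tallies and sample counts here are hypothetical, not from this module):

    # Audit the contest pairwise: it can stop once every winner-loser
    # pair reaches the risk limit alpha.
    tallies = {'Alice': 1410, 'Bob': 1132, 'Carol': 900}   # reported votes
    sampled = {'Alice': 170, 'Bob': 135, 'Carol': 101}     # sampled votes so far
    winners, losers = ['Alice'], ['Bob', 'Carol']
    risks = dict(((w, l), ballot_polling_risk_level(tallies[w], tallies[l],
                                                    sampled[w], sampled[l]))
                 for w in winners for l in losers)
    done = all(r <= 0.1 for r in risks.values())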


@hug.get(examples='alpha=0.1&margin=0.05&risk_level=1.0')
@hug.local()
@annotate(dict(alpha=hug.types.float_number, margin=hug.types.float_number))
def findAsn(alpha=0.1, margin=0.05):
@annotate(dict(alpha=hug.types.float_number, margin=hug.types.float_number, risk_level=hug.types.float_number))
def findAsn(alpha=0.1, margin=0.05, risk_level=1.0):
"""Return expected sample size for a ballot-polling Risk-Limiting Audit
alpha: maximum risk level (alpha), as a fraction
margin: margin of victory, as a fraction

TODO: enhance to allow for other than a perfect split
between 2 candidates, and various numbers of ballots.
risk_level: risk level for ballots tallied so far.

Model variance for ballot-polling audits, add estimates for quantiles.
Quantile 25th 50th 75th 90th 99th
fraction of mean 0.41 0.71 1.25 2.09 4.64
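For example, with margin=0.2 (ASN 119, per the tests below), the 90th
percentile of the sample size is roughly 2.09 * 119, i.e. about 249 ballots.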

Based on Javascript code in https://www.stat.berkeley.edu/~stark/Java/Html/ballotPollTools.htm
and BRAVO paper section 9.2.

Tests, based on table 1 in BRAVO: Ballot-polling Risk-limiting Audits to Verify Outcomes
Mark Lindeman, Philip B. Stark, Vincent S. Yates
@@ -607,6 +694,10 @@ def findAsn(alpha=0.1, margin=0.05):
2902.0
>>> findAsn(margin=0.2)
119.0
>>> findAsn(margin=0.2,)
119.0

TODO: add tests that use risk_level

v_c: reported votes for the candidate
p_c: reported proportion of ballots with votes for candidate
Expand All @@ -617,6 +708,9 @@ def findAsn(alpha=0.1, margin=0.05):
vw = ballots * (0.5 + margin / 2.)
vl = ballots * (0.5 - margin / 2.)

if vl <= 0:
return 4 # FIXME: for 100% margin, use same value as 99% margin

if (vw > vl):
sw = vw / (vw + vl)
zw = log(2.0 * sw)
Expand All @@ -626,7 +720,7 @@ def findAsn(alpha=0.1, margin=0.05):

logging.debug("%s, %s, %s, %s, %s, %s, %s, %s, %s, %s" % (alpha, margin, ballots, vw, vl, sw, zw, zl, pw, pl))

-asn = ceil((log(1.0 / alpha) + zw / 2.0) / (((vw + vl) / ballots) * (pw * zw + pl * zl)))
+asn = ceil((log(1.0 / alpha * risk_level) + zw / 2.0) / (((vw + vl) / ballots) * (pw * zw + pl * zl)))

else:
asn = float('nan')
@@ -738,8 +832,12 @@ def main(parser):
sys.exit(0)

if opts.polling:
-samplesize = findAsn(opts.alpha / 100.0, opts.margin / 100.0)
-print("Sample size = %d for ballot polling, margin %g%%, risk %g%%" % (samplesize, opts.margin, opts.alpha))
+if opts.level:
+    risk_level = ballot_polling_risk_level(opts.winnervotes, opts.loservotes, opts.winnersamples, opts.losersamples)
+    print("Risk level: %.4g" % risk_level)
+else:
+    samplesize = findAsn(opts.alpha / 100.0, opts.margin / 100.0, opts.risk_level / 100.0)
+    print("Sample size = %d for ballot polling, margin %g%%, risk %g%%" % (samplesize, opts.margin, opts.alpha))

elif opts.nmin:
samplesize = nmin(opts.alpha / 100.0, opts.gamma, opts.margin / 100.0, opts.o1, opts.o2, opts.u1, opts.u2)
49 changes: 49 additions & 0 deletions audit_cvrs/test.py
@@ -0,0 +1,49 @@
"""Test rlacalc
Use hypothesis testing framework:
https://hypothesis.readthedocs.io/en/latest/quickstart.html

TODO:
see what's up with really small margins, e.g.
falsified: test_nmin(alpha=1e-06, gamma=1.001, margin=1e-10, o1=0, o2=0, u1=0, u2=0)

"""

import sys
# TODO: get pytest working without this and without python3 -m pytest
#sys.path.insert(0, '/home/neal/py/projects/audit_cvrs/audit_cvrs')

import logging
logging.basicConfig(filename='hypothesis-test.log', level=logging.DEBUG)
logging.debug("pytest path: %s" % sys.path)

import rlacalc

# print("raw nmin test: %s" % rlacalc.nmin(0.05, 1.03905, 0.02, 0, 0, 0, 0))

from hypothesis import given, settings, Verbosity, example, assume

import hypothesis.strategies as st

@given(st.floats(10**-6, 1.01),
st.floats(1.01, 10.0),
st.floats(10**-6, 1.01),
st.integers(0, 100), st.integers(0, 100), st.integers(0, 100), st.integers(0, 100))
@settings(max_examples=1000)
@example(0.05, 1.03905, 0.02, 1, 1, 1, 1)
def test_nmin(alpha, gamma, margin, o1, o2, u1, u2):

assume(0.0 < alpha <= 1.0)
assume(0.0 < margin <= 1.0)
assume(gamma > 1.0)
assume(not (o1 < 0 or o2 < 0 or u1 < 0 or u2 < 0))

samples = rlacalc.nmin(alpha, gamma, margin, o1, o2, u1, u2)
assert samples >= 0
assert rlacalc.KM_P_value(samples, gamma, margin, o1, o2, u1, u2) <= alpha, "Didn't meet alpha; samples = %d" % samples

"""
perhaps useful?
try: ...nmin...
except OverflowError:
assume(False)
"""