From 8d49545b4111532f459b8f25aeb1e378ac959cc5 Mon Sep 17 00:00:00 2001
From: Peter Hurford <peter@peterhurford.com>
Date: Sat, 8 Oct 2022 17:28:19 -0500
Subject: [PATCH] Add integration tests

---
 tests/integration.py | 313 +++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 313 insertions(+)
 create mode 100644 tests/integration.py

diff --git a/tests/integration.py b/tests/integration.py
new file mode 100644
index 0000000..e0e218a
--- /dev/null
+++ b/tests/integration.py
@@ -0,0 +1,313 @@
+import random
+import numpy as np
+import squigglepy as sq
+from squigglepy.numbers import K, M
+from squigglepy import bayes
+
+
+sq.set_seed(42)
+random.seed(42)
+
+
+print('Test 1...')
+pop_of_ny_2022 = sq.to(8.1*M, 8.4*M)
+
+
+def pct_of_pop_w_pianos():
+    percentage = sq.to(.2, 1)
+    return sq.sample(percentage) * 0.01
+
+
+def piano_tuners_per_piano():
+    pianos_per_piano_tuner = sq.to(2*K, 50*K)
+    return 1 / sq.sample(pianos_per_piano_tuner)
+
+
+def total_tuners_in_2022():
+    return (sq.sample(pop_of_ny_2022) *
+            pct_of_pop_w_pianos() *
+            piano_tuners_per_piano())
+
+
+out = sq.get_percentiles(sq.sample(total_tuners_in_2022, n=1000), digits=1)
+expected = {1: 0.3, 5: 0.6, 10: 0.9, 20: 1.5, 30: 2.2, 40: 2.9,
+            50: 3.8, 60: 4.9, 70: 6.8, 80: 9.8, 90: 14.5,
+            95: 23.9, 99: 39.5}
+if out != expected:
+    print('ERROR 1')
+    import pdb
+    pdb.set_trace()
+
+
+print('Test 2...')
+# Time in years after 2022
+
+
+def pop_at_time(t):
+    avg_yearly_pct_change = sq.to(-0.01, 0.05)
+    return sq.sample(pop_of_ny_2022) * ((sq.sample(avg_yearly_pct_change) + 1) ** t)
+
+
+def total_tuners_at_time(t):
+    return (pop_at_time(t) *
+            pct_of_pop_w_pianos() *
+            piano_tuners_per_piano())
+
+
+# Get total piano tuners at 2030
+out = sq.get_percentiles(sq.sample(lambda: total_tuners_at_time(2030-2022), n=1000), digits=1)
+expected = {1: 0.3, 5: 0.7, 10: 1.0, 20: 1.8, 30: 2.7, 40: 3.5, 50: 4.5, 60: 6.1,
+            70: 8.1, 80: 11.4, 90: 18.8, 95: 26.6, 99: 67.5}
+
+if out != expected:
+    print('ERROR 2')
+    import pdb
+    pdb.set_trace()
+
+
+print('Test 3...')
+# Normal distribution
+sq.sample(sq.norm(1, 3))  # 90% interval from 1 to 3
+
+# Distribution can be sampled with mean and sd too
+sq.sample(sq.norm(mean=0, sd=1))
+sq.sample(sq.norm(-1.67, 1.67))  # This is equivalent to mean=0, sd=1
+
+# Get more than one sample
+sq.sample(sq.norm(1, 3), n=100)
+
+# Other distributions exist
+sq.sample(sq.lognorm(1, 10))
+sq.sample(sq.tdist(1, 10, t=5))
+sq.sample(sq.triangular(1, 2, 3))
+sq.sample(sq.binomial(p=0.5, n=5))
+sq.sample(sq.beta(a=1, b=2))
+sq.sample(sq.bernoulli(p=0.5))
+sq.sample(sq.poisson(10))
+sq.sample(sq.gamma(3, 2))
+sq.sample(sq.exponential(scale=1))
+
+# Discrete sampling
+sq.sample(sq.discrete({'A': 0.1, 'B': 0.9}))
+
+# Can return integers
+sq.sample(sq.discrete({0: 0.1, 1: 0.3, 2: 0.3, 3: 0.15, 4: 0.15}))
+
+# Alternate format (also can be used to return more complex objects)
+sq.sample(sq.discrete([[0.1,  0],
+                       [0.3,  1],
+                       [0.3,  2],
+                       [0.15, 3],
+                       [0.15, 4]]))
+
+sq.sample(sq.discrete([0, 1, 2]))  # No weights assumes equal weights
+
+# You can mix distributions together
+sq.sample(sq.mixture([sq.norm(1, 3),
+                      sq.norm(4, 10),
+                      sq.lognorm(1, 10)],  # Distributions to mix
+                     [0.3, 0.3, 0.4]))     # These are the weights on each distribution
+
+# This is equivalent to the above, just a different way of doing the notation
+sq.sample(sq.mixture([[0.3, sq.norm(1, 3)],
+                      [0.3, sq.norm(4, 10)],
+                      [0.4, sq.lognorm(1, 10)]]))
+
+sq.sample(lambda: sq.sample(sq.norm(1, 3)) + sq.sample(sq.norm(4, 5)), n=100)
+sq.sample(lambda: sq.sample(sq.norm(1, 3)) - sq.sample(sq.norm(4, 5)), n=100)
+sq.sample(lambda: sq.sample(sq.norm(1, 3)) * sq.sample(sq.norm(4, 5)), n=100)
+sq.sample(lambda: sq.sample(sq.norm(1, 3)) / sq.sample(sq.norm(4, 5)), n=100)
+
+sq.sample(sq.norm(1, 3, credibility=0.8))
+sq.sample(sq.norm(0, 3, lclip=0, rclip=5))
+sq.sample(sq.const(4))
+
+
+def roll_die(sides, n=1):
+    return sq.sample(sq.discrete(list(range(1, sides + 1))), n=n) if sides > 0 else None
+
+
+roll_die(sides=6, n=10)
+
+
+print('Test 4...')
+
+
+def mammography(has_cancer):
+    p = 0.8 if has_cancer else 0.096
+    return bool(sq.sample(sq.bernoulli(p)))
+
+
+def define_event():
+    cancer = sq.sample(sq.bernoulli(0.01))
+    return ({'mammography': mammography(cancer),
+             'cancer': cancer})
+
+
+out = bayes.bayesnet(define_event,
+                     find=lambda e: e['cancer'],
+                     conditional_on=lambda e: e['mammography'],
+                     n=10*K)
+expected = 0.09
+if round(out, 2) != expected:
+    print('ERROR 4')
+    import pdb
+    pdb.set_trace()
+
+
+print('Test 5...')
+out = bayes.simple_bayes(prior=0.01, likelihood_h=0.8, likelihood_not_h=0.096)
+expected = None
+if round(out, 2) != 0.08:
+    print('ERROR 5')
+    import pdb
+    pdb.set_trace()
+
+
+print('Test 6...')
+prior = sq.norm(1, 5)
+prior_samples = sq.sample(prior, n=K)
+evidence = sq.norm(2, 3)
+evidence_samples = sq.sample(evidence, n=K)
+posterior = bayes.update(prior_samples, evidence_samples)
+posterior_samples = sq.sample(posterior, n=K)
+out = (np.mean(posterior_samples), np.std(posterior_samples))
+if round(out[0], 2) != 2.53 and round(out[1], 2) != 0.3:
+    print('ERROR 6')
+    import pdb
+    pdb.set_trace()
+
+
+print('Test 7...')
+average = bayes.average(prior, evidence)
+average_samples = sq.sample(average, n=K)
+out = (np.mean(average_samples), np.std(average_samples))
+if round(out[0], 2) != 2.73 and round(out[1], 2) != 0.97:
+    print('ERROR 7')
+    import pdb
+    pdb.set_trace()
+
+
+print('Test 8...')
+
+
+def p_alarm_goes_off(burglary, earthquake):
+    if burglary and earthquake:
+        return 0.95
+    elif burglary and not earthquake:
+        return 0.94
+    elif not burglary and earthquake:
+        return 0.29
+    elif not burglary and not earthquake:
+        return 0.001
+
+
+def p_john_calls(alarm_goes_off):
+    return 0.9 if alarm_goes_off else 0.05
+
+
+def p_mary_calls(alarm_goes_off):
+    return 0.7 if alarm_goes_off else 0.01
+
+
+def define_event():
+    burglary_happens = bool(sq.sample(sq.bernoulli(p=0.001)))
+    earthquake_happens = bool(sq.sample(sq.bernoulli(p=0.002)))
+    alarm_goes_off = bool(sq.sample(sq.bernoulli(p_alarm_goes_off(burglary_happens,
+                                                                  earthquake_happens))))
+    john_calls = bool(sq.sample(sq.bernoulli(p_john_calls(alarm_goes_off))))
+    mary_calls = bool(sq.sample(sq.bernoulli(p_mary_calls(alarm_goes_off))))
+    return {'burglary': burglary_happens,
+            'earthquake': earthquake_happens,
+            'alarm_goes_off': alarm_goes_off,
+            'john_calls': john_calls,
+            'mary_calls': mary_calls}
+
+
+# What are the chances that both John and Mary call if an earthquake happens?
+out = bayes.bayesnet(define_event,
+                     n=10*K,
+                     find=lambda e: (e['mary_calls'] and e['john_calls']),
+                     conditional_on=lambda e: e['earthquake'])
+if round(out, 2) != 0.1:
+    print('ERROR 8')
+    import pdb
+    pdb.set_trace()
+
+print('Test 9...')
+# If both John and Mary call, what is the chance there's been a burglary?
+out = bayes.bayesnet(define_event,
+                     n=10*K,
+                     find=lambda e: e['burglary'],
+                     conditional_on=lambda e: (e['mary_calls'] and e['john_calls']))
+if round(out, 2) != 0.32:
+    print('ERROR 9')
+    import pdb
+    pdb.set_trace()
+
+
+print('Test 10...')
+
+
+def monte_hall(door_picked, switch=False):
+    doors = ['A', 'B', 'C']
+    car_is_behind_door = random.choice(doors)
+    reveal_door = random.choice([d for d in doors if d != door_picked and d != car_is_behind_door])
+
+    if switch:
+        old_door_picked = door_picked
+        door_picked = [d for d in doors if d != old_door_picked and d != reveal_door][0]
+
+    won_car = (car_is_behind_door == door_picked)
+    return won_car
+
+
+def define_event():
+    door = random.choice(['A', 'B', 'C'])
+    switch = random.random() >= 0.5
+    return {'won': monte_hall(door_picked=door, switch=switch),
+            'switched': switch}
+
+
+RUNS = 10*K
+out = bayes.bayesnet(define_event,
+                     find=lambda e: e['won'],
+                     conditional_on=lambda e: e['switched'],
+                     n=RUNS)
+if round(out, 2) != 0.66:
+    print('ERROR 10')
+    import pdb
+    pdb.set_trace()
+
+
+print('Test 11...')
+out = bayes.bayesnet(define_event,
+                     find=lambda e: e['won'],
+                     conditional_on=lambda e: not e['switched'],
+                     n=RUNS)
+if round(out, 2) != 0.33:
+    print('ERROR 11')
+    import pdb
+    pdb.set_trace()
+
+
+def define_event():
+    flip = sq.flip_coin()
+    if flip == 'heads':
+        dice_sides = 6
+    else:
+        dice_sides = sq.sample(sq.discrete([4, 6, 10, 20]))
+    return sq.roll_die(dice_sides)
+
+
+print('Test 12...')
+out = bayes.bayesnet(define_event,
+                     find=lambda e: e == 6,
+                     n=10*K)
+if round(out, 2) != 0.12:
+    print('ERROR 12')
+    import pdb
+    pdb.set_trace()
+
+
+print('DONE! INTEGRATION TEST SUCCESS!')