PythonProgrammingPuzzles/generators/probability.py at main · NulledExceptions/PythonProgrammingPuzzles · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
"""Probability problems"""

from puzzle_generator import PuzzleGenerator, Tags
from typing import List


# See https://github.com/microsoft/PythonProgrammingPuzzles/wiki/How-to-add-a-puzzle to learn about adding puzzles


class BirthdayParadox(PuzzleGenerator):
    """
    Adaptation of the classic
    [Birthday Problem](https://en.wikipedia.org/wiki/Birthday_problem (Mathematical Problems category)).

    The year length is year_len (365 is earth, while Neptune year is 60,182).
    """

    @staticmethod
    def sat(n: int, year_len=365):
        """Find n such that the probability of two people having the same birthday in a group of n is near 1/2."""
        prob = 1.0
        for i in range(n):
            prob *= (year_len - i) / year_len
        return (prob - 0.5) ** 2 <= 1/year_len

    @staticmethod
    def sol(year_len):
        n = 1
        distinct_prob = 1.0
        best = (0.5, 1)  # (difference between probability and 1/2, n)
        while distinct_prob > 0.5:
            distinct_prob *= (year_len - n) / year_len
            n += 1
            best = min(best, (abs(0.5 - distinct_prob), n))

        return best[1]

    def safe_add(self, **inputs):
        if self.sat(self.sol(**inputs), **inputs):
            self.add(inputs)

    def gen(self, target_num_instances):
        self.safe_add(year_len=60182)  # Neptune year!
        for year_len in range(2, target_num_instances):
            self.safe_add(year_len=year_len)


class BirthdayParadoxMonteCarlo(BirthdayParadox):
    """A slower, Monte Carlo version of the above Birthday Paradox problem."""

    @staticmethod
    def sat(n: int, year_len=365):
        """Find n such that the probability of two people having the same birthday in a group of n is near 1/2."""
        import random
        random.seed(0)
        K = 1000  # number of samples
        prob = sum(len({random.randrange(year_len) for i in range(n)}) < n for j in range(K)) / K
        return (prob - 0.5) ** 2 <= year_len


class BallotProblem(PuzzleGenerator):
    """
    See the [Wikipedia article](https://en.wikipedia.org/wiki/Bertrand%27s_ballot_theorem) or
    or  [Addario-Berry L., Reed B.A. (2008) Ballot Theorems, Old and New. In: Gyori E., Katona G.O.H., Lovász L.,
    Sági G. (eds) Horizons of Combinatorics. Bolyai Society Mathematical Studies, vol 17.
    Springer, Berlin, Heidelberg.](https://doi.org/10.1007/978-3-540-77200-2_1)
    """

    @staticmethod
    def sat(counts: List[int], target_prob=0.5):
        """
        Suppose a list of m 1's and n -1's are permuted at random.
        What is the probability that all of the cumulative sums are positive?
        The goal is to find counts = [m, n] that make the probability of the ballot problem close to target_prob.
        """
        m, n = counts  # m = num 1's, n = num -1's
        probs = [1.0] + [0.0] * n  # probs[n] is probability for current m, starting with m = 1
        for i in range(2, m + 1):  # compute probs using dynamic programming for m = i
            old_probs = probs
            probs = [1.0] + [0.0] * n
            for j in range(1, min(n + 1, i)):
                probs[j] = (
                        j / (i + j) * probs[j - 1]  # last element is a -1 so use probs
                        +
                        i / (i + j) * old_probs[j]  # last element is a 1 so use old_probs, m = i - 1
                )
        return abs(probs[n] - target_prob) < 1e-6

    @staticmethod
    def sol(target_prob):
        for m in range(1, 10000):
            n = round(m * (1 - target_prob) / (1 + target_prob))
            if abs(target_prob - (m - n) / (m + n)) < 1e-6:
                return [m, n]

    def gen_random(self):
        m = self.random.randrange(1, self.random.choice([10, 100, 200, 300, 400, 500, 1000]))
        n = self.random.randrange(1, m + 1)
        target_prob = (m - n) / (m + n)
        self.add(dict(target_prob=target_prob))


class BinomialProbabilities(PuzzleGenerator):
    """See [Binomial distribution](https://en.wikipedia.org/wiki/Binomial_distribution)"""

    @staticmethod
    def sat(counts: List[int], p=0.5, target_prob=1 / 16.0):
        """Find counts = [a, b] so that the probability of  a H's and b T's among a + b coin flips is ~ target_prob."""
        from itertools import product
        a, b = counts
        n = a + b
        prob = (p ** a) * ((1-p) ** b)
        tot = sum([prob for sample in product([0, 1], repeat=n) if sum(sample) == a])
        return abs(tot - target_prob) < 1e-6

    @staticmethod
    def sol(p, target_prob):
        probs = [1.0]
        q = 1 - p
        while len(probs) < 20:
            probs = [(p * a + q * b) for a, b in zip([0] + probs, probs + [0])]
            answers = [i for i, p in enumerate(probs) if abs(p - target_prob) < 1e-6]
            if answers:
                return [answers[0], len(probs) - 1 - answers[0]]

    def gen_random(self):
        probs = [1.0]
        p = self.random.random()
        q = 1 - p
        for n in range(self.random.randrange(1, 11)):
            probs = [(p * a + q * b) for a, b in zip([0] + probs, probs + [0])]
        target_prob = self.random.choice(probs)
        self.add(dict(p=p, target_prob=target_prob))


class ExponentialProbability(PuzzleGenerator):
    """See [Exponential distribution](https://en.wikipedia.org/wiki/Exponential_distribution)"""

    @staticmethod
    def sat(p_stop: float, steps=10, target_prob=0.5):
        """
        Find p_stop so that the probability of stopping in steps or fewer time steps is the given target_prob if you
        stop each step with probability p_stop
        """
        prob = sum(p_stop*(1-p_stop)**t for t in range(steps))
        return abs(prob - target_prob) < 1e-6

    @staticmethod
    def sol(steps, target_prob):
        return 1 - (1 - target_prob) ** (1.0/steps)

    def gen_random(self):
        steps = self.random.randrange(1, 100)
        target_prob = self.random.random()
        self.add(dict(steps=steps, target_prob=target_prob))


if __name__ == "__main__":
    PuzzleGenerator.debug_problems()