Lecture Six: Overview of Bayesian Modeling
What is Bayesian Statistics?
Simplest Definition: Bayesian Statistics = Probability Theory (more formally, Bayesian Statistics applies the rules of probability to reasoning under uncertainty). Our goal is to illustrate the workings of Bayesian Statistics with simple examples.
Example One: Microwave Selection
Suppose I am shopping for a new microwave. I find two choices, both of which cost about the same amount:
- Microwave A has 3 positive reviews and 0 negative reviews
- Microwave B has 19 positive reviews and 1 negative review
Which one should I buy?
Let us attempt to use Bayesian Statistics to answer this question. The goal is to calculate the probability that Microwave A is better than Microwave B given the observed data on reviews. More mathematically \begin{equation*} \mathbb{P} \left\{\text{Microwave A is better than Microwave B} ~ \vert ~ \text{observed data} \right\} \label{pmw1}\tag{1} \end{equation*}
We obviously need to make some assumptions in order to calculate this probability. These assumptions will be collectively referred to as a probability model. For defining the probability model, it will be convenient to introduce some basic notation. Let \begin{align*} \theta_A := \text{Quality of Microwave A} ~~ \text{ and } ~~ \theta_B := \text{Quality of Microwave B} \end{align*} $\theta_A$ and $\theta_B$ will be parameters inside our probability model. They are unknown and our goal is to infer them from the observed data on reviews. In terms of these parameters, the required probability is simply: \begin{align*} \mathbb{P} \left\{\theta_A > \theta_B ~ \vert ~ \text{observed data} \right\} \label{pmw2}\tag{2} \end{align*}
Let us also use the following mathematical notation for the observed data: $+_A = 3$ (number of positive reviews for A), $-_A = 0$ (number of negative reviews for A), $+_B = 19$ (number of positive reviews for B), and $-_B = 1$ (number of negative reviews for B). The required probability can then be written as \begin{align*} \mathbb{P} \left\{ \theta_A > \theta_B \vert +_A = 3, -_A = 0, +_B = 19, -_B = 1 \right\} \end{align*}
This probability is an example of a posterior probability (in general, a posterior probability in Bayesian statistics refers to a conditional probability statement involving the parameters, conditional on the observed data). Before calculating this probability, let us aim to solve the following two simpler problems:
- Calculate the posterior distribution of $\theta_A$ given the reviews for A: $+_A = 3, -_A = 0$
- Calculate the posterior distribution of $\theta_B$ given the reviews for B: $+_B = 19, -_B = 1$. We will then put together the answers for these and calculate \eqref{pmw2}.
Let us focus on solving the first problem (for the microwave A). The problem for the second microwave will be entirely analogous.
To calculate posterior probabilities, two sets of probability assumptions are generally used:
Prior: Here we specify the unconditional (or marginal) probability distribution of the parameters. You can think of the prior as reflecting the uncertainty in the parameters before observing any data. In this particular problem, our parameter is $\theta_A$ which is supposed to reflect the quality of Microwave A. To specify the prior distribution for $\theta_A$, we can ask the question: "What do we think of the quality of Microwave A before observing any review data?" Here is a simple prior for $\theta_A$. Suppose that $\theta_A$ takes values between 0 and 1 with 0 representing lowest possible quality and 1 representing the highest possible quality. To further simplify things, let us assume that $\theta_A$ is a discrete variable taking values in the set $\{0, 0.01, 0.02, \dots, 0.98, 0.99, 1\}$. Now we have to assign a probability distribution over this discrete set to reflect our prior assumption on the quality of the microwave $A$. Let us assume that \begin{align*} \theta_A \sim \text{uniform}\{0, 0.01, 0.02, \dots, 0.98, 0.99, 1\}. \end{align*} In other words, for every $u$ in this discrete set, \begin{align*} \mathbb{P} \left\{\theta_A = u \right\} = \frac{1}{101} \end{align*}
Likelihood: Here we specify the conditional probability of the observed dataset given specific values of the unknown parameters. The likelihood is where the unknown parameters are "connected" to the observed data. In this problem, here is a simple probability assumption for writing the likelihood: each review for microwave A is Bernoulli with parameter $\theta_A$. Further assume independence of the different reviews. This gives the following formula for the likelihood: \begin{align*} \mathbb{P} \left\{\text{observed reviews for A} \mid \theta_A = u\right\} = \mathbb{P} \left\{+_A = 3, -_A = 0 \vert \theta_A = u\right\} = u^3 \end{align*}
It might seem strange that we have specified a prior and likelihood without formally defining what we mean by "quality". Here are some possible interpretations for $\theta_A$ that make sense with regard to the above prior and likelihood:
- Probability of a positive review: Based on the likelihood, $\theta_A$ can be interpreted as the probability that someone leaves a positive review for the Microwave A. In this interpretation, the prior becomes a probability distribution for a probability (is this confusing?)
- Population proportion of positive reviews: $\theta_A$ is sometimes interpreted as the proportion of positive reviews if everyone in the population leaves a review for Microwave A.
- Performance interpretation: $\theta_A$ can be interpreted as the proportion of usage instances where a specific user will be satisfied with the performance of the microwave.
Which of these (or possibly other) interpretations do you prefer, and why?
Analogously, we have the following prior and likelihood for B: \begin{align*} \theta_B \sim \text{uniform}\{0, 0.01, 0.02, \dots, 0.98, 0.99, 1\} ~~ \text{ and } ~~ \mathbb{P} \left\{\text{observed reviews for B} \mid \theta_B = u \right\} = u^{19} (1 - u) \end{align*} These priors and likelihoods can be calculated in Python using the code below.
import numpy as np
#Specify the priors for theta_A and theta_B
#First let us list out all possible values for theta_A and theta_B
resolution = 0.01
theta_A_values = np.arange(0, 1+resolution, resolution)
print(theta_A_values)
theta_B_values = np.arange(0, 1+resolution, resolution)
print(theta_B_values)
#Now we specify the prior probabilities
prior_A = np.full(len(theta_A_values), 1/len(theta_A_values))
prior_B = np.full(len(theta_B_values), 1/len(theta_B_values))
print(prior_A)
Output: theta_A_values and theta_B_values are both the grid 0.00, 0.01, ..., 0.99, 1.00 (101 values), and every entry of prior_A equals 1/101 ≈ 0.00990099.
#Plot the prior probabilities:
import matplotlib.pyplot as plt
plt.vlines(theta_A_values, ymin = 0, ymax = prior_A, color = 'b')
plt.xlabel("Possible Values for theta_A")
plt.ylabel("Probability")
plt.show()
plt.vlines(theta_B_values, ymin = 0, ymax = prior_B, color = 'b')
plt.xlabel("Possible Values for theta_B")
plt.ylabel("Probability")
plt.show()
Here is how the likelihood is computed and visualized.
#Likelihood Computation (this is the only place where the observed data enters the calculation)
#Since the likelihood is of product form (i.e., a function of theta_A multiplied by another function of theta_B),
#we can compute the likelihood of A and likelihood of B separately. Overall likelihood is the product of these two separate likelihoods.
plus_A = 3
minus_A = 0
likelihood_A = (theta_A_values ** plus_A) * ((1 - theta_A_values) ** minus_A)
plus_B = 19
minus_B = 1
likelihood_B = (theta_B_values ** plus_B) * ((1 - theta_B_values) ** minus_B)
#Let us plot the likelihoods
plt.vlines(theta_A_values, ymin = 0, ymax = likelihood_A, color = 'b', linewidth = 2)
plt.xlabel("Possible Values for theta_A")
plt.ylabel("Likelihood")
plt.show()
plt.vlines(theta_B_values, ymin = 0, ymax = likelihood_B, color = 'b', linewidth = 2)
plt.xlabel("Possible Values for theta_B")
plt.ylabel("Likelihood")
plt.show()
#Note that the scales in the two plots are different (likelihoods across different problems cannot be directly compared)
With the specifications for the prior and likelihood, we can proceed to calculate posterior probabilities. This is done via the Bayes rule. To calculate the posterior distribution of $\theta_A$, write \begin{align*} \mathbb{P}\{\theta_A = u \mid \text{observed reviews for A}\} = \frac{\mathbb{P}\{\theta_A = u\} \mathbb{P}\{\text{observed reviews for A} \mid \theta_A = u\}}{\mathbb{P} \{\text{observed reviews for A}\}} \label{br1}\tag{3} \end{align*} In the fraction on the right hand side above, numerator = prior $\times$ likelihood, and \begin{align*} \text{denominator} &= \text{marginal probability of the observed reviews for A} \\ &= \mathbb{P} \{\text{observed reviews for A without any conditioning on } \theta_A\} \\ &= \sum_{v} \mathbb{P} \{\theta_A = v\}\mathbb{P}\{\text{observed reviews for A} \mid \theta_A = v\} \end{align*} We can thus rewrite \eqref{br1} as \begin{align*} \mathbb{P}\{\theta_A = u \mid \text{observed reviews for A}\} = \frac{\mathbb{P}\{\theta_A = u\} \mathbb{P}\{\text{observed reviews for A} \mid \theta_A = u\}}{\sum_{v} \mathbb{P} \{\theta_A = v\}\mathbb{P}\{\text{observed reviews for A} \mid \theta_A = v\}} \label{br2}\tag{4} \end{align*} The numerator on the right hand side above (prior $\times$ likelihood) is often referred to as the unnormalized posterior. Another commonly written relation is: \begin{align*} \text{posterior} \propto \text{prior} \times \text{likelihood} \end{align*} where the symbol $\propto$ is read as "proportional to". In this case, this means \begin{align*} \mathbb{P}\{\theta_A = u \mid \text{observed reviews for A}\} \propto \mathbb{P}\{\theta_A = u\} \mathbb{P}\{\text{observed reviews for A} \mid \theta_A = u\}. \end{align*} This is just a loose version of \eqref{br2}. The idea is that the term that is missing ($\sum_{v} \mathbb{P} \{\theta_A = v\}\mathbb{P}\{\text{observed reviews for A} \mid \theta_A = v\}$) does not depend on $u$ and can be recovered by the fact that the left hand side needs to sum to one over $u$.
Plugging in our formulae for the prior and likelihood, we get \begin{align*} \mathbb{P}\{\theta_A = u \mid \text{observed reviews for A}\} = \frac{\frac{1}{101} u^3}{\sum_{v \in \{0, 0.01, 0.02, \dots, 0.98, 0.99, 1\}} \frac{1}{101} v^3} \end{align*} for each $u \in \{0, 0.01, \dots, 0.99, 1\}$. Analogously, we have \begin{align*} \mathbb{P}\{\theta_B = u \mid \text{observed reviews for B}\} = \frac{\frac{1}{101} u^{19} (1-u)}{\sum_{v \in \{0, 0.01, 0.02, \dots, 0.98, 0.99, 1\}} \frac{1}{101} v^{19} (1-v)} \end{align*} These posterior probabilities can be computed in Python as follows.
#Posterior Probability Computation
posterior_A_unnormalized = prior_A * likelihood_A
posterior_A = posterior_A_unnormalized / np.sum(posterior_A_unnormalized)
#Let us plot the posterior probabilities
plt.vlines(theta_A_values, ymin = 0, ymax = posterior_A, color = 'b', linewidth = 2)
plt.xlabel("Possible Values for theta_A")
plt.ylabel("Posterior Probability")
plt.show()
posterior_B_unnormalized = prior_B * likelihood_B
posterior_B = posterior_B_unnormalized / np.sum(posterior_B_unnormalized)
#Let us plot the posterior probabilities
plt.vlines(theta_B_values, ymin = 0, ymax = posterior_B, color = 'b', linewidth = 2)
plt.xlabel("Possible Values for theta_B")
plt.ylabel("Posterior Probability")
plt.show()
Let us now compute the posterior probability that $\theta_A < \theta_B$. For this, we need the joint posterior distribution of both the parameters $\theta_A$ and $\theta_B$. If we assume that $\theta_A$ and $\theta_B$ are a priori independent, then they will be independent a posteriori as well and we can write \begin{align*} \mathbb{P} \left\{\theta_A = u_A, \theta_B = u_B \mid \text{observed reviews for both} \right\} &= \mathbb{P}\{\theta_A = u_A \mid \text{observed reviews for A}\} \times \mathbb{P}\{\theta_B = u_B \mid \text{observed reviews for B}\} \\ &= \frac{\frac{1}{101} u_A^3}{\sum_{v_A \in \{0, 0.01, 0.02, \dots, 0.98, 0.99, 1\}} \frac{1}{101} v_A^3} \times \frac{\frac{1}{101} u_B^{19} (1-u_B)}{\sum_{v_B \in \{0, 0.01, 0.02, \dots, 0.98, 0.99, 1\}} \frac{1}{101} v_B^{19} (1-v_B)} \end{align*} From here the required posterior probability that $\theta_A < \theta_B$ is easily calculated as \begin{align*} \mathbb{P} \left\{\theta_A < \theta_B \mid \text{observed reviews for both} \right\} &= \sum_{u_A < u_B} \mathbb{P} \left\{\theta_A = u_A, \theta_B = u_B \mid \text{observed reviews for both} \right\} \\ &= \frac{\sum_{u_A < u_B}\frac{1}{101} u_A^3 \frac{1}{101} u_B^{19} (1-u_B)}{\sum_{v_A, v_B}\frac{1}{101} v_A^3 \frac{1}{101} v_B^{19} (1-v_B)} \end{align*} We can similarly write down related posterior probabilities like that of $\theta_A \leq \theta_B$: \begin{align*} \mathbb{P} \left\{\theta_A \leq \theta_B \mid \text{observed reviews for both} \right\} &= \sum_{u_A \leq u_B} \mathbb{P} \left\{\theta_A = u_A, \theta_B = u_B \mid \text{observed reviews for both} \right\} \\ &= \frac{\sum_{u_A \leq u_B}\frac{1}{101} u_A^3 \frac{1}{101} u_B^{19} (1-u_B)}{\sum_{v_A, v_B}\frac{1}{101} v_A^3 \frac{1}{101} v_B^{19} (1-v_B)} \end{align*} These probabilities can be calculated in Python as follows:
#Required Probability Calculation
#Joint Probability Matrix
joint_posterior = np.outer(posterior_A, posterior_B)
print(joint_posterior.shape)
print(joint_posterior)
#Posterior probability that theta_A <= theta_B
probAleqB = np.sum(np.triu(joint_posterior))
print(probAleqB)
#Posterior probability that theta_A >= theta_B
probAgeqB = np.sum(np.tril(joint_posterior))
print(probAgeqB)
#Posterior probability that theta_A < theta_B
probAstrictlyworseB = np.sum(np.triu(joint_posterior, k = 1))
print(probAstrictlyworseB)
#Posterior probability that theta_A > theta_B
probAstrictlybetterB = np.sum(np.tril(joint_posterior, k = -1))
print(probAstrictlybetterB)
#Posterior probability that theta_A = theta_B
probAeqB = np.trace(joint_posterior)
print(probAeqB)
Output: the joint posterior has shape (101, 101); the printed probabilities are approximately 0.7002 (theta_A <= theta_B), 0.3296 (theta_A >= theta_B), 0.6704 (theta_A < theta_B), 0.2998 (theta_A > theta_B), and 0.0298 (theta_A = theta_B).
The probability that B is at least as good as A is 0.70. The probability that A is at least as good as B is 0.33. The probability that B is strictly better than A is 0.67. The probability that A is strictly better than B is 0.3. The probability that A and B are equally good is 0.03.
The value of Bayesian analysis in this simple problem is that it assigns specific probabilities to the intuitive notion that Microwave B is better than A.
Repeat the above analysis and see how the results change for:
- A finer grid resolution (say 0.001).
- All review counts multiplied by a constant factor, say 10, i.e., $+_A = 30, -_A = 0$ and $+_B = 190, -_B = 10$. (A reusable helper for these variations is sketched below.)
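For convenience, here is a minimal sketch (under the same uniform-prior, Bernoulli-likelihood assumptions as above; the function name posterior_prob_A_less_B is just illustrative) that wraps the discrete-grid calculation into a single function, so that both variations in the exercise can be run by changing the arguments.
#A small helper (illustrative sketch) wrapping the discrete-grid analysis from above
def posterior_prob_A_less_B(plus_A, minus_A, plus_B, minus_B, resolution = 0.01):
    #Grid of possible quality values (linspace avoids floating-point issues for very fine grids)
    theta_values = np.linspace(0, 1, int(round(1/resolution)) + 1)
    #Uniform prior over the grid
    prior = np.full(len(theta_values), 1/len(theta_values))
    #Bernoulli likelihoods for the two microwaves
    likelihood_A = (theta_values ** plus_A) * ((1 - theta_values) ** minus_A)
    likelihood_B = (theta_values ** plus_B) * ((1 - theta_values) ** minus_B)
    #Posteriors via Bayes rule (normalize prior times likelihood)
    posterior_A = prior * likelihood_A
    posterior_A = posterior_A / np.sum(posterior_A)
    posterior_B = prior * likelihood_B
    posterior_B = posterior_B / np.sum(posterior_B)
    #Joint posterior under independence; sum the strict upper triangle for P(theta_A < theta_B)
    joint = np.outer(posterior_A, posterior_B)
    return np.sum(np.triu(joint, k = 1))
#Original data, then the two variations from the exercise
print(posterior_prob_A_less_B(3, 0, 19, 1))
print(posterior_prob_A_less_B(3, 0, 19, 1, resolution = 0.001))
print(posterior_prob_A_less_B(30, 0, 190, 10))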
Analysis with Continuous Priors
Most often, this analysis is done with continuous priors as opposed to the discretized priors as we have used. More specifically, instead of the discrete prior: \begin{align*} \theta_A, \theta_B \overset{\text{i.i.d}}{\sim} \text{uniform}\{0, 0.01, 0.02, \dots, 0.98, 0.99, 1\}, \end{align*} one uses the continuous uniform prior on the interval $[0, 1]$: \begin{align*} \theta_A, \theta_B \overset{\text{i.i.d}}{\sim} \text{uniform}[0, 1]. \end{align*} Recall that continuous distributions are usually described in terms of probability density functions. The continuous distribution on $[0, 1]$ corresponds to the probability density function that is equal to 1 in the entire range $[0, 1]$. Thus \begin{align*} f_{\theta_A}(u) = I\{0 \leq u \leq 1\} ~~ \text{ and } ~~ f_{\theta_B}(u) = I\{0 \leq u \leq 1\}. \end{align*} The likelihood stays the same as before. The posterior distributions for $\theta_A$ and $\theta_B$ will also be described in terms of probability density functions. These posterior density functions will be calculated from the prior density functions and the likelihoods by Bayes rule: \begin{align*} f_{\theta_A \mid \text{observed reviews for A}}(u) &= \frac{f_{\theta_A}(u) \mathbb{P}\{\text{observed reviews for A} \mid \theta_A = u\}}{\mathbb{P} \{\text{observed reviews for A}\}} \\ &= \frac{f_{\theta_A}(u) \mathbb{P}\{\text{observed reviews for A} \mid \theta_A = u\}}{\int f_{\theta_A}(v) \mathbb{P}\{\text{observed reviews for A} \mid \theta_A = v\} dv} \\ &= \frac{I\{0 \leq u \leq 1\} \times u^3}{\int I\{0 \leq v \leq 1\} \times v^3 dv} = \frac{I\{0 \leq u \leq 1\} \times u^3}{\int_0^1 v^3 dv} = 4 I\{0 \leq u \leq 1\}u^3. \end{align*} Similarly \begin{align*} f_{\theta_B \mid \text{observed reviews for B}}(u) = \frac{I\{0 \leq u \leq 1\} \times u^{19} (1-u)}{\int I\{0 \leq v \leq 1\} \times v^{19} (1-v) dv} = \frac{I\{0 \leq u \leq 1\} u^{19} (1-u)}{\int_0^1 v^{19} (1-v) dv} = 420 I\{0 \leq u \leq 1\} u^{19} (1-u) \end{align*} Both the above posterior densities are special cases of densities corresponding to the Beta distribution. For two positive real numbers $a$ and $b$, the $\text{Beta}(a, b)$ distribution corresponds to the density: \begin{align*} f_{\text{Beta}(a, b)}(u) = \frac{u^{a-1} (1-u)^{b-1} I\{0 \leq u \leq 1\}}{\int_0^1 u^{a-1} (1-u)^{b-1} du} \end{align*} We can thus write: \begin{align*} \theta_A \mid \text{observed reviews for A} \sim \text{Beta}(+_A + 1, -_A + 1) = \text{Beta}(4, 1) ~~ \text{ and } ~~ \theta_B \mid \text{observed values for B} \sim \text{Beta}(+_B + 1, -_B + 1) = \text{Beta}(20, 2). \end{align*}
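As a quick sanity check on the normalizing constants derived above, the Beta function can be evaluated numerically (a small sketch using scipy.special.beta; $1/B(4,1)$ should equal 4 and $1/B(20,2)$ should equal 420).
from scipy.special import beta as beta_function
#The Beta function B(a, b) is the integral of u^(a-1) (1-u)^(b-1) over [0, 1]
print(1 / beta_function(4, 1))    #should print 4.0 (up to floating-point error)
print(1 / beta_function(20, 2))   #should print 420.0 (up to floating-point error)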
#Plotting the Posterior Beta densities for theta_A and theta_B:
from scipy.stats import beta
a = plus_A + 1
b = minus_A + 1
x = np.linspace(0, 1, 1000)
y = beta.pdf(x, a, b)
plt.plot(x, y, label = f"Beta({a}, {b})")
plt.title("Beta Distribution")
plt.xlabel("x")
plt.ylabel("Density")
plt.legend()
plt.show()
a = plus_B + 1
b = minus_B + 1
x = np.linspace(0, 1, 1000)
y = beta.pdf(x, a, b)
plt.plot(x, y, label = f"Beta({a}, {b})")
plt.title("Beta Distribution")
plt.xlabel("x")
plt.ylabel("Density")
plt.legend()
plt.show()
#These continuous posterior densities look very similar to the ones we obtained previously with discrete priors
With the continuous posterior densities, we can calculate the required posterior probability that $\theta_A < \theta_B$ as follows: \begin{align*} &\mathbb{P}\left\{\theta_A < \theta_B \mid \text{observed reviews for both} \right\} \\ &= \int \int I\{u < v\} 4 u^3 I\{0 \leq u \leq 1\} 420 v^{19} (1-v) I\{0 \leq v \leq 1\} du dv \\ &= 1680 \int_0^1 \left(\int_0^v u^3 du \right) v^{19} (1-v) dv \\ &= 420 \int_0^1 v^{23} (1 - v) dv \\ &= 420 \left( \int_0^1 v^{23} dv - \int_0^1 v^{24} dv \right) = 420 \left(\frac{1}{24} - \frac{1}{25} \right) = 0.7 \end{align*} Thus we can assign a posterior probability of 0.7 for the proposition that microwave B is better than microwave A.
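As a check on this closed-form answer, the same double integral can be evaluated numerically (a small sketch using scipy.integrate.dblquad; the inner variable is $u$ and the outer variable is $v$).
from scipy.integrate import dblquad
#Integrate the joint posterior density 4 u^3 * 420 v^19 (1 - v) over the region u < v
value, error = dblquad(lambda u, v: 4 * u**3 * 420 * v**19 * (1 - v), 0, 1, lambda v: 0, lambda v: v)
print(value)   #should be very close to 0.7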
It is nice that we were able to calculate the required posterior probability in closed form. In other situations, say when $+_A = 30, -_A = 0, +_B = 190, -_B = 10$, it might be difficult or tedious to evaluate the integrals involved. In such situations, it makes sense to approximate the integral by Monte Carlo. Here is a Monte Carlo estimate of $\mathbb{P}\left\{\theta_A < \theta_B \mid \text{observed reviews for both} \right\}$:
- Fix a large value of $N$ (say $N = 20000$)
- Generate N i.i.d samples $\theta_A^{(1)}, \dots, \theta_A^{(N)}$ from the posterior distribution $\text{Beta}(+_A + 1, -_A + 1) = \text{Beta}(4, 1)$ of $\theta_A$.
- Generate N i.i.d samples $\theta_B^{(1)}, \dots, \theta_B^{(N)}$ from the posterior distribution $\text{Beta}(+_B + 1, -_B + 1) = \text{Beta}(20, 2)$ of $\theta_B$.
- The required posterior probability of $\theta_A < \theta_B$ is approximated by the proportion of pairs $(\theta_A^{(i)}, \theta_B^{(i)})$ for which $\theta_A^{(i)} < \theta_B^{(i)}$: \begin{align*} \frac{1}{N} \sum_{i=1}^N I\{\theta_A^{(i)} < \theta_B^{(i)}\} \end{align*} This can be done in Python as follows.
#With the continuous uniform prior, i.e., a Beta(a, b) prior with a = b = 1 (a and b are set below).
#Posterior for theta_A is Beta(+_A + a, -_A + b) and the posterior for theta_B is Beta(+_B + a, -_B + b).
#To calculate the posterior probability that theta_A is strictly smaller than theta_B, we can discretize as before.
#An alternative approach uses Monte Carlo.
N = 20000
plus_A = 3
minus_A = 0
plus_B = 19
minus_B = 1
a = 1
b = 1
beta_samples_1 = np.random.beta(plus_A + a, minus_A + b, N)
beta_samples_2 = np.random.beta(plus_B + a, minus_B + b, N)
proportion_A_less_B = np.sum(beta_samples_1 < beta_samples_2)/N
print(proportion_A_less_B)
0.69815
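The Monte Carlo estimate is subject to sampling error; a rough sketch of its standard error (using the standard formula $\sqrt{p(1-p)/N}$ for an estimated proportion) shows that the value above agrees with the exact answer 0.7 up to Monte Carlo error.
#Approximate standard error of the Monte Carlo estimate of a proportion: sqrt(p (1 - p) / N)
p_hat = np.mean(beta_samples_1 < beta_samples_2)
standard_error = np.sqrt(p_hat * (1 - p_hat) / N)
print(standard_error)   #roughly 0.003 for N = 20000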
In the next class, we shall look at a more general Bayesian analysis of this problem with possibly non-uniform Beta priors. We shall look at a more realistic data example where Bayesian analysis gives significantly improved results.