Statistical inference from frequentist and Bayesian perspectives¶

In this short notebook we explore the problem of statistical hypothesis testing from a frequentist and a Bayesian perspective. While most people with a degree in the sciences will be at least a little acquainted with the frequentist approach and its famous p-value, its Bayesian counterpart, the Bayes' factor, is much less well known. I am told that Bayesian statistics is often not even covered in many undergraduate degrees in statistics! This is a shame. Although the mathematics underpinning a Bayes' factor for hypothesis testing can be several shades more complex than that underpinning the comparable p-value, the basic intuition behind it is not.

In the first part of the notebook we demonstrate, via simulation, the logic underpinning frequentist hypothesis testing and the calculation of the p-value. The second part does the same for the Bayes' factor. In constructing the second part I leaned heavily on this paper, which I have been recommending to everyone recently. Throughout we use the simple example of testing for a difference between two group means.

Population vs sample¶

To properly understand the logic of inferential statistics, two concepts need to be clear at the outset: the sample and the population. The population is everybody to whom the findings need to be generalized; the sample is the particular subset of the population that was actually measured as part of the experiment. For any quantity of interest in statistics (e.g. the mean) there is an unknown value in the population (usually notated using a character from the Greek alphabet) and a known value obtained from the sample (usually notated with a letter from the Latin alphabet), which will generally differ from the population value.
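As a minimal sketch of this distinction (all the numbers here are made up): if we could measure the whole population we would know the population mean directly; in practice we only see a sample, whose mean is close to, but not equal to, the population value.

```python
import numpy as np

rng = np.random.default_rng(0)

mu = 170.0            # population mean: in real research this is unknown
population_sd = 10.0  # population standard deviation

# the sample: the subset of the population we actually get to measure
sample = rng.normal(loc=mu, scale=population_sd, size=25)
x_bar = sample.mean() # sample mean: known, but not equal to mu

print('population mean (mu)  =', mu)
print('sample mean   (x_bar) =', x_bar)
```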

Statistical inference: the frequentist perspective¶

The alternative hypothesis¶

Let's say we want to know if the heights of people of Dutch descent differ on average from those of people of Flemish Belgian descent. We can formulate this research hypothesis as follows:

$$ H_{A}: \mu_{D} - \mu_{F} \neq 0 $$

$H_{A}:$ is just standard notation for this so-called alternative hypothesis. The character $\mu_{D}$ represents the mean height of the Dutch population (that is of all Dutch people everywhere) and the character $\mu_{F}$ represents the mean height of the Flemish Belgian population. So all we are stating here is that we hypothesise the two means in the population are not equal.

Let's assume this is true and start the simulation. To do so I have selected two mean heights that are roughly (according to Google) the average heights of the two groups, and specify a standard deviation that I made up completely.

In [67]:
import numpy as np
import matplotlib.pyplot as plt
import scipy.stats as scpst
import math
# set up the two populations; assume they are Gaussian with different means
mu_d = 176.5 # mean of the population of Dutch
sd_d = 10. # standard deviation of the population of Dutch

mu_f = 173.59 # mean of the population of Flemish Belgian
sd_f = 10. # standard deviation of the population of Flemish Belgian

If we could measure the height of every Dutch and every Flemish Belgian person we could calculate $\mu_{D}$ and $\mu_{F}$ and test the hypothesis directly. However, in practice we can't. We don't actually ever know $\mu_{D}$ and $\mu_{F}$, so we need to make an inference based on samples drawn from the two populations.

Let's assume we are very poor researchers and can only sample 10 Dutch and 10 Flemish people.

In [68]:
rng = np.random.default_rng(seed=12) # set up random number generator
np.random.seed(5) # also seed in the old way for sampling from distributions not supported by numpy.Generator


n_d = 10 # sample size of the Dutch
n_f = 10 # sample size of the Flemish

sample_d = rng.normal(loc=mu_d,scale=sd_d,size=n_d) # sample the heights of 10 Dutch
sample_f = rng.normal(loc=mu_f,scale=sd_f,size=n_f) # sample the heights of 10 Flemish

xbar_d = np.mean(sample_d) # mean height of the sample of Dutch
xbar_f = np.mean(sample_f) # mean height of the sample of Flemish
xbar_diff = xbar_d - xbar_f # difference between the two sample means

print('Mean height of Dutch sample = '+str(xbar_d))
print('Mean height of Flemish sample = '+str(xbar_f))
print('Difference in sample mean heights = '+str(xbar_diff))
Mean height of Dutch sample = 178.3614720207531
Mean height of Flemish sample = 175.5598796893783
Difference in sample mean heights = 2.801592331374792

So, having taken our two samples, we can see that the sample mean of the Dutch ($\bar{x_{D}}$) is greater than that of the Flemish ($\bar{x_{F}}$). But what can we say about our hypothesis? What does this tell us about the difference between the population means?

Testing against the null hypothesis¶

The way statistical inference works in a frequentist paradigm is a little counter-intuitive, in that the probability of this alternative hypothesis (which is, in every situation I can imagine, the research hypothesis) is never directly quantified or measured. Instead we consider only the complement of the alternative hypothesis, the so-called null hypothesis, and ask to what degree our observations are consistent with it. In this case the null hypothesis ($H_{0}$) is that the two population means are equal: $$H_{0}:\mu_{D} - \mu_{F} = 0 $$

To formulate a test, we ask how the statistic of interest (in this case the difference between the means of two samples of the specified sizes) would vary were the two population means equal (i.e. if the null hypothesis were true).

To simulate, we will sample many times from two identical populations and build up a sampling distribution of the difference between the sample means.

In [69]:
N_REPS = 10000

# sample 10 000 times from a population with a mean of zero
sample_a_null = [rng.normal(loc=0,scale=sd_d, size=n_d) for x in range(N_REPS)]
# sample another 10 000 times from a population with a mean of zero
sample_b_null = [rng.normal(loc=0,scale=sd_f, size=n_f) for x in range(N_REPS)]

# for each pair of samples calculate the difference between the two means
diff_distr_null =  np.array([np.mean(sample_a_null[x])-np.mean(sample_b_null[x]) for x in range(N_REPS)])

# plot the distribution of the results
plt.hist(diff_distr_null,bins = 30)
plt.title('Sampling distribution of the difference between means')
plt.xlabel('Difference between sample means')
plt.ylabel('Count')
plt.show()
[Figure: histogram of the simulated sampling distribution of the difference between means]

This sampling distribution shows the values of the sample mean difference we would expect for our experiment if there was no difference in the population means.

The frequentists reason as follows: if our observed mean difference between the samples is unlikely to have occurred if the null hypothesis is true, then we reject the null hypothesis and, effectively, conclude in favour of the alternative. This is assessed with the (in)famous p-value: the proportion of the sampling distribution that is as or more extreme than the observed sample value. If this probability is low (typically < .05), the null hypothesis is rejected.

In [70]:
# plot again and add a bar showing our observed mean difference
plt.hist(diff_distr_null,bins = 30)
l = plt.axvline(x=xbar_diff,c = [0,1,0])
plt.title('Sampling distribution of the difference between means')
plt.xlabel('Difference between sample means')
plt.ylabel('Count')
plt.legend([l],['Observed\n Mean Difference'])
plt.show()

# calculate the p value
p_val_mean_diff = np.sum(np.abs(diff_distr_null)>np.abs(xbar_diff)) / N_REPS
print('P value = '+ str(p_val_mean_diff))
[Figure: sampling distribution with the observed mean difference marked]
P value = 0.5272

In our example, the p-value is above this threshold so we cannot reject the null hypothesis.

Mathematically more convenient test statistics¶

In practice, the difference between two means is not used as a test statistic. Although with simulations or resampling statistics any test statistic could be devised and tested in this way, before computers one had to rely on statistics whose sampling distribution could be derived mathematically. For this reason, the most frequently used test statistic for the difference between two means is t. There are two versions of the t statistic, the so-called Student's t and Welch's t, but the distinction is not important for the current discussion. The formula for Student's t is:

$$ t = \frac{\bar{x_{1}} - \bar{x_{2}}}{\sqrt{s^{2}_{P} (\frac{1}{n_{1}} + \frac{1}{n_{2}})}}$$

where $\bar{x_{i}}$ and $n_{i}$ are the mean and sample size of the $i^{th}$ group respectively, and $s^{2}_{P}$ is the pooled variance. This measures the dispersion in the data and is the weighted mean of the variances calculated from the two samples:

$$s^{2}_{P}=\frac{s^{2}_{1}n_{1} + s^{2}_{2}n_{2}}{n_{1} + n_{2}}$$

The variance for the $i^{th}$ sample is calculated as:

$$ s^{2}_{i} = \frac {\sum_{k=1}^{n_i} (x_{k} - \bar{x_{i}})^2}{n_{i}} $$

where $x_{k}$ is the $k^{th}$ observation in the sample. In plain English, the variance is the average squared deviation from the sample mean.

Because it will come in handy later on, I will now also introduce another common measure of the size of the difference between two groups: Cohen's d. This is the difference between the sample means normalised by the square root of the pooled variance:

$$d=\frac{ \bar{x_{1}} - \bar{x_{2}}}{\sqrt{s^{2}_{P}}}$$

Also, because I will use it later, I will quickly point out that d is a linear scaling of t: $$ d = t\sqrt{\frac{1}{n_{1}}+\frac{1}{n_{2}}}$$

Correction of n¶

Note that, because it simplifies the equations and makes the logic easier to follow (in my view), I am glossing over the fact that to calculate the true Cohen's d and t, a correction is applied to each sample size. Specifically, 1 is subtracted from the sample sizes in the equations above. Whether or not to apply this correction is controlled in the code below by the 'correction' keyword argument.

In [71]:
# define statistics
def get_n(x,correction = False):
    """
    Returns the length of the vector len(x) if correction == False
    Otherwise returns len(x) - 1
    """
    n = len(x)
    if not correction:
        return n
    return n-1

def variance(x,correction=False):
    """ Compute the sample variance"""
    x_bar = np.mean(x)
    squ_devs = (x-x_bar)**2
    n = get_n(x,correction=correction)
    return np.sum(squ_devs) / n

def pooled_variance(x1,x2,correction=False):
    """Compute the pooled variance for x1 and x2 """
    var1 = variance(x1,correction=correction)
    var2 = variance(x2,correction=correction)
    n1 = get_n(x1,correction=correction)
    n2 = get_n(x2,correction=correction)
    return (var1*n1 + var2*n2) / (n1 + n2)

def t_statistic(x1,x2, correction=False):
    """Compute Student's t statistic for two independent samples"""
    x_bar1 = np.mean(x1)
    x_bar2 = np.mean(x2)
    n1 = get_n(x1, correction=correction)
    n2 = get_n(x2, correction=correction)
    s_p = pooled_variance(x1,x2,correction=correction)
    return (x_bar1 - x_bar2) / np.sqrt(s_p*(1/n1 + 1/n2))

def cohens_d(x1, x2,correction=False):
    """Compute Cohen's d for two independent samples"""
    x_bar1 = np.mean(x1)
    x_bar2 = np.mean(x2)
    return (x_bar1-x_bar2) / np.sqrt(pooled_variance(x1,x2,correction=correction))

def t_to_d(t,n1,n2):
    """Convert a t statistic to Cohen's d"""
    return t*np.sqrt(1/n1+1/n2)

def d_to_t(d,n1,n2):
    """Convert Cohen's d to a t statistic"""
    return d/np.sqrt(1/n1+1/n2)

Sampling distributions of t and Cohen's d¶

To conclude the frequentist part of the notebook I want to point out a couple of things. In principle, all three statistics test the same hypothesis (of no difference between the group means). We can return to our simulation and see that regardless of whether we use the difference between the group means, t or d, we come to practically the same p-value.

In [72]:
# compute null distribution of t
t_distr_null = np.array([t_statistic(sample_a_null[x],sample_b_null[x],correction=True) for x in range(N_REPS)])

# compute null distribution of d
d_distr_null = np.array([cohens_d(sample_a_null[x],sample_b_null[x],correction=True) for x in range(N_REPS)])

obs_t = t_statistic(sample_d,sample_f,correction=True)
obs_d = cohens_d(sample_d,sample_f,correction=True)

# get their p-values from the simulated sampling distributions
p_val_t = np.sum(np.abs(t_distr_null)>np.abs(obs_t)) / N_REPS
p_val_d = np.sum(np.abs(d_distr_null)>np.abs(obs_d)) / N_REPS

# plot sampling distribution of the difference between the means
plt.hist(diff_distr_null,bins = 30)
l1 = plt.axvline(x=xbar_diff,c = [0,1,0])
plt.title('Sampling distribution of the difference between means')
plt.xlabel('Difference between sample means')
plt.ylabel('Count')
plt.legend([l1],['Observed mean\n difference'])
plt.show()

# plot sampling distribution of t
plt.hist(t_distr_null,bins = 30)
l2 = plt.axvline(x=obs_t,c = [0,1,0])
plt.title('Sampling distribution of t')
plt.xlabel('Student\'s t')
plt.ylabel('Count')
plt.legend([l2],['Observed t'])
plt.show()

# plot sampling distribution of d
plt.hist(d_distr_null,bins = 30)
l3 = plt.axvline(x=obs_d,c = [0,1,0])
plt.title('Sampling distribution of d')
plt.xlabel('Cohen\'s d')
plt.ylabel('Count')
plt.legend([l3],['Observed d'])
plt.show()

print('p value (mean diff) = ' + str(p_val_mean_diff))
print('p value (d) = ' + str(p_val_d))
print('p value (t) = ' + str(p_val_t))
[Figures: sampling distributions of the mean difference, t and d, each with the observed value marked]
p value (mean diff) = 0.5272
p value (d) = 0.5397
p value (t) = 0.5397

The reason that t is used in practice is that its sampling distribution can be expressed mathematically:

$$f(t,v) = \frac{\Gamma((v+1)/2)}{ \sqrt{\pi v}\Gamma(v/2) }(1 + t^{2}/v)^{-(v+1)/2}$$

where $v$ is the degrees of freedom, in our case equal to the sum of the two (corrected) sample sizes, i.e. $n_{1}+n_{2}-2$, and $\Gamma$ is the gamma function. Therefore the p-value could be computed exactly without a computer.

In [73]:
# plot the simulated sampling distribution overlaid with the analytical one
def t_sampling_distr_pdf(t,v):
    """Evaluate the analytical pdf of the t distribution with v degrees of freedom"""
    return math.gamma( (v+1) / 2 ) / (np.sqrt(math.pi * v) * math.gamma(v/2)  ) *\
        np.power((1+t**2/v),-(v+1)/2)

def get_degrees_of_freedom(x1,x2,correction=False):
    return get_n(x1,correction=correction) + get_n(x2,correction=correction)

# plot simulated sampling distribution
plt.hist(t_distr_null,bins=30,density = True,label='Simulated') # plot

# plot analytical
t = np.linspace(-4,4,50)
pdf = t_sampling_distr_pdf(t,get_degrees_of_freedom(sample_d,sample_f,correction=True)) # use corrected df to match the simulated t values
plt.plot(t,pdf,label = 'Analytical')
plt.title('Sampling distribution of t')
plt.xlabel('Student\'s t')
plt.ylabel('Density')
plt.legend()
plt.show()
[Figure: simulated vs analytical sampling distribution of t]
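As a quick cross-check, not part of the original analysis: SciPy's `ttest_ind` implements exactly this test, and its p-value agrees with the one obtained by evaluating the analytical t distribution. The two samples below are freshly generated stand-ins, not the notebook's `sample_d` and `sample_f`.

```python
import numpy as np
from scipy import stats

rng = np.random.default_rng(1)
a = rng.normal(loc=176.5, scale=10., size=10)  # stand-in 'Dutch' sample
b = rng.normal(loc=173.59, scale=10., size=10) # stand-in 'Flemish' sample

# Student's t-test with pooled variance (equal_var=True)
t_stat, p_val = stats.ttest_ind(a, b, equal_var=True)

# the same p-value from the analytical t distribution with n1 + n2 - 2 df
df = len(a) + len(b) - 2
p_manual = 2 * stats.t.sf(abs(t_stat), df)

print('t =', t_stat, ' p (scipy) =', p_val, ' p (analytical) =', p_manual)
```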

Statistical inference: the Bayesian perspective¶

A motivation¶

From the frequentist perspective we reject the null hypothesis as a plausible explanation of our data if the p-value (the probability, were the null hypothesis true, of observing a value of the test statistic as or more extreme than the observed one) is less than a specified threshold (by convention, usually .05). Such a result is normally said to be statistically significant.

As we noted before, the p value for our experiment is greater than this threshold. Therefore, we cannot reject the null hypothesis. So what can we conclude?

Well, we can say that our observed difference could have occurred even if there were no difference between the populations ... but not much else. Importantly, we cannot conclude:

  • that there is no difference between the population means (you can see, since the simulated population means are different, that this would be a false conclusion anyway) OR
  • that there is a difference in the population means.

Indeed this is a major weakness of frequentist methods, namely that non-significant findings cannot really be interpreted in a scientifically satisfying or practically very useful way. Researchers often implicitly (and sometimes even explicitly) conflate the absence of evidence of an effect (a non-significant p-value) with evidence for the absence of an effect. You may have heard statements like "there is no significant difference between group A and group B" in the reporting of a non-significant finding. This is not exactly a wrong statement but is often said disingenuously to non-experts with the intention of communicating that the study supports the conclusion that there is no difference between the groups. Which it doesn't.

Anyone who has tried will also know that such non-significant results are hard to publish. I would argue, therefore, that clinging to the frequentist paradigm indirectly incentivises misconduct such as 'p-hacking' and contributes to bias in the scientific literature via the "file-drawer" effect.

Even if for no other reason, it is worth considering the Bayesian alternative to the 'p-value'...

The default Bayes' Factor¶

The so-called default Bayes' factor is a ratio of two probabilities:

$$ \frac{P(data | H_{A})}{P(data | H_{0})} $$

The numerator is the probability of observing our data under the alternative hypothesis, and the denominator is the probability of observing our data under the null hypothesis.

Put simply, the Bayes' factor measures the relative strength of the evidence for the alternative (research) hypothesis over the null hypothesis. Perhaps you can already see that, in contrast to the frequentist approach, with a Bayesian approach it becomes quite possible to conclude in favour of either the null hypothesis or the alternative hypothesis. It also becomes possible to know whether the data are simply inconclusive, and one needs to rethink the experiment or collect more data.
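To make this concrete, here is a deliberately simple, entirely made-up example in which both probabilities can be read straight off a density function: a single observation drawn from a normal distribution with unit standard deviation, testing a point null $\mu = 0$ against a point alternative $\mu = 1$. (In our actual problem the alternative is composite, so $P(data | H_{A})$ has to be averaged over a prior on the effect size, which is what the simulation in the next sections does.)

```python
from scipy import stats

x = 0.8  # a single made-up observation

p_data_h0 = stats.norm.pdf(x, loc=0, scale=1)  # P(data | H0: mu = 0)
p_data_ha = stats.norm.pdf(x, loc=1, scale=1)  # P(data | HA: mu = 1)

bf_a0 = p_data_ha / p_data_h0
print(bf_a0)  # ~1.35: the data are mildly more likely under HA
```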

Simulation overview and rationale¶

As I mentioned in the introduction, the idea for this simulation was borrowed from this paper, which I highly recommend. The idea is to show, with the bare minimum of maths, the intuition behind the Bayes' factor for hypothesis testing.

It is convenient from here on to state our null and alternative hypotheses in terms of the effect size in the population. This is notated $\delta$ to distinguish it from its observed value in the sample, Cohen's $d$. This is, as explained above, the difference between the means normalised by the square root of the pooled variance. So the null hypothesis of no difference between the population means can be re-stated as $\delta$ equalling zero, and the alternative as $\delta$ not equalling zero.

$$ H_{0}: \delta=0 $$ $$ H_{A}: \delta\neq0 $$

In our case specifically, the numerator and denominator of the Bayes' factor, $P(data | H_{A})$ and $P(data | H_{0})$, should be understood as the probability of obtaining our observed value of Cohen's $d$ under the alternative and null hypotheses, respectively. In our simulation, we approximate each element $P(data | H_{A})$ and $P(data | H_{0})$ in the same way:

  1. We draw many random samples from simulated populations where the population effect size $\delta$ is consistent with the hypothesis ($H_{0}$ or $H_{A}$).
  2. For each sample we calculate Cohen's $d$.
  3. We calculate the proportion of times these values are very close to our observed value of Cohen's $d$.

The prior distributions¶

Before we can begin we need to decide which values of the population effect size $\delta$ are plausible under each hypothesis. Our expectations are modelled by two prior distributions, one attached to each of the two hypotheses, reflecting how probable we consider different values of $\delta$ to be. For the null hypothesis we select a 'point prior' with its total mass at 0. For the alternative we select a Cauchy prior with scale equal to .707. We will quickly plot these two distributions before going any further.

In [74]:
# set some colors for plotting, associated with each hypothesis
NULL_COLOR = [0,0,1]
ALT_COLOR = [0,1,0]

def evaluate_prior(delt,type='point'):
    """ Evaluates the prior distribution for the given value of delta (delt)
    """
    if type=='point':
        y = np.zeros_like(delt)
        y[np.isclose(delt,0.)] = 1. # put all the mass at zero (the height of 1 is arbitrary, for plotting)
        return y
    elif type == 'cauchy':
        return scpst.cauchy.pdf(delt,loc=0,scale=np.sqrt(2)/2)

# values of delta to plot
delts = np.linspace(-5,5,101)

# evaluate each prior for the specified values of delta
y_point = evaluate_prior(delts,'point')
y_cauch = evaluate_prior(delts,'cauchy')

# set up plots
f, axs = plt.subplots(1,2,sharex=True, sharey=True)

# plot point prior in the first axis
axs[0].plot(delts,y_point,c=NULL_COLOR)
axs[0].set_xlabel(r'Population Effect Size ($\delta$)')
axs[0].set_title(r'Point Prior ($H_{0}$)')
axs[0].set_ylabel('Probability\nDensity')

# plot Cauchy prior in the second axis
axs[1].plot(delts,y_cauch,c=ALT_COLOR)
axs[1].set_xlabel(r'Population Effect Size ($\delta$)')
axs[1].set_title('Cauchy Prior ($H_{A}$)')
plt.show()
[Figure: the point prior (H0) and the Cauchy prior (HA)]

The choice of a point prior with all its mass at zero is the only viable choice for the null hypothesis, because the null hypothesis specifies that the effect size is exactly zero. In contrast, the alternative hypothesis specifies only that $\delta$ is not zero. In the absence of particular prior knowledge, the Cauchy prior specified above has caught on as a good default choice for the Bayesian t-test. It has some neat mathematical properties, as discussed in this paper. One can also note, from casual inspection, that it attaches higher probability to smaller effect sizes, reflecting the general trend in the natural and social sciences towards smaller effect sizes. Specifically, with the specified scale $\sqrt{2}/2 \approx 0.707$, 50% of the distribution lies within $\pm 0.707$. While this varies by domain, effect sizes outside this range are generally considered quite large and occur relatively infrequently in practice. Further, the Cauchy distribution has fat tails and approaches zero slowly, acknowledging, in the absence of specific prior knowledge, that larger effect sizes remain possible.
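The 50% figure is easy to verify: for any Cauchy distribution, the interval of plus or minus one scale parameter around the centre contains exactly half of the probability mass (the quartiles of a Cauchy sit at $\pm$ the scale).

```python
import numpy as np
import scipy.stats as scpst

scale = np.sqrt(2) / 2  # the default scale, ~0.707

# probability mass of the Cauchy prior inside [-scale, +scale]
mass = scpst.cauchy.cdf(scale, loc=0, scale=scale) \
     - scpst.cauchy.cdf(-scale, loc=0, scale=scale)
print(mass)  # → 0.5
```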

Prior predictive distributions¶

Having modelled our expectations as to what values of the population effect size $\delta$ are plausible under each hypothesis in the form of two prior distributions, we can begin the simulation proper.

We sample 10 000 population effect sizes $\delta$ from each prior distribution. In the case of the point prior this is always 0. For each population effect size we draw samples from two independent populations, with sample sizes equal to our experimental Dutch and Flemish samples. These populations are simulated so that the population means are consistent with the population effect size. We then calculate the sample effect size, Cohen's $d$.

The resulting distributions are so-called prior predictive distributions and reflect the relative probability of different values of the sample effect size under each of the two hypotheses.

In [75]:
def sample_delta_from_prior(distr_type):
    """
    Randomly sample a value of the population effect size delta from one of the prior distributions
    """
    if distr_type == 'point':
        return 0 # always return 0
    if distr_type == 'cauchy':
        # draw a random sample from a cauchy distribution
        sample = scpst.cauchy.rvs(loc=0,scale=np.sqrt(2)/2,size=1)
        return sample

def sample_from_independent_pops(delta,n1,n2,pooled_var=1):
    """
    Draw two samples of sizes n1 and n2 from two populations, where the difference between the population means is consistent with the specified population effect size 'delta'. 'pooled_var' specifies the pooled variance
    """
    # set up population mean and variance consistent with the pop effect size
    mu2 = 0.
    mu1 = delta*np.sqrt(pooled_var)

    sd1 = np.sqrt(pooled_var)
    sd2 = np.sqrt(pooled_var)

    # draw samples
    sample1 = rng.normal(loc=mu1,scale=sd1,size=n1)
    sample2 = rng.normal(loc=mu2,scale=sd2,size=n2)
    return sample1, sample2


N_SAMPLES = 10000 # how many times to repeat the experiment
cohens_d_null = np.zeros(N_SAMPLES)
cohens_d_alternative = np.zeros(N_SAMPLES)
####### calculate d 10000 times under the null hypothesis
for i in range(N_SAMPLES):
    # sample population delta from prior distribution - this will always be zero for the 'point' prior
    delta = sample_delta_from_prior('point')
    # draw two samples from two populations consistent with this effect size - in the case of the null these are populations with identical means
    sim_a,sim_b = sample_from_independent_pops(delta,n_d,n_f)
    # compute the observed sample d
    cohens_d_null[i] = cohens_d(sim_a,sim_b,correction=True)
####### calculate d 10000 times under the alternative hypothesis
for i in range(N_SAMPLES):
    # sample population delta randomly from Cauchy prior
    delta = sample_delta_from_prior('cauchy')
    # draw two samples from two populations consistent with this effect size
    sim_a,sim_b = sample_from_independent_pops(delta,n_d,n_f)
     # compute the observed sample d
    cohens_d_alternative[i] = cohens_d(sim_a,sim_b,correction=True)

# plot the distributions of sampled values of d
f, axs2 = plt.subplots(1,2,sharex=True,sharey=True)
null_h,null_b,_,=axs2[0].hist(cohens_d_null,bins = np.linspace(-3,3,60),color=NULL_COLOR,alpha=0.5,density=True)
axs2[0].set_xlabel(r"Sample Effect Size (Cohen's $d$)")
axs2[0].set_title(r'Prior Predictive ($H_{0}$)')
alt_h,alt_b,_=axs2[1].hist(cohens_d_alternative,bins = np.linspace(-5,5,60),color=ALT_COLOR,alpha=0.5,density=True)
axs2[1].set_xlabel(r"Sample Effect Size (Cohen's $d$)")
axs2[1].set_title('Prior Predictive ($H_{A}$)')
axs2[0].set_ylabel('Probability\nDensity')

plt.xlim([-5,5])
plt.show()
[Figure: prior predictive distributions of Cohen's d under H0 and HA]

The probability of a given value of Cohen's $d$ under the null hypothesis, $P(data | H_{0})$, is approximated by the height of the bar in the left panel that is closest to that value. Its probability under the alternative hypothesis, $P(data | H_{A})$, is the height of the corresponding bar in the right panel. The Bayes' factor is then the ratio of these two values.

For example, for the Cohen's $d$ we actually observed in our experiment...

In [76]:
def get_bf_from_histogram(observed_d,height_null,null_bins,height_alt,alt_bins):
    """
    Get approximate Bayes' factor for the observed value of Cohen's d from the heights of the two prior predictive histograms.
    """

    # convert bin edges to bin centers
    def bin_edges_to_centers(edges):
        bw = edges[1]-edges[0]
        return edges[:-1] + bw /2

    null_bins = bin_edges_to_centers(null_bins)
    alt_bins = bin_edges_to_centers(alt_bins)

    # get the height of the bin whose center is nearest to the observed d for the null prior predictive distribution
    i = np.argmin(np.abs(null_bins-observed_d))
    pr_0 = height_null[i]

     # get the height of the bin whose center is nearest to the observed d for the alternative prior predictive distribution
    j = np.argmin(np.abs(alt_bins-observed_d))
    pr_a = height_alt[j]
    return pr_a /pr_0, pr_a, pr_0

def print_result(bf_a0):
    """Print a message describing the given Bayes' Factor """
    if bf_a0<1.:
        supported_hyp = 'Null'
        unsupported_hyp = 'Alternative'
        fact = 1/bf_a0
    if bf_a0>1.:
        supported_hyp = 'Alternative'
        unsupported_hyp = 'Null'
        fact = bf_a0
    print('BF = '+ '%.3f'%bf_a0)
    print('Observed d is '+ '%.3f'%fact +' times more likely given the '+
          supported_hyp+' hypothesis than the '+ unsupported_hyp)

# get approximate probabilities and the BF from the histograms
bf_hist_approx,pr_a,pr_0  = get_bf_from_histogram(obs_d,null_h,null_b,alt_h,alt_b)

# plot the two histograms overlayed with indications of the selected bins
plt.hist(cohens_d_null,bins = np.linspace(-3,3,60),color=NULL_COLOR,alpha=0.5,density=True)
plt.xlabel(r"Sample Effect Size (Cohen's $d$)")
plt.ylabel('Probability\nDensity')
plt.hist(cohens_d_alternative,bins = np.linspace(-5,5,60),color=ALT_COLOR,alpha=0.5,density=True)
plt.xlim([-5,5])

# add a vertical line at the observed Cohen's d
plt.axvline(x=obs_d,label=r"Cohen's $d$ = "+'%.2f'%obs_d)
# add a horizontal line at the height of pr_a
pr0_lh=plt.axhline(y=pr_0,color=NULL_COLOR,label=r'$P(data | H_{0}) \sim $'+('%.3f'%pr_0)[1:])
pra_lh = plt.axhline(y=pr_a,color=ALT_COLOR,label=r'$P(data | H_{A}) \sim $'+('%.3f'%pr_a)[1:])

plt.legend()
plt.show()
print('BF (Histogram Approximation)')
print_result(bf_hist_approx)
[Figure: the two prior predictive histograms with the observed d and the two bin heights marked]
BF (Histogram Approximation)
BF = 0.490
Observed d is 2.043 times more likely given the Null hypothesis than the Alternative

We can see that our observed $d$ is about twice as likely under the null hypothesis. So the data, as they stand, favour the conclusion of no difference in height between the Dutch and the Flemish Belgians. But not by much. In fact, in practice one would not conclude in favour of either hypothesis with a Bayes' factor of this size. In this case one can only conclude, firmly, that the data, as they are, are inconclusive.