Point estimates

We are trying to estimate a parameter of an unknown distribution that we sample from. In this problem we sample from the distribution $U(0,\theta)$. To give this a story: we play a game in which the amount of time we get to play is random, generated by a device set up to produce a uniform random variable on the interval $[0,\theta]$ for some value of $\theta$. How do we decide the value of $\theta$ from several observations?

A discrete version of this is the "German tank problem". https://en.wikipedia.org/wiki/German_tank_problem

In [3]:
from scipy import stats
from math import sqrt
import matplotlib.pyplot as plt
import numpy as np
import seaborn as sns

The next function generates $n$ numbers from the distribution $U(0,\theta)$. Here we know $\theta$; in practice it would be an unknown parameter!

In [4]:
def sampleU(n, theta):
    """
        Returns a sample of n independent values from U(0,theta).
    """
    return stats.uniform.rvs(loc=0,scale=theta,size=n)
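
A quick sanity check (an illustrative call, not part of the original notebook run): every generated value should lie in $[0, 130]$.

x = sampleU(1000, 130)
print(x.min(), x.max())   # both inside [0, 130]; the maximum is typically close to 130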

We present a few variants of the estimate.

The first one is obtained by the method of moments, the second by maximum likelihood.

(Can you find a better one? The best possible solution has not been discovered yet.)
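
A quick sketch of where these two estimates come from (standard calculations for $U(0,\theta)$). Method of moments: $E[X] = \theta/2$, so matching the first moment with the sample mean $\bar x$ gives $\hat\theta = 2\bar x$. Maximum likelihood: the likelihood of a sample $x_1,\dots,x_n$ equals $\theta^{-n}$ whenever $\theta \ge \max_i x_i$ and $0$ otherwise, so it is maximized by the smallest admissible value, $\hat\theta = \max_i x_i$.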

In [5]:
def my_estimate(x):
    # method of moments: E[X] = theta/2, so theta_hat = 2 * (sample mean)
    return 2*x.mean()
In [5]:
def my_estimate2(x):
    # maximum likelihood: theta_hat = sample maximum
    return x.max()
In [6]:
def my_estimate3(x):
    # bias-corrected maximum: theta_hat = (n+1)/n * sample maximum
    n = len(x)
    return x.max()*(n+1)/n

Now: how to test which estimate is better?

We compute the bias and the mean squared error.

Observe the results and think about what they mean.

Note the difference between two numbers: $n$ is the size of the sample from which the statistician computes the estimate $\hat\theta$. OTOH, num is the number of times we repeat the whole experiment, in order to check how good the estimates are.

That is, we use num to approximate the true expectation (over repeated experiments), while $n$ is what allows us to compute, e.g., the sample mean within one experiment.
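
To recall the definitions (with the expectation taken over the random sample), $\mathrm{bias}(\hat\theta) = E[\hat\theta] - \theta$ and $\mathrm{MSE}(\hat\theta) = E[(\hat\theta - \theta)^2]$. In the code below both expectations are approximated by averaging over the num repetitions.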

In [6]:
def test_my_method(theta, sample_method, estimate_method, n=5, num=10**4, image=True, eps=0.1):
    """Repeat the experiment num times with samples of size n and report bias, MSE and error probability."""
    if theta is None: theta = 130
    L = []
    D = []                              # raw samples (kept for inspection, not used below)
    for _ in range(num):
        data = sample_method(n,theta)   # one experiment -- perform n measurements
        D.append(data)
        L.append(estimate_method(data))

    estimates = np.array(L)   # the estimates (theta hat), one per repetition
    MSE = np.mean((estimates-theta)**2)
    bias = estimates.mean()-theta
    p = np.mean(abs(estimates-theta)>eps)
    
    print(f"Mean: {estimates.mean():.3f}")
    print(f"Bias: {bias:.3f}")

    print(f"Mean squared error: {MSE:.3f}")
    print(f"Var+Bias^2: {estimates.var()+bias**2:.3f}, ")    
    print(f"P(error > {eps}) = {p}")
    
    if image:
        sns.set_style('whitegrid')
        sns.histplot(estimates)

Testing one of the methods.

We can see that $\mathrm{MSE} = \mathrm{Var} + \mathrm{Bias}^2$.
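
This is not a coincidence: expanding the square gives the standard decomposition
$$E[(\hat\theta-\theta)^2] = \mathrm{Var}(\hat\theta) + \bigl(E[\hat\theta]-\theta\bigr)^2,$$
because the cross term $2\,E[\hat\theta - E[\hat\theta]]\,(E[\hat\theta]-\theta)$ vanishes. In the output below the equality holds exactly, since the empirical MSE, variance (np.var with its default ddof=0) and bias are all computed from the same array of estimates.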

In [8]:
test_my_method(130, sampleU, my_estimate, n=100, num=10000, eps=5, image=True)
Mean: 129.975
Bias: -0.025
Mean squared error: 54.634
Var+Bias^2: 54.634, 
P(error > 5) = 0.5014
[Figure: histogram of the estimates]

Here we can see that with increasing $n$ the probability of an error larger than $10$ decreases (rather fast). (The method is consistent.)

Also the MSE decreases.

OTOH, the bias is small already for $n=5$ -- the method is unbiased.
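
A quick sanity check of the numbers below, using a standard computation for $U(0,\theta)$: since $\mathrm{Var}(X) = \theta^2/12$, the moment estimate $2\bar X$ is unbiased with $\mathrm{Var}(2\bar X) = \theta^2/(3n)$, so for $\theta = 130$ the predicted MSE is roughly $1127$, $113$ and $11.3$ for $n = 5, 50, 500$, in line with the simulation.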

In [11]:
test_my_method(130, sampleU, my_estimate, n=5, num=10**4, image=False, eps=10); print()
test_my_method(130, sampleU, my_estimate, n=50, num=10**4, image=False, eps=10); print()
test_my_method(130, sampleU, my_estimate, n=500, num=10**4, image=False, eps=10)
Mean: 130.374
Bias: 0.374
Mean squared error: 1096.876
Var+Bias^2: 1096.876, 
P(error > 10) = 0.7685

Mean: 130.030
Bias: 0.030
Mean squared error: 111.129
Var+Bias^2: 111.129, 
P(error > 10) = 0.3485

Mean: 130.010
Bias: 0.010
Mean squared error: 10.929
Var+Bias^2: 10.929, 
P(error > 10) = 0.0013

This method is not unbiased.

In fact, the histogram of $\hat\theta$ shows that we always undershoot the true value of $\theta$.
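
Indeed, a standard computation for $n$ independent samples from $U(0,\theta)$ gives $E[\max_i X_i] = \frac{n}{n+1}\theta$, i.e. a bias of $-\theta/(n+1)$; for $n = 100$ and $\theta = 130$ this predicts about $-1.29$, consistent with the output below.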

In [237]:
test_my_method(130, sampleU, my_estimate2, n=100, num=10000, eps=5)
Mean: 128.721
Bias: -1.279
Mean squared error: 3.296
Var+Bias^2: 3.296, 
P(error > 5) = 0.0204
[Figure: histogram of the estimates]

Third method. Note that this one is apparently unbiased; we sometimes overshoot and sometimes undershoot.

The MSE is much smaller than for the other methods.
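
Again a standard computation: $\mathrm{Var}(\max_i X_i) = \frac{n\theta^2}{(n+1)^2(n+2)}$, so rescaling by $(n+1)/n$ yields an unbiased estimator with $\mathrm{MSE} = \mathrm{Var} = \frac{\theta^2}{n(n+2)}$, which is about $1.66$ for $n = 100$ and $\theta = 130$, matching the simulation below.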

In [238]:
test_my_method(130, sampleU, my_estimate3, n=100, num=10000, eps=5)
Mean: 130.011
Bias: 0.011
Mean squared error: 1.673
Var+Bias^2: 1.673, 
P(error > 5) = 0.0076
[Figure: histogram of the estimates]
In [13]:
def sampleGeom(n, secretp):
    """
        Returns a sample of n independent values from Geom(secretp).
    """
    return stats.geom.rvs(secretp,size=n)
In [12]:
def sampleExp(n, secretp):
    """
        Returns a sample of n independent values from the exponential
        distribution with mean secretp (i.e. scale=secretp, rate 1/secretp).
    """
    return stats.expon.rvs(scale=secretp,size=n)
In [38]:
a = sampleExp(10000,3)
In [39]:
a.mean()
Out[39]:
2.975340338068114
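
As expected: with scale=secretp the exponential distribution has mean secretp, so by the law of large numbers the average of $10^4$ values is close to $3$.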
In [17]:
def my_estimate4(x):
    # for Geom(p): E[X] = 1/p, so the moment estimate is p_hat = 1/(sample mean)
    return 1/x.mean()
In [18]:
def my_estimate5(x):
    # for Exp with mean theta: E[X] = theta, so theta_hat = sample mean
    return x.mean()
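
These follow the same moment-method idea: scipy's geometric distribution Geom(p) has $E[X] = 1/p$, so $\hat p = 1/\bar x$, and the exponential distribution parameterized by its mean $\theta$ (as in sampleExp above) has $E[X] = \theta$, so $\hat\theta = \bar x$.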
In [19]:
test_my_method(1/6, sampleGeom, my_estimate4, n=50, num=10000, eps=0.05)
Mean: 0.170
Bias: 0.003
Mean squared error: 0.000
Var+Bias^2: 0.000, 
P(error > 0.05) = 0.0279
[Figure: histogram of the estimates]
In [20]:
test_my_method(1/6, sampleGeom, my_estimate4, n=50, num=10000, eps=0.05)
Mean: 0.169
Bias: 0.003
Mean squared error: 0.000
Var+Bias^2: 0.000, 
P(error > 0.05) = 0.0277
[Figure: histogram of the estimates]
In [22]:
test_my_method(3, sampleExp, my_estimate5, n=5, num=10**5, eps=0.5)
Mean: 3.000
Bias: 0.000
Mean squared error: 1.795
Var+Bias^2: 1.795, 
P(error > 0.5) = 0.71342
[Figure: histogram of the estimates]