import math
import matplotlib.pyplot as plt
import numpy as np
import scipy
import scipy.stats

# Ground-truth parameters of the normal distribution the sample is drawn from.
TRUE_MEAN = 40
TRUE_STD = 10
# 1000 observations; the estimators below are checked against these two values.
X = np.random.normal(loc=TRUE_MEAN, scale=TRUE_STD, size=1000)

def normal_mu_MLE(X):
    """Return the estimate of the normal mean: the average of the observations.

    X must support ``len()`` and iteration (for example a list or a 1-D
    NumPy array). The result is ``(1 / T) * sum(X)`` with ``T = len(X)``.
    """
    # Reciprocal of the number of observations.
    weight = 1.0 / len(X)
    return weight * sum(X)

def normal_sigma_MLE(X):
    """Return the estimate of the normal standard deviation.

    Computes ``sqrt((1 / T) * sum((x - mu) ** 2))`` where ``T = len(X)`` and
    ``mu`` is the value returned by ``normal_mu_MLE``. The divisor is ``T``,
    not ``T - 1``.

    Parameters
    ----------
    X : sequence of numbers or 1-D numpy.ndarray
        The observations. The input is converted with ``np.asarray`` so that
        plain lists and tuples work as well as arrays (``list - float`` would
        otherwise raise ``TypeError``).

    Returns
    -------
    float
        The estimated standard deviation.
    """
    data = np.asarray(X, dtype=float)
    T = len(data)
    # Get the mu MLE
    mu = normal_mu_MLE(data)
    # Sum the square of the differences (vectorised instead of the builtin
    # sum, which would iterate the array element by element in Python).
    s = np.sum(np.power(data - mu, 2))
    # Compute sigma^2
    sigma_squared = 1.0 / T * s
    return math.sqrt(sigma_squared)

# Show each hand-written estimator next to its NumPy counterpart, one value
# per line, so the two can be compared directly.
print("Mean Estimation", normal_mu_MLE(X), np.mean(X), sep="\n")
print("Standard Deviation Estimation", normal_sigma_MLE(X), np.std(X), sep="\n")

Mean Estimation
39.97339283238262
39.97339283238264
Standard Deviation Estimation
10.110058391084257
10.110058391084253

# Let scipy fit the normal distribution; the two values are used further
# down as the loc and scale of the fitted PDF.
mu, std = scipy.stats.norm.fit(X)
# print() already converts its arguments with str().
print("mu estimate:", mu)
print("std estimate:", std)

mu estimate: 39.97339283238264
std estimate: 10.110058391084253

pdf = scipy.stats.norm.pdf
# We would like to plot our data along an x-axis ranging from 0-80 with 80 intervals
# (increments of 1). linspace includes both endpoints, so 80 unit-wide
# intervals need 81 points.
x = np.linspace(0, 80, 81)
# density takes a boolean; the string 'true' only worked because any
# non-empty string is truthy.
plt.hist(X, bins=x, density=True, label='Observed Data')
# Pass x explicitly so the curve is drawn at the grid values instead of at
# the array indices 0..N-1.
plt.plot(x, pdf(x, loc=mu, scale=std), label='Fitted Distribution PDF')
plt.xlabel('Value')
plt.ylabel('Observed Frequency')
# Labels are attached to the artists themselves, so the legend does not
# depend on the order in which matplotlib enumerates them.
plt.legend();

TRUE_LAMBDA = 5
# NOTE(review): the first argument of np.random.exponential is the scale of
# the distribution (its mean), so TRUE_LAMBDA is used as the scale here --
# confirm this is the intended parameterisation.
X = np.random.exponential(scale=TRUE_LAMBDA, size=1000)

def exp_lamda_MLE(X):
    """Return the average of the observations in X.

    This file uses that average as the parameter estimate for the
    exponential sample. X must support ``len()`` and iteration.
    """
    count = len(X)
    return sum(X) / count

# print() converts the estimate with str() itself.
print("lambda estimate:", exp_lamda_MLE(X))

lambda estimate: 5.19533144751805

# The scipy version of the exponential distribution has a location parameter
# that shifts the distribution. We ignore this by fixing the location
# parameter to 0 with floc=0; the second value returned is the fitted scale.
_, l = scipy.stats.expon.fit(X, floc=0)

pdf = scipy.stats.expon.pdf
# Integer grid 0..79, used both as histogram bin edges and as the points at
# which the fitted PDF is evaluated.
x = range(0, 80)
# density takes a boolean; the string 'true' only worked because any
# non-empty string is truthy.
plt.hist(X, bins=x, density=True, label='Observed Data')
# Pass x explicitly rather than relying on the implicit 0..N-1 index axis.
plt.plot(x, pdf(x, scale=l), label='Fitted Distribution PDF')
plt.xlabel('Value')
plt.ylabel('Observed Frequency')
# Labels are attached to the artists themselves, so the legend does not
# depend on the order in which matplotlib enumerates them.
plt.legend();

# Download the free data-fetching helper module (data.py) that is imported below
!curl -fsSLO https://raw.githubusercontent.com/algo-stocks/data/master/data.py

from data import get_prices

# Date window passed to get_prices below.
start = '2022-01-01'
end = '2025-01-01'

# Price history for the 'FPT' symbol over the window.
# NOTE(review): get_prices comes from the downloaded data.py and its return
# type is not visible here -- presumably a pandas Series/DataFrame of closing
# prices, since pct_change() is called on it. Confirm.
closes = get_prices('FPT', start_date=start, end_date=end)
# Change relative to the previous element; [1:] drops the first entry, which
# has no previous value to compare against (presumably NaN -- confirm).
returns = closes.pct_change()[1:]

# Fit a normal distribution to the returns and overlay its PDF on their
# histogram.
mu, std = scipy.stats.norm.fit(returns)
pdf = scipy.stats.norm.pdf
# 100 evenly spaced points on [-0.1, 0.1], used both as histogram bin edges
# and as the grid on which the fitted PDF is evaluated.
x = np.linspace(-.1, .1, num=100)
# density takes a boolean; the string 'true' only worked because any
# non-empty string is truthy.
h = plt.hist(returns, bins=x, density=True)
l = plt.plot(x, pdf(x, loc=mu, scale=std))

from statsmodels.stats.stattools import jarque_bera
# Jarque-Bera normality test on the returns. Per the statsmodels
# documentation the four values returned are the JB statistic, its p-value,
# the estimated skewness and the estimated kurtosis.
jarque_bera(returns)

(array([306.70352218]),
 array([2.51290672e-67]),
 array([0.10809672]),
 array([6.13164315]))

# Same test on 100 draws from a standard normal distribution, for comparison
# with the result obtained on the returns.
jarque_bera(np.random.normal(0, 1, 100))

(np.float64(0.2612005890317266),
 np.float64(0.8775684732297053),
 np.float64(0.049438133164470335),
 np.float64(3.2300252710561663))

Ước lượng Maximum Likelihood (MLEs)

Phân phối chuẩn

Phân phối mũ

MLE cho Lợi suất (returns) của Tài sản