import numpy as np
from matplotlib import pyplot as plt
from matplotlib import transforms as trans
from scipy import special
plt.style.use('ggplot')


%matplotlib inline


# Simulate two successive coin tosses: a uniform draw on [0, 1) rounded
# to the nearest integer gives 0.0 or 1.0. `x` keeps the latest toss.
for _toss in range(2):  # first toss, then second toss
    x = np.random.rand(1).round()
    print(x)

[1.]
[1.]


# Simulate 10 coin tosses in one vectorised draw: each uniform sample on
# [0, 1) is rounded to 0.0 or 1.0.
x = np.random.rand(10).round()
print(x)

[0. 1. 1. 1. 0. 0. 0. 1. 0. 1.]


# Estimate the probability mass function of a coin from 1000 simulated
# tosses (uniform draws rounded to 0.0 or 1.0).
x = np.round(np.random.rand(1000))
# Let us take a long, direct approach: count each outcome explicitly and
# divide by the number of tosses to get relative frequencies.
count_0 = np.count_nonzero(x == 0)
count_1 = np.count_nonzero(x == 1)
px_0 = count_0 / len(x)
px_1 = count_1 / len(x)
# Plot the estimated PMF as a stem graph.
# `use_line_collection` is deliberately not passed: it has been the default
# behaviour since Matplotlib 3.3 and the keyword was removed in 3.8, where
# passing it raises a TypeError.
plt.stem([0, 1], [px_0, px_1])
plt.title('Probability Distribution')
plt.xlabel(r'$x$')
plt.ylabel(r'$P(x)$')
plt.axis([-0.1, 1.1, 0, 1])
plt.show()


# Empirical cumulative distribution of the tosses: a normalised, cumulative
# histogram drawn as a step outline. Each bin shows the fraction of samples
# up to and including that bin, hence the "less than or equal" label.
plt.hist(x, 6, density=True, cumulative=True, histtype='step')
plt.title('Cumulative Distribution')
plt.xlabel(r'$i$')
plt.ylabel(r'$P(x \leq i)$')
plt.show()
# There is a small mistake in the appearance of the distribution, of course.
# NOTE(review): presumably this refers to how the step outline is rendered
# for a discrete variable -- confirm against the displayed figure.


# Draw a small sample of integers from the discrete uniform distribution
# on {0, ..., 6}; the upper bound 7 passed to randint is exclusive.
n = 10
x = np.random.randint(low=0, high=7, size=n)
print(x)

[3 6 1 6 0 3 6 5 6 6]


# Estimate the PMF of the discrete uniform variable on {0, ..., 6} from
# 1000 draws.
n = 1000
x = np.random.randint(0, 7, (n))
# Let us take a long, direct approach: the relative frequency of each
# outcome i is the number of samples equal to i divided by n.
px_i = [np.count_nonzero(x == i) / n for i in range(7)]

# `use_line_collection` is deliberately not passed: it has been the default
# behaviour since Matplotlib 3.3 and the keyword was removed in 3.8, where
# passing it raises a TypeError.
plt.stem([0, 1, 2, 3, 4, 5, 6], px_i)
plt.title('Probability Distribution')
plt.xlabel(r'$x$')
plt.ylabel(r'$P(x)$')
plt.axis([-0.1, 6.1, 0, 1])
plt.show()


# Empirical cumulative distribution of the integer samples: a normalised,
# cumulative histogram with 7 bins drawn as a step outline. Each bin shows
# the fraction of samples up to and including that bin, hence the
# "less than or equal" label.
plt.hist(x, 7, density=True, cumulative=True, histtype='step')
plt.title('Cumulative Distribution')
plt.xlabel(r'$i$')
plt.ylabel(r'$P(x \leq i)$')
plt.show()


# Binomial PMF  P(K = k) = C(n, k) * p**k * q**(n - k)  with q = 1 - p,
# evaluated for k = 0..n and three success probabilities. The three results
# are kept in separately named arrays so the later cells stay readable.
n = 30
k = np.arange(0, n + 1)
p = np.array([0.25, 0.5, 0.75])
q = 1 - p
nCk = special.comb(n, k)  # binomial coefficients C(n, k) for every k


def _binomial_pmf(success, failure):
    """Return C(n, k) * success**k * failure**(n - k) for every k."""
    # The power terms are multiplied together first and the coefficient is
    # applied last, so the floating-point evaluation order stays fixed.
    return nCk * (success**k * failure**(n - k))


prob0 = _binomial_pmf(p[0], q[0])  # p = 0.25
prob1 = _binomial_pmf(p[1], q[1])  # p = 0.5
prob2 = _binomial_pmf(p[2], q[2])  # p = 0.75


# Overlay the three binomial PMFs on one axes: a marker at every integer k,
# then a dashed guide line through the same points carrying the legend label.
fig, ax = plt.subplots()
for pmf in (prob0, prob1, prob2):
    ax.scatter(k, pmf)
for curve_label, pmf in (('p=0.25', prob0), ('p=0.5', prob1), ('p=0.75', prob2)):
    ax.plot(k, pmf, label=curve_label, linestyle='dashed')
ax.legend()
ax.set_xlabel('k')
ax.set_ylabel('p(k,n)')
ax.set_title('Binomial Distribution')
fig.tight_layout()


# Running sums of each PMF over k give the cumulative distributions.
y0, y1, y2 = (pmf.cumsum() for pmf in (prob0, prob1, prob2))


# Overlay the three cumulative distributions on one axes: a marker at every
# integer k, then a dashed guide line through the same points carrying the
# legend label.
fig, ax = plt.subplots()
for cdf in (y0, y1, y2):
    ax.scatter(k, cdf)
for curve_label, cdf in (('p=0.25', y0), ('p=0.5', y1), ('p=0.75', y2)):
    ax.plot(k, cdf, label=curve_label, linestyle='dashed')
ax.legend()
ax.set_xlabel('k')
ax.set_ylabel(r'$p(x \leq k)$')
ax.set_title('Cumulative Distribution')
fig.tight_layout()


# Observed data: 100 standard-normal samples as a flat vector.
x = np.random.randn(100)
# Reference curve: the standard-normal density evaluated on an even grid
# over [-3, 3].
x_org = np.linspace(-3, 3, 100)
p_x = (1 / np.sqrt(2 * np.pi)) * np.exp(-0.5 * x_org**2)  # original distribution
# Let us presume that we don't know about the distribution of x


# One row of three grid cells: the left cell holds the density estimate,
# the two right cells are merged into a wide panel for the raw samples.
gridsize = (1, 3)
fig = plt.figure(figsize=(14, 4))
ax1 = plt.subplot2grid(gridsize, (0, 1), colspan=2, rowspan=1)
ax2 = plt.subplot2grid(gridsize, (0, 0), colspan=1, rowspan=1)

# Wide panel: the observed values in sampling order.
ax1.plot(x)
ax1.set_xlabel('Sample Number')
ax1.set_ylabel('Range of RV,x')

# Left panel: normalised 10-bin histogram of the samples against the
# reference density.
ax2.hist(x, bins=10, density=True, histtype='step',
         orientation='vertical', label='Estimate')
ax2.plot(x_org, p_x, label='Original')
ax2.legend()
ax2.set_xlabel('Range of RV,x')
ax2.set_ylabel(r'$p(x)$')

plt.show()


# Observed data: 100 standard-normal samples shifted by +1, as a flat vector.
x = np.random.randn(100) + 1
# Reference curve: unit-variance normal density centred on the mean 1,
# evaluated on an even grid over [-3, 3].
x_org = np.linspace(-3, 3, 100)
p_x = (1 / np.sqrt(2 * np.pi)) * np.exp(-0.5 * (x_org - 1)**2)

# Plotting: one row of three grid cells; the left cell holds the density
# estimate, the two right cells are merged into a wide panel for the samples.
gridsize = (1, 3)
fig = plt.figure(figsize=(14, 4))
ax1 = plt.subplot2grid(gridsize, (0, 1), colspan=2, rowspan=1)
ax2 = plt.subplot2grid(gridsize, (0, 0), colspan=1, rowspan=1)

# Wide panel: the observed values in sampling order.
ax1.plot(x)
ax1.set_xlabel('Sample Number')
ax1.set_ylabel('Range of RV,x')

# Left panel: normalised 10-bin histogram of the samples against the
# reference density.
ax2.hist(x, bins=10, density=True, histtype='step',
         orientation='vertical', label='Estimate')
ax2.plot(x_org, p_x, label='Original')
ax2.legend()
ax2.set_xlabel('Range of RV,x')
ax2.set_ylabel(r'$p(x)$')

plt.show()


from mpl_toolkits.mplot3d import Axes3D # To render 3D


# Two separately drawn standard-normal samples of 200 values each, kept as
# (1, 200) row vectors; row 0 is pulled out for the histograms below.
x1 = np.random.randn(1, 200)
x2 = np.random.randn(1, 200)

# 4x4 grid split into 2x2 quadrants: joint scatter bottom-left, marginal of
# x1 top-left, marginal of x2 bottom-right.
gridsize = (4, 4)
fig = plt.figure(figsize=(10, 10))
ax1 = plt.subplot2grid(gridsize, (2, 2), colspan=2, rowspan=2)
ax2 = plt.subplot2grid(gridsize, (0, 0), colspan=2, rowspan=2)
ax3 = plt.subplot2grid(gridsize, (2, 0), colspan=2, rowspan=2)

# Joint scatter of the two variables.
ax3.scatter(x1, x2)
ax3.set_xlabel('x1')
ax3.set_ylabel('x2')

# Marginal of x2, drawn sideways; its y axis is hidden.
ax1.hist(x2[0], bins=20, density=True, orientation='horizontal')
ax1.set_title('Distribution of x2')
ax1.yaxis.set_visible(False)

# Marginal of x1; its x axis is hidden.
ax2.hist(x1[0], bins=20, density=True)
ax2.set_title('Distribution of x1')
ax2.xaxis.set_visible(False)

plt.show()


# Two separately drawn standard-normal samples of 20000 values each, kept
# as (1, 20000) row vectors.
x1 = np.random.randn(1, 20000)
x2 = np.random.randn(1, 20000)

# 2-D histogram with 15 bins per axis. The ggplot style switches the axes
# grid on, and letting hist2d remove it implicitly raises a
# MatplotlibDeprecationWarning, so the grid is switched off explicitly first.
plt.grid(False)
h, x_edges, y_edges, _ = plt.hist2d(x1[0], x2[0], 15)

# Evaluate the surface at the bin centres (midpoints of consecutive edges)
# rather than at the left bin edges.
x_centers = 0.5 * (x_edges[:-1] + x_edges[1:])
y_centers = 0.5 * (y_edges[:-1] + y_edges[1:])
x, y = np.meshgrid(x_centers, y_centers)

fig = plt.figure(figsize=(8, 6))
ax = fig.add_subplot(111, projection='3d')
# hist2d indexes h as [x bin, y bin] while the meshgrid arrays are indexed
# [y, x], so h is transposed to line the counts up with their coordinates.
# Dividing by the total count turns counts into the fraction of samples
# falling in each bin.
ax.plot_surface(x, y, h.T / h.sum())
ax.set_xlabel('x1')
ax.set_ylabel('x2')
ax.set_zlabel('P(x1,x2)')
plt.show()

C:\Users\Hp\AppData\Local\Temp\ipykernel_15240\3229337596.py:1: MatplotlibDeprecationWarning: Auto-removal of grids by pcolor() and pcolormesh() is deprecated since 3.5 and will be removed two minor releases later; please call grid(False) first.
  h,x,y,_=plt.hist2d(x1[0],x2[0],15)


# x2 and x3 are built from x1 plus fresh unit-variance noise, giving a
# positive and a negative linear dependence on x1 respectively.
x1 = np.random.normal(0, 1, 1000)
x2 = 0.7*x1 + np.random.normal(0, 1, 1000)
Cx1x2 = np.cov(np.array([x1, x2]), rowvar=True)  # 2x2 sample covariance of (x1, x2)
x3 = -0.7*x1 + np.random.normal(0, 1, 1000)
Cx1x3 = np.cov(np.array([x1, x3]), rowvar=True)  # 2x2 sample covariance of (x1, x3)

# Plotting: one scatter per pair. Each title reports the off-diagonal entry
# of the sample covariance computed above, so it always matches the data
# actually drawn (by construction the covariance is +/-0.7 * var(x1)).
fig, [ax0, ax1] = plt.subplots(1, 2, figsize=(10, 5))
ax0.scatter(x1, x2)
ax0.set_xlabel('x1')
ax0.set_ylabel('x2')
ax0.set_title(r'$\sigma_{12}=%.2f$' % Cx1x2[0, 1])
ax1.scatter(x1, x3)
ax1.set_xlabel('x1')
ax1.set_ylabel('x3')
ax1.set_title(r'$\sigma_{13}=%.2f$' % Cx1x3[0, 1])
plt.show()


from matplotlib.patches import Ellipse
import matplotlib.transforms as transforms


def confidence_ellipse(x, y, ax, n_std=3.0, facecolor='none', **kwargs):
    """
    Create a plot of the covariance confidence ellipse of `x` and `y`.

    Parameters
    ----------
    x, y : array_like, shape (n, )
        Input data. Lists and tuples are accepted as well as arrays.

    ax : matplotlib.axes.Axes
        The axes object to draw the ellipse into.

    n_std : float
        The number of standard deviations to determine the ellipse's radii.

    facecolor : color
        Fill colour of the ellipse; 'none' draws the outline only.

    Returns
    -------
    matplotlib.patches.Ellipse

    Raises
    ------
    ValueError
        If `x` and `y` do not contain the same number of elements.

    Other parameters
    ----------------
    kwargs : `~matplotlib.patches.Patch` properties
    """
    # Convert up front so plain sequences work with `.size` below, as the
    # array_like contract promises.
    x = np.asarray(x)
    y = np.asarray(y)
    if x.size != y.size:
        raise ValueError("x and y must be the same size")

    cov = np.cov(x, y)
    pearson = cov[0, 1]/np.sqrt(cov[0, 0] * cov[1, 1])
    # Using a special case to obtain the eigenvalues of this
    # two-dimensional dataset: for unit-variance data the covariance matrix
    # is [[1, r], [r, 1]], whose eigenvalues are 1 + r and 1 - r along the
    # two diagonals.
    ell_radius_x = np.sqrt(1 + pearson)
    ell_radius_y = np.sqrt(1 - pearson)
    ellipse = Ellipse((0, 0),
        width=ell_radius_x * 2,
        height=ell_radius_y * 2,
        facecolor=facecolor,
        **kwargs)

    # Calculating the standard deviation of x from
    # the square root of the variance and multiplying
    # with the given number of standard deviations.
    scale_x = np.sqrt(cov[0, 0]) * n_std
    mean_x = np.mean(x)

    # Calculating the standard deviation of y in the same way.
    scale_y = np.sqrt(cov[1, 1]) * n_std
    mean_y = np.mean(y)

    # Rotate the normalised ellipse onto the diagonals, stretch it to the
    # data's scale, then move it to the data's mean.
    transf = transforms.Affine2D() \
        .rotate_deg(45) \
        .scale(scale_x, scale_y) \
        .translate(mean_x, mean_y)

    ellipse.set_transform(transf + ax.transData)
    return ax.add_patch(ellipse)


# Let us generate some data from the distribution: x2 and x3 are built from
# x1 plus fresh unit-variance noise, giving a positive and a negative linear
# dependence on x1 respectively.
x1 = np.random.normal(0, 1, 1000)
x2 = 0.7*x1 + np.random.normal(0, 1, 1000)
C12 = np.cov(np.array([x1, x2]), rowvar=True)  # 2x2 sample covariance of (x1, x2)
x3 = -0.7*x1 + np.random.normal(0, 1, 1000)
C13 = np.cov(np.array([x1, x3]), rowvar=True)  # 2x2 sample covariance of (x1, x3)


# One scatter per pair with its confidence ellipse (default n_std) outlined
# in red. Each title reports the off-diagonal entry of the sample covariance
# computed above, so it always matches the data actually drawn.
fig, [ax0, ax1] = plt.subplots(1, 2, figsize=(10, 5))
ax0.scatter(x1, x2)
confidence_ellipse(x1, x2, ax0, edgecolor='red')
ax0.set_xlabel('x1')
ax0.set_ylabel('x2')
ax0.set_title(r'$\sigma_{12}=%.2f$' % C12[0, 1])
ax1.scatter(x1, x3)
confidence_ellipse(x1, x3, ax1, edgecolor='red')
ax1.set_xlabel('x1')
ax1.set_ylabel('x3')
ax1.set_title(r'$\sigma_{13}=%.2f$' % C13[0, 1])
plt.show()

Distribution of Random Variables

Joint PDF