The standard normal distribution is a special case of the normal distribution. For the standard normal distribution, the value of the mean is equal to zero ($\mu = 0$), and the value of the standard deviation is equal to 1 ($\sigma = 1$).
Thus, by plugging $\mu = 0$ and $\sigma = 1$ into the PDF of the normal distribution, the equation simplifies to
\begin{align} f(x)& = \frac{1}{\sigma \sqrt{2 \pi}}e^{-\frac{1}{2}\left(\frac{x-\mu}{\sigma}\right)^2} \\ & =\frac{1}{1 \times \sqrt{2 \pi}}e^{-\frac{1}{2}\left(\frac{x-0}{1}\right)^2} \\ & = \frac{1}{\sqrt{2\pi}}e^{-\frac{1}{2}x^2} \end{align}

A random variable that follows the standard normal distribution is denoted by $z$. Consequently, the units of the standard normal distribution curve are denoted by $z$ and are called $z$-values or $z$-scores. They are also called standard units or standard scores.
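As a quick numerical sanity check of this simplified density (a minimal sketch, assuming only that numpy and scipy are installed), we can evaluate $\frac{1}{\sqrt{2\pi}}e^{-\frac{1}{2}x^2}$ at $x = 0$ and compare it with the value returned by scipy.stats.norm.pdf():
# A minimal sanity check: evaluate the simplified standard normal PDF
# at x = 0 by hand and compare it with scipy's implementation.
import numpy as np
import scipy.stats as stats

x = 0
f_manual = np.exp(-0.5 * x**2) / np.sqrt(2 * np.pi)
f_scipy = stats.norm.pdf(x)  # defaults: loc=0 (mean), scale=1 (standard deviation)
print(f_manual, f_scipy)  # both are approximately 0.3989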
The cumulative distribution function (CDF) of the standard normal distribution, corresponding to the area under the curve over the interval $(-\infty, z]$ and usually denoted by the Greek letter $\phi$, is given by
$$\phi (z) = P(x \le z) = \frac{1}{\sqrt{2\pi}} \int_{-\infty}^{z}e^{-\frac{1}{2}x^2}dx,$$ where $e \approx 2.71828$ and $\pi \approx 3.14159$.
The standard normal curve is a special case of the normal distribution and thus itself a probability distribution curve. Therefore, the basic properties of the normal distribution hold for the standard normal curve as well (Weiss 2010).
# First, let's import all the needed libraries.
import numpy as np
import matplotlib.pyplot as plt
import scipy.stats as stats
mu = 0
sigma = 1
cut_a = -4
cut_b = 0.5
x = np.arange(-4, 4.01, 0.01)
yy = stats.norm.pdf(x, mu, sigma)
plt.figure(figsize=(10, 5))
plt.plot(x, yy, color="darkblue")
plt.title("The probability density function of the standard normal distribution")
plt.xticks(
[
mu - 3 * sigma,
mu - 2 * sigma,
mu - sigma,
mu,
0.5,
mu + sigma,
mu + 2 * sigma,
mu + 3 * sigma,
],
[-3, -2, -1, 0, "z", 1, 2, 3],
)
plt.fill_between(
x=x,
y1=yy,
where=(x <= 0.5),
color="red",
edgecolor="black",
alpha=0.75,
)
xpos = [-3, -2, -1, 0, 1, 2, 3]
ypos = [0.005, 0.05, 0.25, max(yy), 0.25, 0.05, 0.005]
for px, py in zip(xpos, ypos):
    plt.vlines(x=mu + px, ymin=0, ymax=py, color="blue", linestyle="--")
plt.text(
2.5, 0.3, "$f(x) = \\frac{1}{\\sqrt{2\\pi}}e^{-\\frac{1}{2} x^2}$", fontsize=16
)
plt.arrow(
2.2,
0.26,
-0.9,
-0.08,
length_includes_head=True,
head_width=0.02,
head_length=0.1,
color="black",
)
plt.arrow(
-2.2,
0.28,
1.3,
-0.1,
length_includes_head=True,
head_width=0.02,
head_length=0.1,
color="black",
)
plt.text(-2.5, 0.3, "$\\phi(z)$", fontsize=16)
plt.xlabel("z score")
plt.ylabel("f(x)")
plt.show()
The $z$-values on the right side of the mean are positive and those on the left side are negative. The $z$-value for a point on the horizontal axis gives the distance between the mean ($z=0$) and that point in terms of the standard deviation. For example, a point with a value of $z=2$ is two standard deviations to the right of the mean. Similarly, a point with a value of $z=-2$ is two standard deviations to the left of the mean.
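To make this explicit, the following minimal sketch computes the distance of the points $z = -2$ and $z = 2$ from the mean in units of the standard deviation:
# The z-score measures the distance of a point from the mean in units of
# the standard deviation: (x - mu) / sigma. For the standard normal
# distribution (mu = 0, sigma = 1) this distance equals the z-value itself.
mu = 0
sigma = 1
for point in [-2, 2]:
    print(point, "->", (point - mu) / sigma, "standard deviations from the mean")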
mu = 0
sigma = 1
cut_a = -4
cut_b = 0.5
x = np.arange(-4, 4.01, 0.01)
yy = stats.norm.cdf(x, mu, sigma)
plt.figure(figsize=(10, 5))
plt.plot(x, yy, color="darkblue")
plt.title(
"The cummulative probability density function\nof the standard normal distribution"
)
plt.xlabel("z score")
plt.ylabel("$\\phi(z)$")
plt.xticks(
[
mu - 3 * sigma,
mu - 2 * sigma,
mu - sigma,
mu,
0.5,
mu + sigma,
mu + 2 * sigma,
mu + 3 * sigma,
],
[-3, -2, -1, 0, "z", 1, 2, 3],
)
plt.fill_between(
x=x,
y1=yy,
where=(x <= 0.5),
color="red",
edgecolor="black",
alpha=0.75,
)
xpos = [-3, -2, -1, 0, 1, 2, 3]
ypos = [0.0001, 0.01, 0.15, 0.5, 0.83, 0.97, max(yy)]
for px, py in zip(xpos, ypos):
    plt.vlines(x=mu + px, ymin=0, ymax=py, color="blue", linestyle="--")
plt.arrow(
-1,
0.7,
1.2,
-0.3,
length_includes_head=True,
head_width=0.02,
head_length=0.1,
color="black",
)
plt.text(
-2,
0.8,
"$\\phi (z) = \\frac{1}{\\sqrt{2\\pi}} \\int_{-\\infty}^{z}e^{-\\frac{1}{2}x^2}dx$",
fontsize=16,
)
plt.show()
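As a quick numerical cross-check of the CDF definition, the shaded area in the figure above, i.e. $\phi(0.5)$, can also be obtained by integrating the density directly. This is a minimal sketch; scipy.integrate.quad is used here purely for illustration:
# A minimal sketch: approximate phi(0.5) by numerical integration of the
# standard normal PDF and compare it with scipy's cdf() implementation.
import numpy as np
import scipy.stats as stats
from scipy.integrate import quad

z = 0.5  # the same cut-off that is shaded in the figure above
area, _ = quad(lambda x: np.exp(-0.5 * x**2) / np.sqrt(2 * np.pi), -np.inf, z)
print(area, stats.norm.cdf(z))  # both are approximately 0.6915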
The concept of determining probabilities by calculating the area under the standard normal curve is extensively applied. That is why probability tables exist to look up the area for a particular $z$-value. However, Python is such a powerful tool that we can calculate the area under the curve for any particular $z$-score directly.
To calculate the area under the curve of a standard normal distribution we apply the `cdf()` method of the `norm` distribution object from the `scipy.stats` module. The `scipy.stats.norm.cdf()` function is defined as `cdf(x, loc=0, scale=1)`. The location (`loc`) keyword specifies the mean, while the `scale` keyword specifies the standard deviation. Further, we see that the defaults for the mean and the standard deviation are $0$ and $1$, respectively. Thus, the `cdf()` function, applied to the standard normal distribution, simplifies to `stats.norm.cdf(x)`. We calculate the area under the curve for $z = -3, -2, -1, 0, 1, 2, 3$, or written more formally:
stats.norm.cdf(-3)
stats.norm.cdf(-2)
## and so on...
0.022750131948179195
## ... or simplified in a loop:
z = [-3, -2, -1, 0, 1, 2, 3]
for i in z:
    print(i, "->", stats.norm.cdf(i))
-3 -> 0.0013498980316300933
-2 -> 0.022750131948179195
-1 -> 0.15865525393145707
0 -> 0.5
1 -> 0.8413447460685429
2 -> 0.9772498680518208
3 -> 0.9986501019683699
Perfect! We confirmed some of the above stated properties of a standard normal curve, as we calculated the area under the curve for the interval $(-\infty, z]$. Calling `stats.norm.cdf(-3)` yields a very low number: only about 0.135% of the total area under the curve is found to the left of $z=-3$, which corresponds to a distance of 3 standard deviations from the mean. Moreover, `stats.norm.cdf(0)` yields exactly $0.5$. Awesome! Thus, we conclude that the area under the curve for the interval $(-\infty, 0]$ is the same as the area under the curve for the interval $[0, \infty)$, and that the total area under the curve sums to $1$. Again, we confirmed one of the above stated properties of a standard normal curve. And finally, calling `stats.norm.cdf(3)` yields a high number close to 1: approximately 99.865% of the area under the curve lies in the interval $(-\infty, 3]$, leaving only very little area beyond $z = 3$.
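The observation that the two halves of the curve enclose equal areas reflects the symmetry of the standard normal distribution, $\phi(-z) = 1 - \phi(z)$. A minimal sketch of this relation (only scipy.stats is needed):
# Symmetry of the standard normal distribution: phi(-z) = 1 - phi(z)
import scipy.stats as stats

for z in [0.5, 1, 2, 3]:
    print(z, "->", stats.norm.cdf(-z), "=", 1 - stats.norm.cdf(z))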
Recall that we may explicitly calculate the area under the curve for any interval of interest:
\begin{align} P(a \le z \le b) & = \int_{a}^{b}f(z)dz \\ & = \int_{-\infty}^{b}f(z)dz - \int_{-\infty}^{a}f(z)dz \\ & = P(z \le b) - P(z \le a) \end{align}

Let us calculate the area under the curve for the following intervals: $[-1,1], [-2,2], [-3,3]$. Or in words, let us determine the area under the curve for $\pm 1$ standard deviation, for $\pm 2$ standard deviations, and for $\pm 3$ standard deviations.
# 1st standard deviation
stats.norm.cdf(1) - stats.norm.cdf(-1)
0.6826894921370859
# 2nd standard deviations
stats.norm.cdf(2) - stats.norm.cdf(-2)
0.9544997361036416
# 3rd standard deviation
stats.norm.cdf(3) - stats.norm.cdf(-3)
0.9973002039367398
Awesome, we just confirmed the Empirical Rule, also known as the 68-95-99.7 rule, which is related to Chebyshev's theorem. For a bell-shaped distribution the three rules state that approximately 68% of the observations lie within one standard deviation of the mean, approximately 95% lie within two standard deviations of the mean, and approximately 99.7% lie within three standard deviations of the mean.
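As a complementary, simulation-based check of the Empirical Rule, we can draw a random sample from the standard normal distribution and count the share of observations within one, two, and three standard deviations of the mean. This is a minimal sketch; the sample size and the seed are arbitrary choices:
# Empirical check of the 68-95-99.7 rule with a simulated standard normal sample.
import numpy as np

rng = np.random.default_rng(seed=10)
sample = rng.normal(loc=0, scale=1, size=100_000)

for k in [1, 2, 3]:
    share = np.mean(np.abs(sample) <= k)
    print(f"within {k} standard deviation(s): {share:.4f}")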
To strengthen our intuition, the Empirical Rule is visualized below.
mu = 0
sigma = 1
cut_a = -1
cut_b = 1
x = np.arange(-4, 4.01, 0.01)
yy = stats.norm.pdf(x, mu, sigma)
plt.figure(figsize=(10, 5))
plt.plot(x, yy, color="black")
plt.title("The area between the interval z = [-1,1]")
plt.yticks([])
plt.fill_between(
x=x,
y1=yy,
where=(x >= -1) & (x <= 1),
color="red",
alpha=0.75,
)
plt.text(
2.5,
0.3,
"$\\phi(z) =\\int_{-1}^{1}f(z)dz = P(z \\leq 1) - P(z \\leq -1)$",
fontsize=14,
)
plt.text(
-0.5,
0.15,
"$\\phi(z) \\approx 0.68$",
fontsize=14,
)
plt.axhline(-0.001, color="black")
plt.xlabel("z score")
plt.show()
mu = 0
sigma = 1
cut_a = -2
cut_b = 2
x = np.arange(-4, 4.01, 0.01)
yy = stats.norm.pdf(x, mu, sigma)
plt.figure(figsize=(10, 5))
plt.plot(x, yy, color="black")
plt.title("The area between the interval z = [-2,2]")
plt.yticks([])
plt.fill_between(
x=x,
y1=yy,
where=(x >= -2) & (x <= 2),
color="red",
alpha=0.75,
)
plt.text(
2.5,
0.3,
"$\\phi(z) =\\int_{-2}^{2}f(z)dz = P(z \\leq 2) - P(z \\leq -2)$",
fontsize=14,
)
plt.text(
-0.5,
0.15,
"$\\phi(z) \\approx 0.95$",
fontsize=14,
)
plt.axhline(-0.001, color="black")
plt.xlabel("z score")
plt.show()
mu = 0
sigma = 1
cut_a = -3
cut_b = 3
x = np.arange(-4, 4.01, 0.01)
yy = stats.norm.pdf(x, mu, sigma)
plt.figure(figsize=(10, 5))
plt.plot(x, yy, color="black")
plt.title("The area between the interval z = [-3,3]")
plt.yticks([])
plt.fill_between(
x=x,
y1=yy,
where=(x >= -3) & (x <= 3),
color="red",
alpha=0.75,
)
plt.text(
2.5,
0.3,
"$\\phi(z) =\\int_{-3}^{3}f(z)dz = P(z \\leq 3) - P(z \\leq -3)$",
fontsize=14,
)
plt.text(
-0.5,
0.15,
"$\\phi(z) \\approx 0.97$",
fontsize=14,
)
plt.axhline(-0.001, color="black")
plt.xlabel("z score")
plt.show()
Citation
The E-Learning project SOGA-Py was developed at the Department of Earth Sciences by Annette Rudolph, Joachim Krois and Kai Hartmann. You can reach us via e-mail at soga[at]zedat.fu-berlin.de.
Please cite as follows: Rudolph, A., Krois, J., Hartmann, K. (2023): Statistics and Geodata Analysis using Python (SOGA-Py). Department of Earth Sciences, Freie Universitaet Berlin.