import numpy as np
import math

def ols_grad_descent(x, y, epochs, initial_beta1=0, initial_beta0=1, eta=0.1):
    """Fit ``y ~ beta1 * x + beta0`` with a fixed number of gradient steps.

    Every iteration uses the full data set. The recorded loss is the mean
    squared error, while the gradients are those of *half* the mean squared
    error (there is no factor of 2), so ``eta`` acts as the step size on
    ``MSE / 2``.

    Args:
        x: Predictor values; any array-like accepted by ``np.asarray``.
        y: Response values; must have the same shape as ``x``.
        epochs: Number of gradient-descent updates to perform.
        initial_beta1: Starting value for the slope.
        initial_beta0: Starting value for the intercept.
        eta: Learning rate (step size).

    Returns:
        A tuple ``(beta1, beta0, losses)`` where ``losses[i]`` is the mean
        squared error measured *before* update ``i`` is applied.

    Raises:
        ValueError: If ``x`` and ``y`` do not have the same shape.
    """
    # Accept lists/tuples as well as arrays; the arithmetic below needs
    # element-wise semantics and ``.shape``.
    x = np.asarray(x)
    y = np.asarray(y)
    if x.shape != y.shape:
        # Mismatched shapes such as (n,) vs (n, 1) would otherwise broadcast
        # to an (n, n) residual and silently produce meaningless gradients.
        raise ValueError(
            "x and y must have the same shape, got {} and {}".format(x.shape, y.shape)
        )

    beta1 = initial_beta1
    beta0 = initial_beta0
    n = x.shape[0]
    losses = []
    for i in range(epochs):
        residual = y - ((beta1 * x) + beta0)
        losses.append(np.mean(np.square(residual)))
        grad_beta1 = (-1 / n) * np.sum(x * residual)
        grad_beta0 = (-1 / n) * np.sum(residual)
        beta1 = beta1 - eta * grad_beta1
        beta0 = beta0 - eta * grad_beta0
        if i % 50 == 0:
            # Progress report: the loss shown was computed before this step's
            # update, the coefficients shown are the values after it.
            print(
                f"Step {i + 1}: Current loss is {round(losses[i], 4)}, "
                f"slope (beta1) is {round(beta1, 4)}, "
                f"and intercept (beta0) is {round(beta0, 4)}."
            )
    return beta1, beta0, losses


# Simulated data set: 1000 predictor values drawn from rng.rand and scaled by
# 10, with responses on the line y = 2x - 5 plus rng.randn noise.  The seed is
# fixed so every run reproduces the same numbers.
rng = np.random.RandomState(1)
x = rng.rand(1000) * 10
y = (2 * x - 5) + rng.randn(1000)

# Fixed-length run: 1000 gradient steps with a small learning rate.
beta1, beta0, losses = ols_grad_descent(
    x,
    y,
    epochs=1000,
    initial_beta1=0,
    initial_beta0=1,
    eta=0.01,
)

Step 1: Current loss is 50.8109, slope (beta1) is 0.3696, and intercept (beta0) is 1.0406.
Step 51: Current loss is 8.3511, slope (beta1) is 1.1844, and intercept (beta0) is 0.4467.
Step 101: Current loss is 6.768, slope (beta1) is 1.2782, and intercept (beta0) is -0.1738.
Step 151: Current loss is 5.5276, slope (beta1) is 1.3612, and intercept (beta0) is -0.7231.
Step 201: Current loss is 4.5556, slope (beta1) is 1.4347, and intercept (beta0) is -1.2093.
Step 251: Current loss is 3.794, slope (beta1) is 1.4997, and intercept (beta0) is -1.6397.
Step 301: Current loss is 3.1973, slope (beta1) is 1.5573, and intercept (beta0) is -2.0207.
Step 351: Current loss is 2.7297, slope (beta1) is 1.6082, and intercept (beta0) is -2.3579.
Step 401: Current loss is 2.3633, slope (beta1) is 1.6533, and intercept (beta0) is -2.6564.
Step 451: Current loss is 2.0762, slope (beta1) is 1.6932, and intercept (beta0) is -2.9207.
Step 501: Current loss is 1.8513, slope (beta1) is 1.7286, and intercept (beta0) is -3.1546.
Step 551: Current loss is 1.675, slope (beta1) is 1.7599, and intercept (beta0) is -3.3617.
Step 601: Current loss is 1.5369, slope (beta1) is 1.7876, and intercept (beta0) is -3.5449.
Step 651: Current loss is 1.4287, slope (beta1) is 1.8121, and intercept (beta0) is -3.7072.
Step 701: Current loss is 1.3439, slope (beta1) is 1.8338, and intercept (beta0) is -3.8508.
Step 751: Current loss is 1.2775, slope (beta1) is 1.853, and intercept (beta0) is -3.9779.
Step 801: Current loss is 1.2254, slope (beta1) is 1.87, and intercept (beta0) is -4.0904.
Step 851: Current loss is 1.1846, slope (beta1) is 1.885, and intercept (beta0) is -4.19.
Step 901: Current loss is 1.1527, slope (beta1) is 1.8983, and intercept (beta0) is -4.2782.
Step 951: Current loss is 1.1276, slope (beta1) is 1.9101, and intercept (beta0) is -4.3563.


from matplotlib import pyplot as plt

# Loss curve for the run above, plotted against the 1-based iteration number.
# The x-axis is derived from len(losses) rather than repeating the epoch count
# by hand, so the plot cannot fall out of step with the fitting call.
plt.plot(range(1, len(losses) + 1), losses, label="loss")
plt.legend()
plt.xlabel("iteration")
plt.show()


# Same data, start values and learning rate, but twice as many updates (2000).
beta1, beta0, losses = ols_grad_descent(
    x,
    y,
    epochs=2000,
    initial_beta1=0,
    initial_beta0=1,
    eta=0.01,
)

Step 1: Current loss is 50.8109, slope (beta1) is 0.3696, and intercept (beta0) is 1.0406.
Step 51: Current loss is 8.3511, slope (beta1) is 1.1844, and intercept (beta0) is 0.4467.
Step 101: Current loss is 6.768, slope (beta1) is 1.2782, and intercept (beta0) is -0.1738.
Step 151: Current loss is 5.5276, slope (beta1) is 1.3612, and intercept (beta0) is -0.7231.
Step 201: Current loss is 4.5556, slope (beta1) is 1.4347, and intercept (beta0) is -1.2093.
Step 251: Current loss is 3.794, slope (beta1) is 1.4997, and intercept (beta0) is -1.6397.
Step 301: Current loss is 3.1973, slope (beta1) is 1.5573, and intercept (beta0) is -2.0207.
Step 351: Current loss is 2.7297, slope (beta1) is 1.6082, and intercept (beta0) is -2.3579.
Step 401: Current loss is 2.3633, slope (beta1) is 1.6533, and intercept (beta0) is -2.6564.
Step 451: Current loss is 2.0762, slope (beta1) is 1.6932, and intercept (beta0) is -2.9207.
Step 501: Current loss is 1.8513, slope (beta1) is 1.7286, and intercept (beta0) is -3.1546.
Step 551: Current loss is 1.675, slope (beta1) is 1.7599, and intercept (beta0) is -3.3617.
Step 601: Current loss is 1.5369, slope (beta1) is 1.7876, and intercept (beta0) is -3.5449.
Step 651: Current loss is 1.4287, slope (beta1) is 1.8121, and intercept (beta0) is -3.7072.
Step 701: Current loss is 1.3439, slope (beta1) is 1.8338, and intercept (beta0) is -3.8508.
Step 751: Current loss is 1.2775, slope (beta1) is 1.853, and intercept (beta0) is -3.9779.
Step 801: Current loss is 1.2254, slope (beta1) is 1.87, and intercept (beta0) is -4.0904.
Step 851: Current loss is 1.1846, slope (beta1) is 1.885, and intercept (beta0) is -4.19.
Step 901: Current loss is 1.1527, slope (beta1) is 1.8983, and intercept (beta0) is -4.2782.
Step 951: Current loss is 1.1276, slope (beta1) is 1.9101, and intercept (beta0) is -4.3563.
Step 1001: Current loss is 1.108, slope (beta1) is 1.9206, and intercept (beta0) is -4.4253.
Step 1051: Current loss is 1.0926, slope (beta1) is 1.9298, and intercept (beta0) is -4.4865.
Step 1101: Current loss is 1.0806, slope (beta1) is 1.938, and intercept (beta0) is -4.5406.
Step 1151: Current loss is 1.0711, slope (beta1) is 1.9452, and intercept (beta0) is -4.5886.
Step 1201: Current loss is 1.0637, slope (beta1) is 1.9517, and intercept (beta0) is -4.631.
Step 1251: Current loss is 1.0579, slope (beta1) is 1.9573, and intercept (beta0) is -4.6685.
Step 1301: Current loss is 1.0534, slope (beta1) is 1.9623, and intercept (beta0) is -4.7018.
Step 1351: Current loss is 1.0498, slope (beta1) is 1.9668, and intercept (beta0) is -4.7312.
Step 1401: Current loss is 1.0471, slope (beta1) is 1.9707, and intercept (beta0) is -4.7572.
Step 1451: Current loss is 1.0449, slope (beta1) is 1.9742, and intercept (beta0) is -4.7803.
Step 1501: Current loss is 1.0432, slope (beta1) is 1.9773, and intercept (beta0) is -4.8007.
Step 1551: Current loss is 1.0418, slope (beta1) is 1.98, and intercept (beta0) is -4.8187.
Step 1601: Current loss is 1.0408, slope (beta1) is 1.9824, and intercept (beta0) is -4.8347.
Step 1651: Current loss is 1.0399, slope (beta1) is 1.9846, and intercept (beta0) is -4.8489.
Step 1701: Current loss is 1.0393, slope (beta1) is 1.9865, and intercept (beta0) is -4.8614.
Step 1751: Current loss is 1.0388, slope (beta1) is 1.9881, and intercept (beta0) is -4.8725.
Step 1801: Current loss is 1.0384, slope (beta1) is 1.9896, and intercept (beta0) is -4.8823.
Step 1851: Current loss is 1.0381, slope (beta1) is 1.9909, and intercept (beta0) is -4.891.
Step 1901: Current loss is 1.0378, slope (beta1) is 1.9921, and intercept (beta0) is -4.8987.
Step 1951: Current loss is 1.0376, slope (beta1) is 1.9931, and intercept (beta0) is -4.9055.


# Loss curve for the 2000-epoch run.  The x-axis length comes from the recorded
# losses instead of a hand-copied epoch count.
plt.plot(range(1, len(losses) + 1), losses, label="loss")
plt.legend()
plt.xlabel("iteration")
plt.show()


def eps_ols_grad_descent(x, y, alpha=0.001, initial_beta1=0, initial_beta0=1, eta=0.1,
                         max_iter=None):
    """Fit ``y ~ beta1 * x + beta0`` by gradient descent until the updates are small.

    Iteration stops as soon as the largest absolute change in either
    coefficient during one update is no longer greater than ``alpha`` (or
    when ``max_iter`` updates have been made, if given). At least one update
    is attempted for any finite ``alpha``.

    The recorded loss is the mean squared error, while the gradients are those
    of *half* the mean squared error (there is no factor of 2).

    Args:
        x: Predictor values; any array-like accepted by ``np.asarray``.
        y: Response values; must have the same shape as ``x``.
        alpha: Convergence tolerance on the per-step coefficient change.
        initial_beta1: Starting value for the slope.
        initial_beta0: Starting value for the intercept.
        eta: Learning rate (step size).
        max_iter: Optional upper bound on the number of updates. ``None``
            (the default) means no bound.

    Returns:
        A tuple ``(beta1, beta0, losses)`` where ``losses[i]`` is the mean
        squared error measured *before* update ``i`` is applied.

    Raises:
        ValueError: If ``x`` and ``y`` do not have the same shape.
    """
    # Accept lists/tuples as well as arrays.
    x = np.asarray(x)
    y = np.asarray(y)
    if x.shape != y.shape:
        # Mismatched shapes such as (n,) vs (n, 1) would otherwise broadcast
        # to an (n, n) residual and silently produce meaningless gradients.
        raise ValueError(
            "x and y must have the same shape, got {} and {}".format(x.shape, y.shape)
        )

    beta1 = initial_beta1
    beta0 = initial_beta0
    n = x.shape[0]
    losses = []
    i = 0
    # Start at infinity so the first update always runs; a finite sentinel
    # would skip the loop whenever ``alpha`` is at least as large as it.
    diff = np.inf
    while diff > alpha and (max_iter is None or i < max_iter):
        residual = y - ((beta1 * x) + beta0)
        losses.append(np.mean(np.square(residual)))
        grad_beta1 = (-1 / n) * np.sum(x * residual)
        grad_beta0 = (-1 / n) * np.sum(residual)
        new_beta1 = beta1 - eta * grad_beta1
        new_beta0 = beta0 - eta * grad_beta0
        # If the iterates overflow, this becomes NaN and the ``diff > alpha``
        # test is False, so a diverging run ends instead of spinning forever.
        diff = max(abs(beta1 - new_beta1), abs(beta0 - new_beta0))
        beta1 = new_beta1
        beta0 = new_beta0
        if i % 50 == 0:
            # Progress report: the loss shown was computed before this step's
            # update, the coefficients shown are the values after it.
            print(
                f"Step {i + 1}: Current loss is {round(losses[i], 4)}, "
                f"slope (beta1) is {round(beta1, 4)} "
                f"and intercept (beta0) is {round(beta0, 4)}."
            )
        i = i + 1
    return beta1, beta0, losses


# Tolerance-based run: keep stepping until neither coefficient moves by more
# than alpha in a single update.
beta1, beta0, losses = eps_ols_grad_descent(
    x,
    y,
    alpha=0.001,
    initial_beta1=0,
    initial_beta0=1,
    eta=0.01,
)

Step 1: Current loss is 50.8109, slope (beta1) is 0.3696 and intercept (beta0) is 1.0406.
Step 51: Current loss is 8.3511, slope (beta1) is 1.1844 and intercept (beta0) is 0.4467.
Step 101: Current loss is 6.768, slope (beta1) is 1.2782 and intercept (beta0) is -0.1738.
Step 151: Current loss is 5.5276, slope (beta1) is 1.3612 and intercept (beta0) is -0.7231.
Step 201: Current loss is 4.5556, slope (beta1) is 1.4347 and intercept (beta0) is -1.2093.
Step 251: Current loss is 3.794, slope (beta1) is 1.4997 and intercept (beta0) is -1.6397.
Step 301: Current loss is 3.1973, slope (beta1) is 1.5573 and intercept (beta0) is -2.0207.
Step 351: Current loss is 2.7297, slope (beta1) is 1.6082 and intercept (beta0) is -2.3579.
Step 401: Current loss is 2.3633, slope (beta1) is 1.6533 and intercept (beta0) is -2.6564.
Step 451: Current loss is 2.0762, slope (beta1) is 1.6932 and intercept (beta0) is -2.9207.
Step 501: Current loss is 1.8513, slope (beta1) is 1.7286 and intercept (beta0) is -3.1546.
Step 551: Current loss is 1.675, slope (beta1) is 1.7599 and intercept (beta0) is -3.3617.
Step 601: Current loss is 1.5369, slope (beta1) is 1.7876 and intercept (beta0) is -3.5449.
Step 651: Current loss is 1.4287, slope (beta1) is 1.8121 and intercept (beta0) is -3.7072.
Step 701: Current loss is 1.3439, slope (beta1) is 1.8338 and intercept (beta0) is -3.8508.
Step 751: Current loss is 1.2775, slope (beta1) is 1.853 and intercept (beta0) is -3.9779.
Step 801: Current loss is 1.2254, slope (beta1) is 1.87 and intercept (beta0) is -4.0904.
Step 851: Current loss is 1.1846, slope (beta1) is 1.885 and intercept (beta0) is -4.19.
Step 901: Current loss is 1.1527, slope (beta1) is 1.8983 and intercept (beta0) is -4.2782.
Step 951: Current loss is 1.1276, slope (beta1) is 1.9101 and intercept (beta0) is -4.3563.
Step 1001: Current loss is 1.108, slope (beta1) is 1.9206 and intercept (beta0) is -4.4253.
Step 1051: Current loss is 1.0926, slope (beta1) is 1.9298 and intercept (beta0) is -4.4865.
Step 1101: Current loss is 1.0806, slope (beta1) is 1.938 and intercept (beta0) is -4.5406.


# Loss curve for the tolerance-based run.  The number of iterations is not
# known in advance (it depends on the data, alpha and eta), so the x-axis is
# taken from len(losses) instead of a hand-copied iteration count.
plt.plot(range(1, len(losses) + 1), losses, label="loss")
plt.legend()
plt.xlabel("iteration")
plt.show()


# Same data with a ten-times larger learning rate (0.1 instead of 0.01); the
# captured output below shows the loss and coefficients blowing up.
beta1, beta0, losses = ols_grad_descent(
    x,
    y,
    epochs=500,
    initial_beta1=0,
    initial_beta0=1,
    eta=0.1,
)

Step 1: Current loss is 50.8109, slope (beta1) is 3.696, and intercept (beta0) is 1.4059.
Step 51: Current loss is 7.342036083869394e+39, slope (beta1) is 3.499588537195117e+19, and intercept (beta0) is 5.287696237287645e+18.
Step 101: Current loss is 1.3329942304915815e+78, slope (beta1) is 4.715446945615442e+38, and intercept (beta0) is 7.124795045603993e+37.
Step 151: Current loss is 2.4201374090596947e+116, slope (beta1) is 6.353729777254186e+57, and intercept (beta0) is 9.600155183631025e+56.
Step 201: Current loss is 4.393916301175761e+154, slope (beta1) is 8.561199510452273e+76, and intercept (beta0) is 1.2935527121817004e+76.
Step 251: Current loss is 7.977439788941246e+192, slope (beta1) is 1.1535608158873063e+96, and intercept (beta0) is 1.7429703866096797e+95.
Step 301: Current loss is 1.4483558908291895e+231, slope (beta1) is 1.5543412512767047e+115, and intercept (beta0) is 2.3485287765927346e+114.
Step 351: Current loss is 2.6295839793207815e+269, slope (beta1) is 2.094364416809775e+134, and intercept (beta0) is 3.1644756886620065e+133.
Step 401: Current loss is inf, slope (beta1) is 2.8220072695079514e+153, and intercept (beta0) is 4.263906188393032e+152.
Step 451: Current loss is inf, slope (beta1) is 3.80245432229336e+172, and intercept (beta0) is 5.745310684027919e+171.

/usr/local/lib/python3.9/dist-packages/numpy/core/_methods.py:180: RuntimeWarning: overflow encountered in reduce
  ret = umr_sum(arr, axis, dtype, out, keepdims, where=where)
/tmp/ipykernel_8368/3847878196.py:11: RuntimeWarning: overflow encountered in square
  losses.append(np.mean(np.square(y - y_pred)))


# Loss curve for the eta=0.1 run.  The x-axis length comes from the recorded
# losses instead of a hand-copied epoch count.
plt.plot(range(1, len(losses) + 1), losses, label="loss")
plt.legend()
plt.xlabel("iteration")
plt.show()

$F\left(\boldsymbol{X}\right)$	$\rightarrow$	$\nabla F\left(\boldsymbol{X}\right)$
$A\boldsymbol{X}$	$\rightarrow$	$A$
$\boldsymbol{X}^TA\boldsymbol{X}$	$\rightarrow$	$\left(A + A^T\right)\boldsymbol{X}$ ($= 2A\boldsymbol{X}$ when $A$ is symmetric)
$\boldsymbol{W}^T\boldsymbol{X}$	$\rightarrow$	$\boldsymbol{W}$
$\boldsymbol{X}^T\boldsymbol{X}$	$\rightarrow$	$2\boldsymbol{X}$

STATS 315: Statistics and Artificial Intelligence

Section 02

Linear Regression

1. Basics of Regression

2. Linear Regression

3. Gradient Descent

4. Minibatch Stochastic Gradient Descent

5. The Normal Distribution and Squared Loss

6. Neural Network and Biology

Summary