Outline¶
- Gradient descent
- Backpropagation
- Automatic differentiation
- PyTorch
Fitting a neural network¶
- Let $\theta$ denote all of the bias and weight parameters. Consider observation $i$ with target value $y_i$ and features $x_i$. Denote the prediction of the network by $h(x_i, \theta)$.
- In regression, we want to minimize $$ \frac{1}{2} \text{SSE} = \frac{1}{2}\sum_{i=1}^n [y_i - h(x_i, \theta)]^2.$$
- The gradient with respect to $\theta$ is $$ -\sum_{i=1}^n [y_i - h(x_i, \theta)] \nabla_\theta h(x_i, \theta).$$
- To minimize, we want to take a step in the opposite direction of the gradient (gradient descent).
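- As a concrete illustration, here is a minimal NumPy sketch of full-batch gradient descent on $\frac{1}{2}\text{SSE}$. The linear model $h(x, \theta) = \theta_0 + \theta_1 x$, the simulated data, and all names below are illustrative choices, not part of the lecture code.

import numpy as np

# minimal sketch: gradient descent on (1/2)*SSE with an illustrative
# "network" h(x, theta) = theta[0] + theta[1]*x
rng = np.random.default_rng(0)
x = rng.normal(size=100)
y = 1.0 + 2.0 * x + rng.normal(scale=0.1, size=100)

theta = np.zeros(2)
lr = 0.005                    # learning rate (step size)
for step in range(200):
    resid = y - (theta[0] + theta[1] * x)                 # y_i - h(x_i, theta)
    grad = np.array([-resid.sum(), -(resid * x).sum()])   # gradient of (1/2)*SSE
    theta -= lr * grad                                    # step opposite the gradient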
Mini-batch gradient descent¶
- The overall gradient is a sum over all training samples: $$ -\sum_{i=1}^n [y_i - h(x_i, \theta)] \nabla_\theta h(x_i, \theta)$$
- Should we wait until we have added all of these together before taking a step?
- Instead, add up the terms for a mini-batch of, say, 100 observations, take a small step, add up the next 100, and so on (the batch size need not be 100); see the sketch below.
- After going through all observations, shuffle them and start again (called a new epoch).
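- A sketch of this idea, again with the illustrative linear model rather than the lecture's network, is below; setting batch_size = 1 gives the stochastic gradient descent described next.

import numpy as np

# mini-batch gradient descent sketch; model and data are illustrative
rng = np.random.default_rng(0)
x = rng.normal(size=1000)
y = 1.0 + 2.0 * x + rng.normal(scale=0.1, size=1000)

theta = np.zeros(2)
lr = 0.01
batch_size = 100                 # batch_size = 1 would be stochastic gradient descent
for epoch in range(20):          # one epoch = one pass through the shuffled data
    order = rng.permutation(len(x))
    for start in range(0, len(x), batch_size):
        idx = order[start:start + batch_size]
        resid = y[idx] - (theta[0] + theta[1] * x[idx])
        grad = np.array([-resid.sum(), -(resid * x[idx]).sum()])
        theta -= lr * grad       # small step after each mini-batch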
Stochastic gradient descent¶
- Batch size = 1 is called stochastic gradient descent.
- This means that the gradient is calculated and a step is taken for each observation.
Example of gradient calculation¶
- Suppose there is only a single hidden layer with a single neuron.
- Let $\theta = (\theta_1, \theta_2)$, where $\theta_1 = (b_1, w_1)$ is the bias and weight of the hidden layer neuron and $\theta_2 = (b_2, w_2)$ is the bias and weight of the output layer.
- Let $a_i = f(x_i, \theta_1)$ denote the hidden layer neuron value (written $a_i$ rather than $y_i$, since $y_i$ already denotes the target).
- Let $z_i = g(a_i, \theta_2)$ denote the output layer value.
- The network prediction is $$h(x_i, \theta_1, \theta_2) = g(f(x_i, \theta_1), \theta_2)$$
Chain Rule¶
- The gradient of $h$ in $\theta_2$ is $$\nabla_{\theta_2} h(x_i, \theta) = \nabla_{\theta_2} g(a_i, \theta_2)$$
- The gradient of $h$ in $\theta_1$ is $$\nabla_{\theta_1} h(x_i, \theta) = \frac{\partial g(a_i, \theta_2)}{\partial a_i}\nabla_{\theta_1} f(x_i, \theta_1)$$
Forward and backward passes¶
- In a forward pass, the outputs of all the neurons are calculated, given the parameters.
- The local derivatives of each neuron's function (with respect to its inputs and parameters) can be computed and stored at the same time as the function values.
- In the backward pass, these local derivatives are multiplied together as prescribed by the chain rule to get the overall derivative.
- Once the overall derivative is known, $\theta$ is adjusted by taking a step in the opposite direction of the gradient (gradient descent).
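- The sketch below works through one forward and one backward pass for the single-hidden-neuron example, assuming, purely for concreteness, that $f$ is a tanh unit and $g$ is linear; the parameter values are made up.

import numpy as np

# forward and backward pass by hand for the one-hidden-neuron example,
# assuming (illustratively) f(x, theta_1) = tanh(w1*x + b1) and
# g(a, theta_2) = w2*a + b2; the numbers are made up
w1, b1 = 0.5, 0.1          # theta_1
w2, b2 = -1.2, 0.3         # theta_2
x_i = 2.0

# forward pass: compute and store intermediate values
a_i = np.tanh(w1 * x_i + b1)        # hidden neuron value f(x_i, theta_1)
z_i = w2 * a_i + b2                 # network output g(a_i, theta_2)

# local derivatives, available during the forward pass
dg_da = w2                          # dg/da_i
dg_db2, dg_dw2 = 1.0, a_i           # gradient of h in theta_2
df_db1 = 1.0 - a_i**2               # tanh'(w1*x_i + b1)
df_dw1 = (1.0 - a_i**2) * x_i

# backward pass: multiply per the chain rule
dh_db1 = dg_da * df_db1             # gradient of h in theta_1
dh_dw1 = dg_da * df_dw1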
Automatic differentiation¶
- A standard way to numerically calculate a derivative is to choose a small $\epsilon$ and calculate $$\frac{f(x + \epsilon) - f(x-\epsilon)}{2\epsilon}$$
- But there is a better way: automatic differentiation.
- Available in PyTorch and TensorFlow, though not in scikit-learn.
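- For example, a quick check of the central-difference formula above on a known function (the helper name below is made up):

import numpy as np

def central_diff(f, x, eps=1e-5):
    # numerical derivative via the central-difference formula
    return (f(x + eps) - f(x - eps)) / (2 * eps)

central_diff(np.sin, 1.0), np.cos(1.0)   # the two values should nearly agree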
From Wikipedia:
Automatic differentiation exploits the fact that every computer calculation, no matter how complicated, executes a sequence of elementary arithmetic operations (addition, subtraction, multiplication, division, etc.) and elementary functions (exp, log, sin, cos, etc.). By applying the chain rule repeatedly to these operations, partial derivatives of arbitrary order can be computed automatically, accurately to working precision, and using at most a small constant factor of more arithmetic operations than the original program.
Automatic differentiation example¶
- Can use PyTorch, TensorFlow, JAX, or autograd.
In [21]:
from autograd import grad

def fun(x):
    x1, x2 = x
    b = -3. if x1 * (x2 - 1) > 2 else 1.
    return b * (x1**2 + x2**2)

fun_grad = grad(fun)
fun_grad([1., 2.])
Out[21]:
[array(2.), array(4.)]
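- The same gradient can be obtained with PyTorch's autograd; here is a sketch using the torch API on the same function.

import torch

x = torch.tensor([1., 2.], requires_grad=True)
x1, x2 = x
b = -3. if x1 * (x2 - 1) > 2 else 1.
f = b * (x1**2 + x2**2)
f.backward()          # backward pass fills in x.grad
x.grad                # should again be [2., 4.]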
PyTorch¶
- Example data
- Train-test split
- Standard scaler
- Define network
- Define loss function and optimizer
- Train the network
Install PyTorch¶
- Use pip install torch or pip3 install torch
- Restart your kernel!
In [22]:
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
import torch
import torch.nn as nn
import torch.optim as optim
In [23]:
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
sns.set_style("whitegrid")
# some artificial data
np.random.seed(0)
size = 1000
x = np.linspace(-2, 2, size)
y = 2.9 * np.sin(1.5 * x) + np.random.normal(size=size)
# view data
plt.scatter(x, y)
plt.show()
Train-test split¶
In [24]:
# create n x 1 arrays
X = x.reshape(-1, 1)
y = y.reshape(-1, 1)
# split into train and test sets
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=0
)
Standard scaler¶
In [25]:
# most important when features are on different scales
scaler = StandardScaler()
X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)
Convert to pytorch tensors¶
In [26]:
X_train_scaled_tensor = torch.tensor(
    X_train_scaled, dtype=torch.float32
)
X_test_scaled_tensor = torch.tensor(
    X_test_scaled, dtype=torch.float32
)
y_train_tensor = torch.tensor(y_train, dtype=torch.float32)
y_test_tensor = torch.tensor(y_test, dtype=torch.float32)
Build your network¶
In [27]:
class MyNeuralNetwork(nn.Module):
    def __init__(self):
        super(MyNeuralNetwork, self).__init__()
        # first hidden layer consists of 16 neurons
        self.fc1 = nn.Linear(1, 16)
        # second hidden layer consists of 8 neurons
        self.fc2 = nn.Linear(16, 8)
        # third hidden layer consists of 4 neurons
        self.fc3 = nn.Linear(8, 4)
        # output layer consists of 1 neuron
        self.fc4 = nn.Linear(4, 1)

    # forward pass through all four layers
    def forward(self, x):
        x = torch.relu(self.fc1(x))
        x = torch.relu(self.fc2(x))
        x = torch.relu(self.fc3(x))
        return self.fc4(x)

model = MyNeuralNetwork()
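- A quick sanity check (not part of the original notebook) prints the architecture and the number of trainable parameters:

print(model)                                        # layer-by-layer summary
print(sum(p.numel() for p in model.parameters()))   # 209 for this architecture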
Define loss function and optimizer¶
- lr = learning rate
- weight_decay = L2 regularization
In [34]:
criterion = nn.MSELoss()
optimizer = optim.Adam(
    model.parameters(),
    lr=0.001,
    weight_decay=0.01
)
Fit the network¶
In [35]:
num_epochs = 1000
for epoch in range(num_epochs):
    model.train()
    optimizer.zero_grad()
    outputs = model(X_train_scaled_tensor)
    loss = criterion(outputs, y_train_tensor)
    loss.backward()
    optimizer.step()
    if (epoch + 1) % 100 == 0:
        print(f'Epoch [{epoch+1}/{num_epochs}], Loss: {loss.item():.4f}')
Epoch [100/1000], Loss: 1.0052
Epoch [200/1000], Loss: 0.9982
Epoch [300/1000], Loss: 0.9974
Epoch [400/1000], Loss: 0.9962
Epoch [500/1000], Loss: 0.9943
Epoch [600/1000], Loss: 0.9941
Epoch [700/1000], Loss: 0.9939
Epoch [800/1000], Loss: 0.9938
Epoch [900/1000], Loss: 0.9937
Epoch [1000/1000], Loss: 0.9936
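- The loop above uses the full training set in every step. A mini-batch version, sketched here with torch.utils.data and the tensors defined earlier (the batch size of 100 is an arbitrary choice), would look like:

from torch.utils.data import TensorDataset, DataLoader

train_ds = TensorDataset(X_train_scaled_tensor, y_train_tensor)
train_loader = DataLoader(train_ds, batch_size=100, shuffle=True)  # reshuffles each epoch

for epoch in range(num_epochs):
    model.train()
    for X_batch, y_batch in train_loader:
        optimizer.zero_grad()
        loss = criterion(model(X_batch), y_batch)
        loss.backward()
        optimizer.step()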
Evaluate performance¶
In [36]:
# predicted y's
y_hat = model(X_test_scaled_tensor).detach().numpy().flatten()
# true y's (without noise)
y_true = 2.9 * np.sin(1.5 * X_test)
plt.scatter(X_test, y_test, label="actual")
plt.scatter(X_test, y_hat, label="predicted")
plt.scatter(X_test, y_true, label="true")
plt.legend()
plt.show()
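- A numerical check of test-set performance (not in the original notebook) can accompany the plot; if the fit is good, the test MSE should be close to the noise variance of 1 used to generate the data.

model.eval()
with torch.no_grad():               # no gradients needed for evaluation
    test_preds = model(X_test_scaled_tensor)
    test_mse = criterion(test_preds, y_test_tensor).item()
print(f"Test MSE: {test_mse:.4f}")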