import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
The output of each neuron is passed to the neurons in the next layer (it forms part of the inputs for that layer).
# Generate data
np.random.seed(0)
size = 100
x = np.linspace(-2, 2, size)
y = 2.9 * np.sin(1.5 * x) + 2*np.random.normal(size=size)
# View data
plt.scatter(x, y)
plt.show()
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(
    x.reshape(-1, 1), y,
    test_size=0.2,
    random_state=0
)
from sklearn.neural_network import MLPRegressor
model = MLPRegressor(
    hidden_layer_sizes=(16, 8, 4, 2),
    random_state=0,
)
model.fit(X_train, y_train)
ConvergenceWarning: Stochastic Optimizer: Maximum iterations (200) reached and the optimization hasn't converged yet.
MLPRegressor(hidden_layer_sizes=(16, 8, 4, 2), random_state=0)
print(f"R-squared on test data is {model.score(X_test, y_test)}")
y_hat = model.predict(X_test)
y_true = 2.9 * np.sin(1.5 * X_test)  # noise-free signal for comparison
plt.scatter(X_test, y_test, label="actual")
plt.scatter(X_test, y_true, label="true")
plt.scatter(X_test, y_hat, label="predicted")
plt.legend()
plt.show()
R-squared on test data is 0.0886708545090823
How well does the model work if size=10000?
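One way to explore this question is to regenerate the data with size=10000 and refit the same architecture. The snippet below is a sketch of that experiment (its output is not shown here and would need to be run).
# Sketch: regenerate the sine data with a larger sample and refit
np.random.seed(0)
size_big = 10000
x_big = np.linspace(-2, 2, size_big)
y_big = 2.9 * np.sin(1.5 * x_big) + 2 * np.random.normal(size=size_big)
X_tr_big, X_te_big, y_tr_big, y_te_big = train_test_split(
    x_big.reshape(-1, 1), y_big, test_size=0.2, random_state=0
)
big_model = MLPRegressor(hidden_layer_sizes=(16, 8, 4, 2), random_state=0)
big_model.fit(X_tr_big, y_tr_big)
print(f"R-squared on test data is {big_model.score(X_te_big, y_te_big)}")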
# Generate 50 features (predictors)
np.random.seed(0)
size = 100
X = pd.DataFrame(
    np.random.normal(size=(size, 50))
)
# Some noise
noise = np.random.normal(size=size)
# Regression target
yr = X[0] + noise
# Binary target
yb = 1*(yr > 0)
# Multi-class target
ym = 1*(yr > -1) + 1*(yr > 1)
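As a quick sanity check on these constructions, one can inspect the class counts; a minimal sketch using np.bincount:
# Sketch: how the thresholds split the observations into classes
print("binary class counts:", np.bincount(yb))   # counts for classes 0 and 1
print("multi-class counts:", np.bincount(ym))    # counts for classes 0, 1 and 2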
Xb_train, Xb_test, yb_train, yb_test = train_test_split(
    X, yb,
    test_size=0.2,
    random_state=0
)
Xm_train, Xm_test, ym_train, ym_test = train_test_split(
    X, ym,
    test_size=0.2,
    random_state=0
)
Xr_train, Xr_test, yr_train, yr_test = train_test_split(
    X, yr,
    test_size=0.2,
    random_state=0
)
from sklearn.neural_network import MLPClassifier
model = MLPClassifier(
    hidden_layer_sizes=(16, 8, 4, 2),
    random_state=0
)
model.fit(Xb_train, yb_train)
score_train = model.score(Xb_train, yb_train)
score_test = model.score(Xb_test, yb_test)
print("fraction of correct predictions on training data is", score_train)
print("fraction of correct predictions on test data is", score_test)
fraction of correct predictions on training data is 0.875
fraction of correct predictions on test data is 0.6
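The multi-class split created above can be fitted in exactly the same way; the sketch below mirrors the binary case (its scores are not shown here and would need to be run).
# Sketch: the same architecture on the three-class target
model_m = MLPClassifier(
    hidden_layer_sizes=(16, 8, 4, 2),
    random_state=0
)
model_m.fit(Xm_train, ym_train)
print("fraction of correct predictions on training data is", model_m.score(Xm_train, ym_train))
print("fraction of correct predictions on test data is", model_m.score(Xm_test, ym_test))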
from sklearn.model_selection import GridSearchCV
hidden_layers = [
    (8, 4, 2),
    (8, 4),
    (8, 8),
]
cv = GridSearchCV(
    model,
    param_grid={"hidden_layer_sizes": hidden_layers},
)
cv.fit(Xb_train, yb_train)
print(f"best hidden layers is {cv.best_params_}")
print(f"score on the test data is {cv.score(Xb_test, yb_test)}")
(The same ConvergenceWarning is emitted for each of the cross-validation fits.)
best hidden layers is {'hidden_layer_sizes': (8, 8)}
score on the test data is 0.6
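The ConvergenceWarning raised by each fit indicates the stochastic optimizer stopped at the default budget of 200 iterations before converging. One remedy worth trying, sketched below, is to raise max_iter (the choice of 2000 here is arbitrary).
# Sketch: give the optimizer a larger iteration budget
model_long = MLPClassifier(
    hidden_layer_sizes=(8, 8),
    max_iter=2000,   # default is 200
    random_state=0
)
model_long.fit(Xb_train, yb_train)
print("test accuracy with max_iter=2000:", model_long.score(Xb_test, yb_test))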
We denote the model's prediction by $h(x_i, \theta)$, where $\theta = (\theta_1, \theta_2)$: $\theta_1$ denotes the parameters of the hidden-layer neurons and $\theta_2$ denotes the parameters of the output layer.
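Concretely, with a single hidden layer and an elementwise activation $\sigma$, one common way to write this prediction (a sketch of the notation, with bias terms omitted) is

$$h(x_i, \theta) = \theta_2^\top \, \sigma(\theta_1 x_i),$$

where $\theta_1$ is the hidden-layer weight matrix and $\theta_2$ is the output-layer weight vector.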
import torch
# Creating a tensor from a list
tensor_from_list = torch.tensor([1, 2, 3, 4, 5])
# Creating a tensor from a numpy array
numpy_array = np.array([6, 7, 8, 9, 10])
tensor_from_numpy = torch.from_numpy(numpy_array)
# Creating a 2x3 matrix filled with zeros
zeros_tensor = torch.zeros(2, 3)
# Creating a 2x3 matrix filled with ones
ones_tensor = torch.ones(2, 3)
# Displaying the created tensors
tensor_from_list, tensor_from_numpy, zeros_tensor, ones_tensor
(tensor([1, 2, 3, 4, 5]),
 tensor([ 6,  7,  8,  9, 10], dtype=torch.int32),
 tensor([[0., 0., 0.],
         [0., 0., 0.]]),
 tensor([[1., 1., 1.],
         [1., 1., 1.]]))
Automatic differentiation is a key feature of PyTorch that enables the computation of gradients for tensor operations. This is essential for training neural networks with gradient-based optimization algorithms. In PyTorch, the autograd package provides this capability: when a tensor has its requires_grad attribute set to True, every operation performed on that tensor is tracked, and we can later compute the gradient of the result with respect to the tensor.
# Creating a tensor and setting requires_grad to True
x = torch.tensor(2.0, requires_grad=True)
# Defining a simple function
y = x ** 2
# Computing the gradient
y.backward()
# Displaying the gradient dy/dx at x = 2
x.grad
tensor(4.)
x = torch.tensor(2.0, requires_grad=True)
# Defining a simple composite function
y = x ** 2
z = 3 * y
# Computing the gradient
z.backward()
# Displaying the gradient dz/dx = (dz/dy)*(dy/dx) = 3 * 2x = 12 at x = 2
x.grad
tensor(12.)
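One caveat worth knowing before we build full models: PyTorch accumulates gradients in .grad across backward() calls rather than overwriting them. A minimal sketch:
# Sketch: gradients accumulate across backward() calls
x = torch.tensor(2.0, requires_grad=True)
(x ** 2).backward()
print(x.grad)    # tensor(4.)
(x ** 2).backward()
print(x.grad)    # tensor(8.) -- accumulated, not replaced
x.grad.zero_()   # reset before computing a fresh gradient
This accumulation is the reason for the optimizer.zero_grad() call in the training loop later on.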
# Load the wine dataset
from sklearn.datasets import load_wine
X, y = load_wine(return_X_y=True)
print(f"(numobs, numfeatures) = {X.shape}")
print(f"(unique values of y are {np.unique(y)})")
# Split the data into training and testing sets (80% train, 20% test)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=0)
(numobs, numfeatures) = (178, 13)
unique values of y are [0 1 2]
Notice that we fit the transform on the training data. We then apply the fitted transform to the test data. This is how a scikit-learn pipeline works too.
from sklearn.preprocessing import StandardScaler
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)
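For reference, the same fit-on-train / transform-on-test logic can be packaged in a scikit-learn Pipeline. The sketch below uses hypothetical names X_train_raw and X_test_raw for the unscaled splits, since X_train and X_test were just overwritten in place by their scaled versions.
# Sketch: scaling inside a Pipeline
from sklearn.pipeline import Pipeline

pipe = Pipeline([
    ("scaler", StandardScaler()),
    ("clf", MLPClassifier(hidden_layer_sizes=(16, 8), random_state=0)),
])
pipe.fit(X_train_raw, y_train)    # the scaler is fitted on training data only
pipe.score(X_test_raw, y_test)    # the fitted scaler transforms the test data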
X_train_tensor = torch.tensor(X_train, dtype=torch.float32)
X_test_tensor = torch.tensor(X_test, dtype=torch.float32)
y_train_tensor = torch.tensor(y_train, dtype=torch.int64)
y_test_tensor = torch.tensor(y_test, dtype=torch.int64)
import torch.nn as nn
import torch.nn.functional as F
class WineClassifier(nn.Module):
    def __init__(self):
        super(WineClassifier, self).__init__()  # inherit from nn.Module
        # Define the layers
        self.layer1 = nn.Linear(13, 64)   # Hidden layer 1
        self.layer2 = nn.Linear(64, 32)   # Hidden layer 2
        self.layer3 = nn.Linear(32, 16)   # Hidden layer 3
        self.out = nn.Linear(16, 3)       # Output layer

    def forward(self, x):
        x = F.relu(self.layer1(x))
        x = F.relu(self.layer2(x))
        x = F.relu(self.layer3(x))
        x = self.out(x)
        return F.log_softmax(x, dim=1)
# Instantiate the model
model = WineClassifier()
model
WineClassifier(
  (layer1): Linear(in_features=13, out_features=64, bias=True)
  (layer2): Linear(in_features=64, out_features=32, bias=True)
  (layer3): Linear(in_features=32, out_features=16, bias=True)
  (out): Linear(in_features=16, out_features=3, bias=True)
)
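A quick way to gauge the size of this network is to count its trainable parameters; a small sketch:
# Sketch: count trainable parameters
# 13*64+64 + 64*32+32 + 32*16+16 + 16*3+3 = 3555
n_params = sum(p.numel() for p in model.parameters() if p.requires_grad)
print(f"trainable parameters: {n_params}")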
import torch.optim as optim
criterion = nn.CrossEntropyLoss()  # expects logits, but log-softmax outputs give the identical loss (log_softmax is idempotent)
optimizer = optim.SGD(model.parameters(), lr=0.01)
num_epochs = 100
losses = []
for epoch in range(num_epochs):
    # Forward pass
    outputs = model(X_train_tensor)
    loss = criterion(outputs, y_train_tensor)
    losses.append(loss.item())
    # Zero the gradients
    optimizer.zero_grad()
    # Backward pass
    loss.backward()
    # Update the parameters
    optimizer.step()
# Plot the loss curve
plt.plot(losses)
plt.xlabel('Epoch')
plt.ylabel('Loss')
plt.title('Training Loss Curve')
plt.show()
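The loop above takes one full-batch gradient step per epoch, which is fine for 142 training rows. For larger datasets one would typically switch to mini-batches with a DataLoader; the sketch below shows that pattern (it was not run here and would give somewhat different results than the full-batch loop).
# Sketch: the same training loop with mini-batches
from torch.utils.data import TensorDataset, DataLoader

train_ds = TensorDataset(X_train_tensor, y_train_tensor)
train_loader = DataLoader(train_ds, batch_size=16, shuffle=True)
for epoch in range(num_epochs):
    for batch_x, batch_y in train_loader:
        optimizer.zero_grad()
        loss = criterion(model(batch_x), batch_y)
        loss.backward()
        optimizer.step()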
logprobs = model(X_test_tensor)
maxlogprob, yhat = torch.max(logprobs, 1)  # dim=1: take the max over the class dimension for each row
correct = (yhat == y_test_tensor).sum().item()
accuracy = correct / len(y_test_tensor)
accuracy
0.6111111111111112
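An accuracy of about 0.61 leaves room for improvement. A common next experiment, sketched below, is to swap SGD for Adam (which often converges faster on small datasets like this) and train for more epochs; the resulting accuracy is not shown and would need to be re-run.
# Sketch: retrain with the Adam optimizer
model = WineClassifier()
optimizer = optim.Adam(model.parameters(), lr=0.001)
for epoch in range(200):
    optimizer.zero_grad()
    loss = criterion(model(X_train_tensor), y_train_tensor)
    loss.backward()
    optimizer.step()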