Multi-layer perceptrons¶
- A multi-layer perceptron (MLP) consists of "neurons" arranged in layers.
- A neuron is a mathematical function. It takes inputs $x_1, \ldots, x_n$, calculates a function $y=f(x_1, \ldots, x_n)$, and passes $y$ to the neurons in the next layer.
- The inputs in the first layer are the features.
- The inputs in successive layers are the outputs calculated by the previous layer.
- The last layer is a single neuron that produces the output.
- The "input layer" does no computation; it just holds the features. The last layer is the "output layer." The layers in between are called "hidden layers."
Illustration¶
- inputs $x_1, x_2, x_3, x_4$
- variables $y_1, \ldots, y_5$ are calculated in the hidden layer
- the output depends on $y_1, \ldots, y_5$
Rectified linear units¶
- The usual function for the neurons (except in the last layer) is
$$ y = \max(0,b+w_1x_1 + \cdots + w_nx_n)$$
- Parameters $b$ (called the bias) and $w_1, \ldots, w_n$ (called the weights) are different for different neurons.
- This function is called a rectified linear unit (ReLU); a small numerical sketch follows this list.
- Analogous to neurons firing in the brain:
- $y>0$ only when $b + \sum_i w_ix_i > 0$, that is, only when the weighted input is large enough.
- A biological neuron fires when it is sufficiently stimulated by signals from other neurons.
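A minimal numerical sketch (assuming NumPy) of the network in the illustration above: four inputs, a hidden layer of five ReLU neurons, and a linear output neuron. The weights and biases here are arbitrary made-up numbers, not trained values.
In [ ]:
import numpy as np

def relu_layer(x, W, b):
    # one row of W and one entry of b per neuron:
    # y_j = max(0, b_j + sum_i W[j, i] * x_i)
    return np.maximum(0.0, W @ x + b)

rng = np.random.default_rng(0)
x = np.array([1.0, -0.5, 2.0, 0.3])   # inputs x_1, ..., x_4
W1 = rng.normal(size=(5, 4))          # hidden-layer weights (5 neurons, 4 inputs each)
b1 = rng.normal(size=5)               # hidden-layer biases
w2 = rng.normal(size=5)               # output-neuron weights
b2 = 0.1                              # output-neuron bias

y = relu_layer(x, W1, b1)             # y_1, ..., y_5 from the hidden layer
z = b2 + w2 @ y                       # linear output, no truncation
print(y, z)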
Output neuron¶
- The output neuron does not apply the $\max(0,\cdot)$ truncation.
- For regression problems, it is linear:
$$z = b+w_1y_1 + \cdots + w_ny_n$$
- For classification, there is a linear function $z_i$ for each class, and the predicted probabilities are given by the softmax function: $$ \frac{e^{z_i}}{\sum_{j} e^{z_j}},$$ where the sum runs over the classes. A small sketch follows this list.
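A hedged sketch (assuming NumPy) of converting per-class linear scores $z_i$ into softmax probabilities; the scores here are made up.
In [ ]:
import numpy as np

z = np.array([2.0, 0.5, -1.0])   # one linear score per class
p = np.exp(z - z.max())          # subtract the max for numerical stability
p = p / p.sum()                  # softmax probabilities; they sum to 1
print(p)                         # the class with the largest score gets the largest probability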
Deep versus shallow learning¶
- Deep learning means a neural network with many layers. It is behind facial recognition, self-driving cars, and more.
- Gu, Kelly & Xiu: shallow networks seem to work better for predicting stock returns.
- Probably due to the low signal-to-noise ratio in returns data.
Neural net libraries¶
- scikit-learn (for small problems; CPU only)
- TensorFlow from Google (CPU or GPU)
- PyTorch from Facebook/Meta (the Python version of Torch; CPU or GPU)
- cuML from NVIDIA (GPU)
Example¶
In [7]:
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
sns.set_style("whitegrid")
# some artificial data
np.random.seed(0)
size = 1000
x = np.linspace(-2, 2, size)
y = 2.9 * np.sin(1.5 * x) + np.random.normal(size=size)
# view data
plt.scatter(x, y)
plt.show()
Split into train and test¶
In [8]:
from sklearn.model_selection import train_test_split
X = x.reshape(-1, 1)
X_train, X_test, y_train, y_test = train_test_split(
X, y, test_size=0.2, random_state=0
)
Scale the x variables¶
- With only one x variable, this doesn't matter.
- But MLPRegressor uses L2 regularization by default. This is sensitive to the scale of the x variables.
- So, in general, we scale the x variables.
In [9]:
from sklearn.preprocessing import StandardScaler
scaler = StandardScaler()
X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)
Define a model and train¶
In [10]:
from sklearn.neural_network import MLPRegressor
model = MLPRegressor(
hidden_layer_sizes=(16, 8, 4),
random_state=0,
max_iter=2000
)
model.fit(X_train_scaled, y_train)
print(f"R-squared on test data is {model.score(X_test_scaled, y_test)}")
R-squared on test data is 0.8322573476968619
View¶
In [11]:
# actual y's
plt.scatter(X_test, y_test, label="actual")
# predicted y's
y_hat = model.predict(X_test_scaled)
plt.scatter(X_test, y_hat, label="predicted")
# true y's (without noise)
y_true = 2.9 * np.sin(1.5 * X_test)
plt.scatter(X_test, y_true, label="true")
plt.legend()
plt.show()
Nonparametric estimation¶
- We got a similarly good fit using nonlinear least squares in the last class.
- But there we supplied the correct functional form $a\cdot \sin(bx)$ and only had to estimate $a$ and $b$.
- Here, we supplied no functional form and let the neural net figure it out. A sketch of the parametric fit is below for comparison.
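A minimal sketch of that parametric approach, assuming SciPy is available and reusing the x and y arrays generated above; only $a$ and $b$ in $a\sin(bx)$ are estimated.
In [ ]:
from scipy.optimize import curve_fit

def f(x, a, b):
    # the functional form supplied by hand
    return a * np.sin(b * x)

(a_hat, b_hat), _ = curve_fit(f, x, y, p0=[1.0, 1.0])
print(a_hat, b_hat)   # roughly 2.9 and 1.5, up to noise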
Compare different network configurations¶
In [12]:
import pandas as pd
networks = [
(4,),
(8,),
(16,),
(32,),
(64,),
(8, 4),
(16, 8, 4),
(32, 16, 8, 4),
(64, 32, 16, 8, 4),
]
dct = {}
for n in networks:
    model = MLPRegressor(
        hidden_layer_sizes=n, random_state=0, max_iter=2000
    )
    # with a single feature, scaling makes little difference, so the unscaled X's are used here
    model.fit(X_train, y_train)
    dct[n] = model.score(X_test, y_test)
print(pd.Series(dct))
(4,)                  0.791647
(8,)                  0.828308
(16,)                 0.832089
(32,)                 0.833226
(64,)                 0.832105
(8, 4)                0.803791
(16, 8, 4)            0.832003
(32, 16, 8, 4)        0.794628
(64, 32, 16, 8, 4)    0.832195
dtype: float64
Ask Julius¶
- to get the California house price data and
- split into train, validate, and test
- fit an MLP regressor with different network structures on the training data and compute R2's on the validation data
- fit the best model on the combined training and validation data and compute R2 on the test data (a sketch of this regression workflow is given after this list)
- to repeat with an MLP classifier on the breast cancer data
- use accuracy instead of R2 to select the best model
- compute the confusion matrix on the test data
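A possible sketch of the regression part of this exercise, assuming scikit-learn's built-in fetch_california_housing loader; the split sizes and the list of network shapes are arbitrary choices, not prescribed ones.
In [ ]:
from sklearn.datasets import fetch_california_housing
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.neural_network import MLPRegressor

X, y = fetch_california_housing(return_X_y=True)

# 60% train, 20% validate, 20% test
X_trainval, X_test, y_trainval, y_test = train_test_split(X, y, test_size=0.2, random_state=0)
X_train, X_val, y_train, y_val = train_test_split(X_trainval, y_trainval, test_size=0.25, random_state=0)

# compare network structures on the validation data
networks = [(32,), (64,), (32, 16), (64, 32, 16)]
scaler = StandardScaler().fit(X_train)
scores = {}
for n in networks:
    model = MLPRegressor(hidden_layer_sizes=n, random_state=0, max_iter=2000)
    model.fit(scaler.transform(X_train), y_train)
    scores[n] = model.score(scaler.transform(X_val), y_val)
best = max(scores, key=scores.get)

# refit the best structure on train + validation, then score once on the test data
scaler = StandardScaler().fit(X_trainval)
model = MLPRegressor(hidden_layer_sizes=best, random_state=0, max_iter=2000)
model.fit(scaler.transform(X_trainval), y_trainval)
print(best, model.score(scaler.transform(X_test), y_test))

The classifier part is analogous: MLPClassifier on the breast cancer data (load_breast_cancer), accuracy via model.score on the validation data to pick the structure, and sklearn.metrics.confusion_matrix on the test predictions.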