Debugging a Learning Algorithm
# for array computations and loading data
import numpy as np
# for building linear regression models and preparing data
from sklearn.linear_model import LinearRegression
from sklearn.preprocessing import StandardScaler, PolynomialFeatures
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error
# for building and training neural networks
import tensorflow as tf
# custom functions
import utils
# reduce display precision on numpy arrays
np.set_printoptions(precision=2)
# suppress warnings
tf.get_logger().setLevel('ERROR')
tf.autograph.set_verbosity(0)
# Load the dataset from the text file
data = np.loadtxt('./data/data_w3_ex1.csv', delimiter=',')
# Split the inputs and outputs into separate arrays
x = data[:,0]
y = data[:,1]
# Convert 1-D arrays into 2-D because the commands later will require it
x = np.expand_dims(x, axis=1)
y = np.expand_dims(y, axis=1)
print(f"the shape of the inputs x is: {x.shape}")
print(f"the shape of the targets y is: {y.shape}")
# Plot the entire dataset
utils.plot_dataset(x=x, y=y, title="input vs. target")
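# Note: `utils` is a course-provided helper module that isn't shown here. As a
# rough idea only, a minimal matplotlib stand-in for `plot_dataset` might look
# like this (the real helper's styling may differ):
import matplotlib.pyplot as plt

def plot_dataset_sketch(x, y, title):
    # Scatter-plot inputs against targets (illustrative stand-in, not utils' code)
    plt.scatter(x, y, marker='x', c='r')
    plt.title(title)
    plt.xlabel("x")
    plt.ylabel("y")
    plt.show()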
# Get 60% of the dataset as the training set. Put the remaining 40% in temporary variables: x_ and y_.
x_train, x_, y_train, y_ = train_test_split(x, y, test_size=0.40, random_state=1)
# Split the 40% subset above into two: one half for cross validation and the other for the test set
x_cv, x_test, y_cv, y_test = train_test_split(x_, y_, test_size=0.50, random_state=1)
# Delete temporary variables
del x_, y_
print(f"the shape of the training set (input) is: {x_train.shape}")
print(f"the shape of the training set (target) is: {y_train.shape}\n")
print(f"the shape of the cross validation set (input) is: {x_cv.shape}")
print(f"the shape of the cross validation set (target) is: {y_cv.shape}\n")
print(f"the shape of the test set (input) is: {x_test.shape}")
print(f"the shape of the test set (target) is: {y_test.shape}")
utils.plot_train_cv_test(x_train, y_train, x_cv, y_cv, x_test, y_test, title="input vs. target")
# Initialize the class
scaler_linear = StandardScaler()
# Compute the mean and standard deviation of the training set then transform it
X_train_scaled = scaler_linear.fit_transform(x_train)
print(f"Computed mean of the training set: {scaler_linear.mean_.squeeze():.2f}")
print(f"Computed standard deviation of the training set: {scaler_linear.scale_.squeeze():.2f}")
# Plot the results
utils.plot_dataset(x=X_train_scaled, y=y_train, title="scaled input vs. target")
# Initialize the class
linear_model = LinearRegression()
# Train the model
linear_model.fit(X_train_scaled, y_train)
# Feed the scaled training set and get the predictions
yhat = linear_model.predict(X_train_scaled)
# Use scikit-learn's utility function and divide by 2
print(f"training MSE (using sklearn function): {mean_squared_error(y_train, yhat) / 2}")
# for-loop implementation
total_squared_error = 0
for i in range(len(yhat)):
    squared_error_i = (yhat[i] - y_train[i])**2
    total_squared_error += squared_error_i
mse = total_squared_error / (2*len(yhat))
print(f"training MSE (for-loop implementation): {mse.squeeze()}")
# Scale the cross validation set using the mean and standard deviation of the training set
X_cv_scaled = scaler_linear.transform(x_cv)
print(f"Mean used to scale the CV set: {scaler_linear.mean_.squeeze():.2f}")
print(f"Standard deviation used to scale the CV set: {scaler_linear.scale_.squeeze():.2f}")
# Feed the scaled cross validation set
yhat = linear_model.predict(X_cv_scaled)
# Use scikit-learn's utility function and divide by 2
print(f"Cross validation MSE: {mean_squared_error(y_cv, yhat) / 2}")
# Instantiate the class to make polynomial features
poly = PolynomialFeatures(degree=2, include_bias=False)
# Compute the number of features and transform the training set
X_train_mapped = poly.fit_transform(x_train)
# Preview the first 5 elements of the new training set. Left column is `x` and right column is `x^2`
# Note: The `e+<number>` in the output denotes how many places the decimal point should
# be moved. For example, `3.24e+03` is equal to `3240`
print(X_train_mapped[:5])
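# With a single input feature, this mapping is just x and x^2 stacked
# column-wise; the same result by hand with NumPy:
X_train_mapped_manual = np.hstack([x_train, x_train**2])
print(f"max difference vs. PolynomialFeatures: {np.max(np.abs(X_train_mapped_manual - X_train_mapped)):.2e}")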
# Instantiate the class
scaler_poly = StandardScaler()
# Compute the mean and standard deviation of the training set then transform it
X_train_mapped_scaled = scaler_poly.fit_transform(X_train_mapped)
# Preview the first 5 elements of the scaled training set.
print(X_train_mapped_scaled[:5])
# Initialize the class
model = LinearRegression()
# Train the model
model.fit(X_train_mapped_scaled, y_train)
# Compute the training MSE
yhat = model.predict(X_train_mapped_scaled)
print(f"Training MSE: {mean_squared_error(y_train, yhat) / 2}")
# Add the polynomial features to the cross validation set
X_cv_mapped = poly.transform(x_cv)
# Scale the cross validation set using the mean and standard deviation of the training set
X_cv_mapped_scaled = scaler_poly.transform(X_cv_mapped)
# Compute the cross validation MSE
yhat = model.predict(X_cv_mapped_scaled)
print(f"Cross validation MSE: {mean_squared_error(y_cv, yhat) / 2}")
# Initialize lists that will contain the errors, models, and scalers for each degree
train_mses = []
cv_mses = []
models = []
scalers = []
# Loop 10 times; each iteration fits a polynomial one degree higher than the last
for degree in range(1, 11):
    # Add polynomial features to the training set
    poly = PolynomialFeatures(degree, include_bias=False)
    X_train_mapped = poly.fit_transform(x_train)
    # Scale the training set
    scaler_poly = StandardScaler()
    X_train_mapped_scaled = scaler_poly.fit_transform(X_train_mapped)
    scalers.append(scaler_poly)
    # Create and train the model
    model = LinearRegression()
    model.fit(X_train_mapped_scaled, y_train)
    models.append(model)
    # Compute the training MSE
    yhat = model.predict(X_train_mapped_scaled)
    train_mse = mean_squared_error(y_train, yhat) / 2
    train_mses.append(train_mse)
    # Add polynomial features and scale the cross validation set
    poly = PolynomialFeatures(degree, include_bias=False)
    X_cv_mapped = poly.fit_transform(x_cv)
    X_cv_mapped_scaled = scaler_poly.transform(X_cv_mapped)
    # Compute the cross validation MSE
    yhat = model.predict(X_cv_mapped_scaled)
    cv_mse = mean_squared_error(y_cv, yhat) / 2
    cv_mses.append(cv_mse)
# Plot the results
degrees = range(1, 11)
utils.plot_train_cv_mses(degrees, train_mses, cv_mses, title="degree of polynomial vs. train and CV MSEs")
# Get the model with the lowest CV MSE (add 1 because list indices start at 0)
# This also corresponds to the degree of the polynomial added
degree = np.argmin(cv_mses) + 1
print(f"Lowest CV MSE is found in the model with degree={degree}")
# Add polynomial features to the test set
poly = PolynomialFeatures(degree, include_bias=False)
X_test_mapped = poly.fit_transform(x_test)
# Scale the test set
X_test_mapped_scaled = scalers[degree-1].transform(X_test_mapped)
# Compute the test MSE
yhat = models[degree-1].predict(X_test_mapped_scaled)
test_mse = mean_squared_error(y_test, yhat) / 2
print(f"Training MSE: {train_mses[degree-1]:.2f}")
print(f"Cross Validation MSE: {cv_mses[degree-1]:.2f}")
print(f"Test MSE: {test_mse:.2f}")
# Add polynomial features
degree = 1
poly = PolynomialFeatures(degree, include_bias=False)
X_train_mapped = poly.fit_transform(x_train)
X_cv_mapped = poly.transform(x_cv)
X_test_mapped = poly.transform(x_test)
# Scale the features using the z-score
scaler = StandardScaler()
X_train_mapped_scaled = scaler.fit_transform(X_train_mapped)
X_cv_mapped_scaled = scaler.transform(X_cv_mapped)
X_test_mapped_scaled = scaler.transform(X_test_mapped)
# Initialize lists that will contain the errors for each model
nn_train_mses = []
nn_cv_mses = []
# Build the models
nn_models = utils.build_models()
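# `build_models` lives in the course's utils module, which isn't shown here. A
# plausible sketch of what it might return -- a few small dense regression
# networks of increasing capacity (the layer sizes below are illustrative
# assumptions, not the course's actual architectures):
def build_models_sketch():
    tf.random.set_seed(20)  # for reproducible weight initialization
    model_1 = tf.keras.Sequential([
        tf.keras.layers.Dense(25, activation='relu'),
        tf.keras.layers.Dense(15, activation='relu'),
        tf.keras.layers.Dense(1, activation='linear'),
    ], name='model_1')
    model_2 = tf.keras.Sequential([
        tf.keras.layers.Dense(20, activation='relu'),
        tf.keras.layers.Dense(12, activation='relu'),
        tf.keras.layers.Dense(12, activation='relu'),
        tf.keras.layers.Dense(20, activation='relu'),
        tf.keras.layers.Dense(1, activation='linear'),
    ], name='model_2')
    model_3 = tf.keras.Sequential([
        tf.keras.layers.Dense(32, activation='relu'),
        tf.keras.layers.Dense(16, activation='relu'),
        tf.keras.layers.Dense(8, activation='relu'),
        tf.keras.layers.Dense(4, activation='relu'),
        tf.keras.layers.Dense(12, activation='relu'),
        tf.keras.layers.Dense(1, activation='linear'),
    ], name='model_3')
    return [model_1, model_2, model_3]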
# Loop over the models
for model in nn_models:
    # Set up the loss and optimizer
    model.compile(
        loss='mse',
        optimizer=tf.keras.optimizers.Adam(learning_rate=0.1),
    )
    print(f"Training {model.name}...")
    # Train the model
    model.fit(
        X_train_mapped_scaled, y_train,
        epochs=300,
        verbose=0
    )
    print("Done!\n")
    # Record the training MSE
    yhat = model.predict(X_train_mapped_scaled)
    train_mse = mean_squared_error(y_train, yhat) / 2
    nn_train_mses.append(train_mse)
    # Record the cross validation MSE
    yhat = model.predict(X_cv_mapped_scaled)
    cv_mse = mean_squared_error(y_cv, yhat) / 2
    nn_cv_mses.append(cv_mse)
# Print the results
print("RESULTS:")
for model_num in range(len(nn_train_mses)):
    print(
        f"Model {model_num+1}: Training MSE: {nn_train_mses[model_num]:.2f}, " +
        f"CV MSE: {nn_cv_mses[model_num]:.2f}"
    )
# Select the model with the lowest CV MSE (model 3 in the results above)
model_num = 3
# Compute the test MSE
yhat = nn_models[model_num-1].predict(X_test_mapped_scaled)
test_mse = mean_squared_error(y_test, yhat) / 2
print(f"Selected Model: {model_num}")
print(f"Training MSE: {nn_train_mses[model_num-1]:.2f}")
print(f"Cross Validation MSE: {nn_cv_mses[model_num-1]:.2f}")
print(f"Test MSE: {test_mse:.2f}")
# Load the dataset from a text file
data = np.loadtxt('./data/data_w3_ex2.csv', delimiter=',')
# Split the inputs and outputs into separate arrays
x_bc = data[:,:-1]
y_bc = data[:,-1]
# Convert y into 2-D because the commands later will require it (x is already 2-D)
y_bc = np.expand_dims(y_bc, axis=1)
print(f"the shape of the inputs x is: {x_bc.shape}")
print(f"the shape of the targets y is: {y_bc.shape}")
utils.plot_bc_dataset(x=x_bc, y=y_bc, title="x1 vs. x2")
# Get 60% of the dataset as the training set. Put the remaining 40% in temporary variables.
x_bc_train, x_, y_bc_train, y_ = train_test_split(x_bc, y_bc, test_size=0.40, random_state=1)
# Split the 40% subset above into two: one half for cross validation and the other for the test set
x_bc_cv, x_bc_test, y_bc_cv, y_bc_test = train_test_split(x_, y_, test_size=0.50, random_state=1)
# Delete temporary variables
del x_, y_
print(f"the shape of the training set (input) is: {x_bc_train.shape}")
print(f"the shape of the training set (target) is: {y_bc_train.shape}\n")
print(f"the shape of the cross validation set (input) is: {x_bc_cv.shape}")
print(f"the shape of the cross validation set (target) is: {y_bc_cv.shape}\n")
print(f"the shape of the test set (input) is: {x_bc_test.shape}")
print(f"the shape of the test set (target) is: {y_bc_test.shape}")
# Scale the features
# Initialize the class
scaler_linear = StandardScaler()
# Compute the mean and standard deviation of the training set then transform it
x_bc_train_scaled = scaler_linear.fit_transform(x_bc_train)
x_bc_cv_scaled = scaler_linear.transform(x_bc_cv)
x_bc_test_scaled = scaler_linear.transform(x_bc_test)
# Sample model output
probabilities = np.array([0.2, 0.6, 0.7, 0.3, 0.8])
# Apply a threshold to the model output: 1 if greater than or equal to 0.5, else 0
predictions = np.where(probabilities >= 0.5, 1, 0)
# Ground truth labels
ground_truth = np.array([1, 1, 1, 1, 1])
# Initialize counter for misclassified data
misclassified = 0
# Get number of predictions
num_predictions = len(predictions)
# Loop over each prediction
for i in range(num_predictions):
    # Check if it matches the ground truth
    if predictions[i] != ground_truth[i]:
        # Add one to the counter if the prediction is wrong
        misclassified += 1
# Compute the fraction of the data that the model misclassified
fraction_error = misclassified/num_predictions
print(f"probabilities: {probabilities}")
print(f"predictions with threshold=0.5: {predictions}")
print(f"targets: {ground_truth}")
print(f"fraction of misclassified data (for-loop): {fraction_error}")
print(f"fraction of misclassified data (with np.mean()): {np.mean(predictions != ground_truth)}")