import pandas as pd
from pprint import pprint as pp
from itertools import combinations
from pathlib import Path
import requests
import numpy as np
import sys
import matplotlib.pyplot as plt
import matplotlib.ticker as mtick

from sklearn.metrics import mean_squared_error

from tensorflow.keras import datasets
from tensorflow.keras.layers import Dense
from tensorflow.keras.models import Sequential
from tensorflow.keras import layers
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import SGD
from tensorflow.keras.callbacks import EarlyStopping

import tensorflow as tf
tf.config.list_physical_devices('GPU')

[PhysicalDevice(name='/physical_device:GPU:0', device_type='GPU')]

# enable the last line to print device placement logging when running `.fit`
# example output: Executing op _EagerConst in device /job:localhost/replica:0/task:0/device:GPU:0
# tf.debugging.set_log_device_placement(True)

# set tf logging levels - 0: Info, 1: Warning, 2: Error, 3: None
# %env TF_CPP_MIN_LOG_LEVEL=3

# Create some tensors
a = tf.constant([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0]])
b = tf.constant([[1.0, 2.0], [3.0, 4.0], [5.0, 6.0]])
c = tf.matmul(a, b)

print(c)

tf.Tensor(
[[22. 28.]
 [49. 64.]], shape=(2, 2), dtype=float32)

# pd.set_option('max_columns', 200)
# pd.set_option('max_rows', 300)
# pd.set_option('display.expand_frame_repr', True)
# plt.rcParams["patch.force_edgecolor"] = True

def create_dir_save_file(dir_path: Path, url: str) -> None:
    """
    Make sure a local copy of a remote file exists, downloading it if needed.

    Despite its name, ``dir_path`` is the full path of the *file*; its parent
    directory is created when it is missing.

    Parameters
    ----------
    dir_path : Path
        Destination of the file (directory plus file name).
    url : str
        Address the file is fetched from when it is not already on disk.

    Raises
    ------
    requests.HTTPError
        If the server answers with a 4xx/5xx status, so that an error page
        is never saved under the data file's name.
    """
    parent_dir = dir_path.parent
    if not parent_dir.exists():
        # exist_ok covers the directory appearing between the check and mkdir
        parent_dir.mkdir(parents=True, exist_ok=True)
        print(f'Directory Created: {parent_dir}')
    else:
        print('Directory Exists')

    if not dir_path.exists():
        r = requests.get(url, allow_redirects=True)
        r.raise_for_status()
        # write_bytes opens, writes and closes the file, leaving no open handle
        dir_path.write_bytes(r.content)
        print(f'File Created: {dir_path.name}')
    else:
        print('File Exists')

# Local folders for the course data and for saved images
data_dir = Path('data/2021-04-19_intro_to_deep_learning_in_python')
images_dir = Path('Images/2021-04-19_intro_to_deep_learning_in_python')

# Source URLs of the three course datasets
file_1 = 'https://assets.datacamp.com/production/repositories/654/datasets/8a57adcdb5bfb3e603dad7d3c61682dfe63082b8/hourly_wages.csv'
file_2 = 'https://assets.datacamp.com/production/repositories/654/datasets/24769dae9dc51a77b9baa785d42ea42e3f8f7538/mnist.csv'
file_3 = 'https://assets.datacamp.com/production/repositories/654/datasets/92b75b9bc0c0a8a30999d76f4a1ee786ef072a9c/titanic_all_numeric.csv'

# Named dataset_urls (not datasets) so the `datasets` module imported from
# tensorflow.keras at the top of the file is not overwritten by a list.
dataset_urls = [file_1, file_2, file_3]
data_paths = []

for data in dataset_urls:
    # The file name is the last URL segment; a trailing '?raw=true' query
    # string is dropped if the URL has one.
    file_name = data.split('/')[-1].replace('?raw=true', '')
    data_path = data_dir / file_name
    create_dir_save_file(data_path, data)
    data_paths.append(data_path)

Directory Exists
File Exists
Directory Exists
File Exists
Directory Exists
File Exists

hw = pd.read_csv(data_paths[0])
hw.head(2)

mnist = pd.read_csv(data_paths[1], header=None)
mnist.iloc[:2, :6]

titanic = pd.read_csv(data_paths[2])
titanic.head(2)

# The usual IPython objects, plus the name of this list itself; all of them
# are excluded from the size report below.
ipython_vars = ['In', 'Out', 'exit', 'quit', 'get_ipython', 'ipython_vars']  # names to exclude

# Report the five largest remaining globals as (name, size) pairs, largest
# first. Private names (leading underscore) and imported modules are skipped.
# sys.getsizeof is shallow: it does not follow references into contained objects.
sorted([(x, sys.getsizeof(globals().get(x))) for x in dir() if not x.startswith('_') and x not in sys.modules and x not in ipython_vars], key=lambda x: x[1], reverse=True)[:5]

[('mnist', 12566424),
 ('titanic', 72315),
 ('hw', 42864),
 ('Dense', 1064),
 ('EarlyStopping', 1064)]

import numpy as np
from keras.layers import Dense
from keras.models import Sequential
predictors = np.loadtxt('predictors_data.csv', delimiter=',')
n_cols = predictors.shape[1]
model = Sequential()
model.add(Dense(100, activation='relu', input_shape = (n_cols,)))
model.add(Dense(100, activation='relu'))
model.add(Dense(1))

input_data = np.array([2, 3])
weights = {'node_0': np.array([1, 1]),
'node_1': np.array([-1, 1]),
'output': np.array([2, -1])}
node_0_value = (input_data * weights['node_0']).sum()
node_1_value = (input_data * weights['node_1']).sum()

hidden_layer_values = np.array([node_0_value, node_1_value])
print(hidden_layer_values)

output = (hidden_layer_values * weights['output']).sum()
print(output)

[5 1]
9

input_data = np.array([3, 5])
weights = {'node_0': np.array([2, 4]), 'node_1': np.array([ 4, -5]), 'output': np.array([2, 7])}

# Calculate node 0 value: node_0_value
node_0_value = (input_data * weights['node_0']).sum()

# Calculate node 1 value: node_1_value
node_1_value = (input_data * weights['node_1']).sum()

# Put node values into array: hidden_layer_outputs
hidden_layer_outputs = np.array([node_0_value, node_1_value])

# Calculate output: output
output = (hidden_layer_outputs * weights['output']).sum()

# Print output
print(output)

-39

input_data = np.array([-1, 2])
weights = {'node_0': np.array([3, 3]), 'node_1': np.array([1, 5]), 'output': np.array([2, -1])}

node_0_input = (input_data * weights['node_0']).sum()
node_0_output = np.tanh(node_0_input)

node_1_input = (input_data * weights['node_1']).sum()
node_1_output = np.tanh(node_1_input)

hidden_layer_outputs = np.array([node_0_output, node_1_output])

output = (hidden_layer_outputs * weights['output']).sum()
output

0.99010953783342

def relu(input_):
    '''Rectified linear activation for a single value.

    Returns ``input_`` unchanged when it is strictly greater than 0,
    otherwise returns 0.
    '''
    return input_ if input_ > 0 else 0

input_data = np.array([3, 5])
weights = {'node_0': np.array([2, 4]), 'node_1': np.array([ 4, -5]), 'output': np.array([2, 7])}

# Calculate node 0 value: node_0_output
node_0_input = (input_data * weights['node_0']).sum()
node_0_output = relu(node_0_input)

# Calculate node 1 value: node_1_output
node_1_input = (input_data * weights['node_1']).sum()
node_1_output = relu(node_1_input)

# Put node values into array: hidden_layer_outputs
hidden_layer_outputs = np.array([node_0_output, node_1_output])

# Calculate model output (do not apply relu)
model_output = (hidden_layer_outputs * weights['output']).sum()

# Print model output
print(model_output)

52

# Define predict_with_network()
def predict_with_network1(input_data_row, weights):
    """Forward-propagate one observation through a two-node hidden layer.

    Parameters
    ----------
    input_data_row
        Feature values of a single observation (numpy arrays in this notebook).
    weights : dict
        Weight vectors stored under the keys 'node_0', 'node_1' and 'output'.

    Returns
    -------
    The relu-activated value of the output node.
    """
    # Every hidden node is the relu of the weighted sum of the inputs
    hidden_layer_outputs = np.array([
        relu((input_data_row * weights[node]).sum())
        for node in ('node_0', 'node_1')
    ])

    # The output node combines the hidden activations and is rectified too
    return relu((hidden_layer_outputs * weights['output']).sum())

input_data = [np.array([3, 5]), np.array([ 1, -1]), np.array([0, 0]), np.array([8, 4])]
weights = {'node_0': np.array([2, 4]), 'node_1': np.array([ 4, -5]), 'output': np.array([2, 7])}

# Create empty list to store prediction results
results = []
for input_data_row in input_data:
    # Append prediction to results
    results.append(predict_with_network1(input_data_row, weights))

# Print results
print(results)

[52, 63, 0, 148]

def predict_with_network2(input_data, weights):
    """Forward-propagate one observation through two two-node hidden layers.

    Parameters
    ----------
    input_data
        Feature values of a single observation (a numpy array in this notebook).
    weights : dict
        Weight vectors stored under 'node_0_0' and 'node_0_1' (first hidden
        layer), 'node_1_0' and 'node_1_1' (second hidden layer) and 'output'.

    Returns
    -------
    The relu-activated value of the output node.
    """
    def layer(values, node_names):
        # relu of each node's weighted sum of the incoming values
        return np.array([relu((values * weights[name]).sum()) for name in node_names])

    hidden_0_outputs = layer(input_data, ('node_0_0', 'node_0_1'))
    hidden_1_outputs = layer(hidden_0_outputs, ('node_1_0', 'node_1_1'))

    # Final weighted sum of the second hidden layer, rectified like every node
    return relu((hidden_1_outputs * weights['output']).sum())

input_data = np.array([3, 5])
weights = {'node_0_0': np.array([2, 4]),
           'node_0_1': np.array([ 4, -5]),
           'node_1_0': np.array([-1,  2]),
           'node_1_1': np.array([1, 2]),
           'output': np.array([2, 7])}

output = predict_with_network2(input_data, weights)
print(output)

182

# The data point you will make a prediction for
input_data = np.array([0, 3])

# Sample weights
weights_0 = {'node_0': [2, 1],
             'node_1': [1, 2],
             'output': [1, 1]
            }

# The actual target value, used to calculate the error
target_actual = 3

# Make prediction using original weights
model_output_0 = predict_with_network1(input_data, weights_0)

# Calculate error: error_0
error_0 = model_output_0 - target_actual
error_0

6

# Create weights that cause the network to make perfect prediction (3): weights_1
weights_1 = {'node_0': [2, 1],
             'node_1': [1, 0],
             'output': [1, 1]
            }

# Make prediction using new weights: model_output_1
model_output_1 = predict_with_network1(input_data, weights_1)

# Calculate error: error_1
error_1 = model_output_1 - target_actual

# Print error_1
error_1

0

# Two candidate weight sets, compared on the same four observations
weights_0 = {'node_0': np.array([2, 1]), 'node_1': np.array([1, 2]), 'output': np.array([1, 1])}
weights_1 = {'node_0': np.array([2, 1]), 'node_1': np.array([1. , 1.5]), 'output': np.array([1. , 1.5])}
input_data = [np.array([0, 3]), np.array([1, 2]), np.array([-1, -2]), np.array([4, 0])]
target_actuals = [1, 3, 5, 7]

# mean_squared_error comes from sklearn.metrics (imported at the top of the file)

# Predictions of each weight set for every row of input_data
model_output_0 = [predict_with_network1(row, weights_0) for row in input_data]
model_output_1 = [predict_with_network1(row, weights_1) for row in input_data]

# Mean squared error of each set of predictions against the actual targets
mse_0 = mean_squared_error(target_actuals, model_output_0)
mse_1 = mean_squared_error(target_actuals, model_output_1)

# MSE is expressed in squared target units, not as a percentage, so the value
# is printed without a '%' sign.
print(f"Mean squared error with weights_0: {round(mse_0, 2)}")
print(f"Mean squared error with weights_1: {round(mse_1, 2)}")

Mean squared error with weights_0: %37.5
Mean squared error with weights_1: %49.89

weights = np.array([1, 2])
input_data = np.array([3, 4])
target = 6
learning_rate = 0.01

preds = (weights * input_data).sum()
error = preds - target
error

5

gradient = 2 * input_data * error
gradient

array([30, 40])

weights_updated = weights - learning_rate * gradient
preds_updated = (weights_updated * input_data).sum()
error_updated = preds_updated - target
error_updated

2.5

def get_slope(input_data, target, weights):
    """Slope of the squared error with respect to each weight.

    The prediction is the weighted sum of ``input_data``; the slope returned
    for every weight is ``2 * input * (prediction - target)``.

    Parameters
    ----------
    input_data
        Feature values of one observation (a numpy array in this notebook).
    target
        Actual value the prediction is compared with.
    weights
        Current weights, one per feature.

    Returns
    -------
    Array with one slope per weight.
    """
    prediction = (weights * input_data).sum()
    residual = prediction - target
    return 2 * input_data * residual

weights = np.array([0, 2, 1])
input_data = np.array([1, 2, 3])
target = 0

get_slope(input_data, target, weights)

array([14, 28, 42])

# Set the learning rate: learning_rate
learning_rate = 0.01

# Calculate the predictions: preds
preds = (weights * input_data).sum()

# Calculate the error: error
error = preds - target

# Calculate the slope: slope
slope = 2 * input_data * error

# Update the weights: weights_updated
weights_updated = weights - learning_rate * slope

# Get updated predictions: preds_updated
preds_updated = (weights_updated * input_data).sum()

# Calculate updated error: error_updated
error_updated = preds_updated - target

# Print the original error
print(error)

# Print the updated error
print(error_updated)

7
5.04

def get_mse(input_data, target, weights):
    """Mean squared error of the weighted-sum prediction for one observation.

    The prediction is the sum of ``weights * input_data``; it is scored
    against ``target`` with sklearn's ``mean_squared_error``, each wrapped in
    a one-element list.
    """
    prediction = (weights * input_data).sum()
    return mean_squared_error([target], [prediction])

weights = np.array([0, 2, 1])
input_data = np.array([1, 2, 3])
target = 0

n_updates = 20
learning_rate = 0.01  # step size applied to the slope on every update
mse_hist = []

# Repeated gradient-descent steps, recording the error after each one
for i in range(n_updates):
    # Slope of the squared error at the current weights
    slope = get_slope(input_data, target, weights)

    # Step against the slope
    weights = weights - learning_rate * slope

    # Error with the updated weights
    mse = get_mse(input_data, target, weights)
    mse_hist.append(mse)

# Plot the mse history. The y axis keeps plain numeric ticks: MSE is in
# squared target units, so a percent formatter would mislabel it.
plt.plot(mse_hist)
plt.xlabel('Iterations')
plt.ylabel('Mean Squared Error')
plt.show()

import numpy as np
from keras.layers import Dense
from keras.models import Sequential

predictors = np.loadtxt('predictors_data.csv', delimiter=',')
n_cols = predictors.shape[1]

model = Sequential()
model.add(Dense(100, activation='relu', input_shape=(n_cols,)))
model.add(Dense(100, activation='relu'))
model.add(Dense(1))

# hourly_wages.csv
hw = pd.read_csv(data_paths[0])

display(hw.head(3))

hw.describe()

# Import necessary modules
# import keras
# from keras.layers import Dense
# from keras.models import Sequential

predictors = hw.iloc[:, 1:].values

# Save the number of columns in predictors: n_cols
n_cols = predictors.shape[1]

# Set up the model: model
model = Sequential()

# Add the first layer
model.add(Dense(50, activation='relu', input_shape=(n_cols,)))

# Add the second layer
model.add(Dense(30, activation='relu'))

# Add the output layer
model.add(Dense(1))

n_cols = predictors.shape[1]
model = Sequential()
model.add(Dense(100, activation='relu', input_shape = (n_cols,)))
model.add(Dense(100, activation='relu'))
model.add(Dense(1))
model.compile(optimizer='adam', loss='mean_squared_error')

# Import necessary modules
# import keras
# from keras.layers import Dense
# from keras.models import Sequential

# Specify the model
n_cols = predictors.shape[1]
model = Sequential()
model.add(Dense(50, activation='relu', input_shape = (n_cols,)))
model.add(Dense(32, activation='relu'))
model.add(Dense(1))

# Compile the model
model.compile(optimizer='adam', loss='mean_squared_error')

# Verify that model contains information from compiling
print("Loss function: " + model.loss)

Loss function: mean_squared_error

# Import necessary modules
# import keras
# from keras.layers import Dense
# from keras.models import Sequential

target = hw.wage_per_hour.values

# Specify the model
n_cols = predictors.shape[1]
model = Sequential()
model.add(Dense(50, activation='relu', input_shape = (n_cols,)))
model.add(Dense(32, activation='relu'))
model.add(Dense(1))

# Compile the model
model.compile(optimizer='adam', loss='mean_squared_error')

# Fit the model
model.fit(x=predictors, y=target, epochs=5, verbose=1)

Epoch 1/5
17/17 [==============================] - 0s 2ms/step - loss: 30.3772
Epoch 2/5
17/17 [==============================] - 0s 1ms/step - loss: 22.7786
Epoch 3/5
17/17 [==============================] - 0s 1ms/step - loss: 21.8462
Epoch 4/5
17/17 [==============================] - 0s 1ms/step - loss: 21.4328
Epoch 5/5
17/17 [==============================] - 0s 1ms/step - loss: 21.2286

<tensorflow.python.keras.callbacks.History at 0x1e23df18940>

from tensorflow.keras.utils import to_categorical

data = pd.read_csv('basketball_shot_log.csv')
predictors = data.drop(['shot_result'], axis=1).values
# Recompute the input width for this dataset; without this, n_cols still
# holds the column count of whichever predictors were loaded previously.
n_cols = predictors.shape[1]
# One-hot encode the class labels for categorical_crossentropy
target = to_categorical(data['shot_result'])

model = Sequential()
model.add(Dense(100, activation='relu', input_shape=(n_cols,)))
model.add(Dense(100, activation='relu'))
model.add(Dense(100, activation='relu'))
# Two output nodes, one per class of the one-hot encoded target
model.add(Dense(2, activation='softmax'))
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])
model.fit(predictors, target)

# titanic data
df = pd.read_csv(data_paths[2])
df.age_was_missing = df.age_was_missing.astype(int)  # convert Boolean to a number
display(df.head(2))
df.describe()

# Import necessary modules
# import keras
# from keras.layers import Dense
# from keras.models import Sequential
# from keras.utils import to_categorical

predictors = df.iloc[:, 1:].values
n_cols = predictors.shape[1]

# Convert the target to categorical: target
target = to_categorical(df.survived)

# Set up the model
model = Sequential()

# Add the first layer
model.add(Dense(32, activation='relu', input_shape=(n_cols,)))

# Add the output layer
model.add(Dense(2, activation='softmax'))

# Compile the model
model.compile(optimizer='sgd', loss='categorical_crossentropy', metrics=['accuracy'])

# Fit the model
model.fit(predictors, target, epochs=5, verbose=1)

Epoch 1/5
28/28 [==============================] - 0s 1ms/step - loss: 2.5361 - accuracy: 0.6218
Epoch 2/5
28/28 [==============================] - 0s 1ms/step - loss: 1.1159 - accuracy: 0.6330
Epoch 3/5
28/28 [==============================] - 0s 1ms/step - loss: 0.7131 - accuracy: 0.6891
Epoch 4/5
28/28 [==============================] - 0s 1ms/step - loss: 0.6187 - accuracy: 0.6790
Epoch 5/5
28/28 [==============================] - 0s 1ms/step - loss: 0.6200 - accuracy: 0.6902

<tensorflow.python.keras.callbacks.History at 0x1e4c09b5550>

from tensorflow.keras.models import load_model
model.save('model_file.h5')
my_model = load_model('model_file.h5')
predictions = my_model.predict(data_to_predict_with)
probability_true = predictions[:, 1]

# Specify, compile, and fit the model
model = Sequential()
model.add(Dense(32, activation='relu', input_shape=(n_cols,)))
model.add(Dense(2, activation='softmax'))
model.compile(optimizer='sgd', 
              loss='categorical_crossentropy', 
              metrics=['accuracy'])

model.fit(predictors[:800, :], target[:800, :])

# Calculate predictions: predictions
pred_data = predictors[800:, :]
predictions = model.predict(pred_data)

# Calculate predicted probability of survival: predicted_prob_true
predicted_prob_true = predictions[:, 1]

# Print predicted_prob_true
predicted_prob_true

25/25 [==============================] - 0s 1ms/step - loss: 2.1631 - accuracy: 0.5562

array([0.14567937, 0.18335524, 0.990599  , 0.7644454 , 0.20688732,
       0.16710629, 0.02948781, 0.32653692, 0.10595483, 0.34744728,
       0.22476563, 0.1340201 , 0.12653537, 0.7111234 , 0.17362803,
       0.05378632, 0.25303987, 0.29152656, 0.07391907, 0.5541538 ,
       0.26096934, 0.21695887, 0.03222005, 0.21665907, 0.8414357 ,
       0.17796974, 0.40962723, 0.90199107, 0.18228547, 0.21002501,
       0.38249457, 0.75846094, 0.17792921, 0.26488808, 0.34510124,
       0.36842877, 0.3003544 , 0.17345351, 0.45608845, 0.23062544,
       0.31014034, 0.3439002 , 0.26858   , 0.13600093, 0.36479202,
       0.08198298, 0.23487027, 0.13783525, 0.32359642, 0.70273167,
       0.76990974, 0.00844374, 0.5318753 , 0.53725845, 0.09431058,
       0.32170808, 0.96364856, 0.05290617, 0.2508271 , 0.17792921,
       0.12100039, 0.30353713, 0.05930348, 0.22118652, 0.24584311,
       0.08197409, 0.22468218, 0.40365848, 0.1811305 , 0.6053713 ,
       0.22482468, 0.18244971, 0.10741129, 0.06134324, 0.22722283,
       0.38229367, 0.32472122, 0.32566735, 0.17256665, 0.29156753,
       0.31471428, 0.14831473, 0.28564858, 0.19433397, 0.23238342,
       0.11268502, 0.21445668, 0.42943263, 0.20138258, 0.31850585,
       0.16675813], dtype=float32)

def get_new_model(input_shape):
    """Build a fresh, uncompiled two-class classifier.

    Parameters
    ----------
    input_shape : tuple
        Shape of one input observation, passed to the first Dense layer.

    Returns
    -------
    A Sequential model with two 100-unit relu layers and a 2-unit softmax
    output layer.
    """
    return Sequential([
        Dense(100, activation='relu', input_shape=input_shape),
        Dense(100, activation='relu'),
        Dense(2, activation='softmax'),
    ])

lr_to_test = [0.000001, 0.01, 1]

# loop over learning rates
for lr in lr_to_test:
    # Build a new model for every learning rate so no run starts from weights
    # trained by a previous one; the input width is taken from the data itself.
    model = get_new_model((predictors.shape[1],))
    # `learning_rate` is the supported keyword; `lr` is a deprecated alias
    my_optimizer = SGD(learning_rate=lr)
    model.compile(optimizer=my_optimizer, loss='categorical_crossentropy')
    model.fit(predictors, target)

# setup data
# titanic data
df = pd.read_csv(data_paths[2])
df.age_was_missing = df.age_was_missing.astype(int)  # convert Boolean to a number

predictors = df.iloc[:, 1:].values
n_cols = predictors.shape[1]
input_shape = (n_cols,)

# Convert the target to categorical: target
target = to_categorical(df.survived)

# Import the SGD optimizer, which is done in the Imports section
# from tensorflow.keras.optimizers import SGD

# Create list of learning rates: lr_to_test
lr_to_test = [0.000001, 0.01, 0.1]

# Loop over learning rates
for lr in lr_to_test:
    print('\n\nTesting model with learning rate: %f\n'%lr )
    
    # Build new model to test, unaffected by previous models
    model = get_new_model(input_shape)
    
    # Create SGD optimizer with specified learning rate: my_optimizer
    my_optimizer = SGD(learning_rate=lr)
    
    # Compile the model
    model.compile(optimizer=my_optimizer, loss='categorical_crossentropy')
    
    # Fit the model
    model.fit(predictors, target)


Testing model with learning rate: 0.000001

28/28 [==============================] - 0s 1ms/step - loss: 4.9162


Testing model with learning rate: 0.010000

28/28 [==============================] - 0s 1ms/step - loss: 1.7546


Testing model with learning rate: 0.100000

28/28 [==============================] - 0s 1ms/step - loss: 5.9029

# Save the number of columns in predictors: n_cols
n_cols = predictors.shape[1]
input_shape = (n_cols,)

# Specify the model
model = Sequential()
model.add(Dense(100, activation='relu', input_shape=input_shape))
model.add(Dense(100, activation='relu'))
model.add(Dense(2, activation='softmax'))

# Compile the model
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Fit the model
hist = model.fit(predictors, target, validation_split=0.3)

20/20 [==============================] - 0s 8ms/step - loss: 0.8591 - accuracy: 0.6453 - val_loss: 0.7441 - val_accuracy: 0.6642

# Import EarlyStopping
# from tensorflow.keras.callbacks import EarlyStopping

# Save the number of columns in predictors: n_cols
n_cols = predictors.shape[1]
input_shape = (n_cols,)

# Specify the model
model = Sequential()
model.add(Dense(100, activation='relu', input_shape=input_shape))
model.add(Dense(100, activation='relu'))
model.add(Dense(2, activation='softmax'))

# Compile the model
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Define early_stopping_monitor
early_stopping_monitor = EarlyStopping(patience=2)

# Fit the model
hist = model.fit(predictors, target, validation_split=0.3, epochs=30, callbacks=[early_stopping_monitor])

Epoch 1/30
20/20 [==============================] - 0s 7ms/step - loss: 1.0995 - accuracy: 0.6067 - val_loss: 1.0541 - val_accuracy: 0.3545
Epoch 2/30
20/20 [==============================] - 0s 3ms/step - loss: 0.7416 - accuracy: 0.6100 - val_loss: 0.6975 - val_accuracy: 0.6493
Epoch 3/30
20/20 [==============================] - 0s 3ms/step - loss: 0.6284 - accuracy: 0.6918 - val_loss: 0.6053 - val_accuracy: 0.6791
Epoch 4/30
20/20 [==============================] - 0s 3ms/step - loss: 0.6310 - accuracy: 0.6790 - val_loss: 0.5499 - val_accuracy: 0.7575
Epoch 5/30
20/20 [==============================] - 0s 3ms/step - loss: 0.6026 - accuracy: 0.6918 - val_loss: 0.5236 - val_accuracy: 0.7537
Epoch 6/30
20/20 [==============================] - 0s 3ms/step - loss: 0.6084 - accuracy: 0.7030 - val_loss: 0.6164 - val_accuracy: 0.7052
Epoch 7/30
20/20 [==============================] - 0s 3ms/step - loss: 0.5811 - accuracy: 0.7030 - val_loss: 0.6076 - val_accuracy: 0.6604

# Specify the model
model_1 = Sequential()
model_1.add(Dense(10, activation='relu', input_shape=input_shape))
model_1.add(Dense(10, activation='relu'))
model_1.add(Dense(2, activation='softmax'))

# Compile the model
model_1.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

model_1.summary()

Model: "sequential_10"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
=================================================================
dense_28 (Dense)             (None, 10)                110       
_________________________________________________________________
dense_29 (Dense)             (None, 10)                110       
_________________________________________________________________
dense_30 (Dense)             (None, 2)                 22        
=================================================================
Total params: 242
Trainable params: 242
Non-trainable params: 0
_________________________________________________________________

# Define early_stopping_monitor
early_stopping_monitor = EarlyStopping(patience=2)

# Create the new model: model_2
model_2 = Sequential()

# Add the first and second layers
model_2.add(Dense(100, activation='relu', input_shape=input_shape))
model_2.add(Dense(100, activation='relu'))

# Add the output layer
model_2.add(Dense(2, activation='softmax'))

# Compile model_2
model_2.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Fit model_1
model_1_training = model_1.fit(predictors, target, epochs=15, validation_split=0.2, callbacks=[early_stopping_monitor], verbose=False)

# Fit model_2
model_2_training = model_2.fit(predictors, target, epochs=15, validation_split=0.2, callbacks=[early_stopping_monitor], verbose=False)

# Create the plot
plt.plot(model_1_training.history['val_loss'], 'r', label='model_1')
plt.plot(model_2_training.history['val_loss'], 'b', label='model_2')
plt.xlabel('Epochs')
plt.ylabel('Validation score')
_ = plt.legend()

# Specify the model
model_1 = Sequential()
model_1.add(Dense(10, activation='relu', input_shape=input_shape))
model_1.add(Dense(2, activation='softmax'))

# Compile the model
model_1.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

model_1.summary()

Model: "sequential_12"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
=================================================================
dense_34 (Dense)             (None, 10)                110       
_________________________________________________________________
dense_35 (Dense)             (None, 2)                 22        
=================================================================
Total params: 132
Trainable params: 132
Non-trainable params: 0
_________________________________________________________________

# The input shape to use in the first hidden layer
input_shape = (n_cols,)

# Create the new model: model_2
model_2 = Sequential()

# Add the first, second, and third hidden layers
model_2.add(Dense(10, activation='relu', input_shape=input_shape))
model_2.add(Dense(10, activation='relu'))
model_2.add(Dense(10, activation='relu'))

# Add the output layer
model_2.add(Dense(2, activation='softmax'))

# Compile model_2
model_2.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Fit model 1
model_1_training = model_1.fit(predictors, target, epochs=20, validation_split=0.4, callbacks=[early_stopping_monitor], verbose=False)

# Fit model 2
model_2_training = model_2.fit(predictors, target, epochs=20, validation_split=0.4, callbacks=[early_stopping_monitor], verbose=False)

# Create the plot
plt.plot(model_1_training.history['val_loss'], 'r', label='model_1')
plt.plot(model_2_training.history['val_loss'], 'b', label='model_2')
plt.xlabel('Epochs')
plt.ylabel('Validation score')
_ = plt.legend()

from tensorflow.keras.datasets import mnist

(x_train, y_train), (x_test, y_test) = mnist.load_data()

assert x_train.shape == (60000, 28, 28)
assert x_test.shape == (10000, 28, 28)
assert y_train.shape == (60000,)
assert y_test.shape == (10000,)

X = x_test.reshape((10000, 784))

y = np.zeros((y_test.size, y_test.max() + 1))
y[np.arange(y_test.size), y_test] = 1

y[0]

array([0., 0., 0., 0., 0., 0., 0., 1., 0., 0.])

y_test[0]

7

# Create the model: model
model = Sequential()

# Add the first hidden layer
model.add(Dense(50, activation='relu', input_shape=(784,)))

# Add the second hidden layer
model.add(Dense(50, activation='relu'))

# Add the output layer
model.add(Dense(10, activation='softmax'))

# Compile the model
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Fit the model
model.fit(X, y, epochs=10, validation_split=0.3)

Epoch 1/10
219/219 [==============================] - 1s 3ms/step - loss: 6.9723 - accuracy: 0.6180 - val_loss: 1.7533 - val_accuracy: 0.7673
Epoch 2/10
219/219 [==============================] - 1s 2ms/step - loss: 1.4124 - accuracy: 0.7709 - val_loss: 1.0788 - val_accuracy: 0.8153
Epoch 3/10
219/219 [==============================] - 1s 2ms/step - loss: 0.8167 - accuracy: 0.8190 - val_loss: 0.9107 - val_accuracy: 0.8277
Epoch 4/10
219/219 [==============================] - 1s 2ms/step - loss: 0.5930 - accuracy: 0.8547 - val_loss: 0.8294 - val_accuracy: 0.8377
Epoch 5/10
219/219 [==============================] - 1s 2ms/step - loss: 0.4901 - accuracy: 0.8699 - val_loss: 0.8243 - val_accuracy: 0.8493
Epoch 6/10
219/219 [==============================] - 1s 2ms/step - loss: 0.4056 - accuracy: 0.8911 - val_loss: 0.7467 - val_accuracy: 0.8567
Epoch 7/10
219/219 [==============================] - 1s 2ms/step - loss: 0.3549 - accuracy: 0.9054 - val_loss: 0.5833 - val_accuracy: 0.8727
Epoch 8/10
219/219 [==============================] - 1s 2ms/step - loss: 0.2733 - accuracy: 0.9204 - val_loss: 0.6773 - val_accuracy: 0.8717
Epoch 9/10
219/219 [==============================] - 1s 2ms/step - loss: 0.2872 - accuracy: 0.9203 - val_loss: 0.7157 - val_accuracy: 0.8763
Epoch 10/10
219/219 [==============================] - 1s 2ms/step - loss: 0.2614 - accuracy: 0.9264 - val_loss: 0.6382 - val_accuracy: 0.8947

<tensorflow.python.keras.callbacks.History at 0x1e21f49c850>

	wage_per_hour	union	education_yrs	experience_yrs	age	female	marr	south	manufacturing	construction
0	5.10	0	8	21	35	1	1	0	1	0
1	4.95	0	9	42	57	1	1	0	1	0

	survived	pclass	age	sibsp	parch	fare	male	age_was_missing	embarked_from_cherbourg	embarked_from_queenstown	embarked_from_southampton
0	0	3	22.0	1	0	7.2500	1	False	0	0	1
1	1	1	38.0	1	0	71.2833	0	False	1	0	0

	wage_per_hour	education_yrs	experience_yrs	age	female	marr	manufacturing
0	5.10	8	21	35	1	1	1
1	4.95	9	42	57	1	1	1
2	6.67	12	1	19	0	0	1

	wage_per_hour	union	education_yrs	experience_yrs	age	female	marr	south	manufacturing	construction
count	534.000000	534.000000	534.000000	534.000000	534.000000	534.000000	534.000000	534.000000	534.000000	534.000000
mean	9.024064	0.179775	13.018727	17.822097	36.833333	0.458801	0.655431	0.292135	0.185393	0.044944
std	5.139097	0.384360	2.615373	12.379710	11.726573	0.498767	0.475673	0.455170	0.388981	0.207375
min	1.000000	0.000000	2.000000	0.000000	18.000000	0.000000	0.000000	0.000000	0.000000	0.000000
25%	5.250000	0.000000	12.000000	8.000000	28.000000	0.000000	0.000000	0.000000	0.000000	0.000000
50%	7.780000	0.000000	12.000000	15.000000	35.000000	0.000000	1.000000	0.000000	0.000000	0.000000
75%	11.250000	0.000000	15.000000	26.000000	44.000000	1.000000	1.000000	1.000000	0.000000	0.000000
max	44.500000	1.000000	18.000000	55.000000	64.000000	1.000000	1.000000	1.000000	1.000000	1.000000

shot_clock	dribbles	touch_time	shot_dis	close_def_dis	shot_result
10.8	2	1.9	7.7	1.3	1
3.4	0	0.8	28.2	6.1	0
0	3	2.7	10.1	0.9	0
10.3	2	1.9	17.2	3.4	0

	survived	pclass	age	sibsp	parch	fare	male	age_was_missing	embarked_from_cherbourg	embarked_from_queenstown	embarked_from_southampton
count	891.000000	891.000000	891.000000	891.000000	891.000000	891.000000	891.000000	891.000000	891.000000	891.000000	891.000000
mean	0.383838	2.308642	29.699118	0.523008	0.381594	32.204208	0.647587	0.198653	0.188552	0.086420	0.722783
std	0.486592	0.836071	13.002015	1.102743	0.806057	49.693429	0.477990	0.399210	0.391372	0.281141	0.447876
min	0.000000	1.000000	0.420000	0.000000	0.000000	0.000000	0.000000	0.000000	0.000000	0.000000	0.000000
25%	0.000000	2.000000	22.000000	0.000000	0.000000	7.910400	0.000000	0.000000	0.000000	0.000000	0.000000
50%	0.000000	3.000000	29.699118	0.000000	0.000000	14.454200	1.000000	0.000000	0.000000	0.000000	1.000000
75%	1.000000	3.000000	35.000000	1.000000	0.000000	31.000000	1.000000	0.000000	0.000000	0.000000	1.000000
max	1.000000	3.000000	80.000000	8.000000	6.000000	512.329200	1.000000	1.000000	1.000000	1.000000	1.000000

	0	1	2	3	4	5
0	5	0	0.1	0.2	0.3	0.4
1	4	0	0.0	0.0	0.0	0.0

shot_result		Outcome 0	Outcome 1
1	→	0	1
0	→	1	0
0	→	1	0
0	→	1	0

Course¶

Course Description¶

Imports¶

tf testing¶

Configuration Options¶

Functions¶

Datasets¶

DataFrames¶

hw: Hourly Wages¶

mnist¶

titanic¶

Memory Usage¶

Basics of deep learning and neural networks¶

Introduction to deep learning¶

Comparing neural network models to classical regression models¶

Forward propagation¶

Coding the forward propagation algorithm¶

Activation functions¶

The Rectified Linear Activation Function¶

def relu¶

Applying the network to many observations/rows of data¶

def predict_with_network1¶

Deeper networks¶

Forward propagation in a deeper network¶

Multi-layer neural networks¶

def predict_with_network2¶

Representations are learned¶

Levels of representation¶

Optimizing a neural network with backward propagation¶

The need for optimization¶

Calculating model errors¶

Understanding how weights change model accuracy¶

Coding how weight changes affect accuracy¶

Scaling up to multiple data points¶

Gradient descent¶

Calculating slopes¶

def get_slope¶

Improving model weights¶

Making multiple updates to weights¶

def get_mse¶

Backpropagation¶

The relationship between forward and backward propagation¶

Thinking about backward propagation¶

Backpropagation in practice¶

A round of backpropagation¶

Building deep learning models with keras¶

Creating a keras model¶

Understanding your data¶

Specifying a model¶

Compiling and fitting a model¶

Compiling the model¶

Fitting the model¶

Classification models¶

Understanding your classification data¶

Last steps in classification models¶

Using models¶

Making predictions¶

Fine-tuning keras models¶

Understanding model optimization¶

def get_new_model¶

Diagnosing optimization problems¶

Changing optimization parameters¶

Model validation¶

Evaluating model accuracy on validation dataset¶

Early stopping: Optimizing the optimization¶

Experimenting with wider networks¶

Adding layers to a network¶

Thinking about model capacity¶

Experimenting with model structures¶

Stepping up to images¶

Building your own digit recognition model¶

Final Thoughts¶

Certificate¶

`hw`: Hourly Wages¶

`mnist`¶

`titanic`¶

`def relu`¶

`def predict_with_network1`¶

`def predict_with_network2`¶

`def get_slope`¶

`def get_mse`¶

`def get_new_model`¶