Lecture 8 Notes Export
This commit is contained in:
parent 13087d2a0b
commit 85da8f42aa

BIN  lecture07/notes_07.pdf  (new file; binary file not shown)
195  lecture07/notes_07.py   (new file)

@@ -0,0 +1,195 @@
# %% [markdown]
# # Previous Class Definitions
# The previously defined Layer_Dense, Activation_ReLU, and Activation_Softmax classes are reproduced below.

# %%
# Imports
import numpy as np
import nnfs
from nnfs.datasets import spiral_data

nnfs.init()

# %%
class Layer_Dense:
    def __init__(self, n_inputs, n_neurons):
        # Initialize the weights and biases
        self.weights = 0.01 * np.random.randn(n_inputs, n_neurons)  # Small weights drawn from a normal distribution
        self.biases = np.zeros((1, n_neurons))

    def forward(self, inputs):
        # Calculate the output values from inputs, weights, and biases
        self.output = np.dot(inputs, self.weights) + self.biases  # Weights are stored as (n_inputs, n_neurons), so no transpose is needed


class Activation_ReLU:
    def forward(self, inputs):
        self.output = np.maximum(0, inputs)


class Activation_Softmax:
    def forward(self, inputs):
        # Get the unnormalized probabilities
        # Subtract each row's max to prevent overflow from large exponentials
        exp_values = np.exp(inputs - np.max(inputs, axis=1, keepdims=True))

        # Normalize the probabilities with element-wise division
        probabilities = exp_values / np.sum(exp_values, axis=1, keepdims=True)
        self.output = probabilities

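# %% [markdown]
# (Added sketch, not from the lecture) A quick check of the max-subtraction trick: softmax is
# shift-invariant, so subtracting the row max does not change the result while keeping np.exp
# from overflowing. The softmax_check name below is illustrative only.

# %%
softmax_check = Activation_Softmax()
softmax_check.forward(np.array([[1.0, 2.0, 3.0],
                                [1000.0, 1001.0, 1002.0]]))
print(softmax_check.output)  # both rows give the same distribution, with no overflow warning
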
# %% [markdown]
# # Forward Pass with No Loss Consideration
# A 2-input neural network with two layers of 3 neurons each: ReLU activation in the first layer and Softmax in the second layer to normalize the outputs.

# %%
# Create dataset
X, y = spiral_data(samples=100, classes=3)

# Create Dense layer with 2 input features and 3 output values
dense1 = Layer_Dense(2, 3)

# Create ReLU activation (to be used with Dense layer):
activation1 = Activation_ReLU()

# Create second Dense layer with 3 input features (as we take the output
# of the previous layer here) and 3 output values
dense2 = Layer_Dense(3, 3)

# Create Softmax activation (to be used with Dense layer):
activation2 = Activation_Softmax()

# Make a forward pass of our training data through the first layer
dense1.forward(X)

# Make a forward pass through the activation function;
# it takes the output of the first dense layer here
activation1.forward(dense1.output)

# Make a forward pass through the second Dense layer;
# it takes the outputs of the first layer's activation function as inputs
dense2.forward(activation1.output)

# Make a forward pass through the activation function;
# it takes the output of the second dense layer here
activation2.forward(dense2.output)

# Let's see the output of the first few samples:
print(activation2.output[:5])

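# %% [markdown]
# (Added sanity check, not from the lecture) With freshly initialized small random weights, the
# network has no preference for any class yet, so the softmax rows printed above should be roughly
# uniform (about 0.33 per class), and each row should sum to 1.

# %%
print(activation2.output.shape)                # (300, 3): 100 samples per class, 3 classes
print(np.sum(activation2.output, axis=1)[:5])  # each softmax row sums to 1
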
# %% [markdown]
# # Calculating Network Error with Categorical Cross-Entropy Loss
# loss = negative sum of the expected output * log(neural network output)
#
# loss = -sum(expected_i * log(nn_output_i)) for all i in the outputs
#
# In the classification case, incorrect outputs end up not mattering, because expected_i is 0 for every wrong class: only the log of the confidence assigned to the correct class survives the sum.
#

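# %% [markdown]
# (Added worked example, not from the lecture) For a predicted distribution of [0.7, 0.1, 0.2] with
# true class 0, the one-hot target is [1, 0, 0], so
# loss = -(1*log(0.7) + 0*log(0.1) + 0*log(0.2)) = -log(0.7) ≈ 0.357,
# which matches the first entry computed in the next cell.
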
# %%
nn_outputs = np.array([
    [0.7, 0.1, 0.2],
    [0.1, 0.5, 0.4],
    [0.02, 0.9, 0.08]])
class_targets = [0, 1, 1]

# Index each row by its target class, then take the negative log of those confidences
losses = -np.log(nn_outputs[range(len(nn_outputs)), class_targets])
print(f"Losses: {losses}")
print(f"Average Loss: {np.average(losses)}")

# %% [markdown]
# ## Loss with One-Hot Encoding
# Classification typically expects the output to be all zeros except for the class the inputs belong to. This simplifies the cross-entropy loss calculation.

# %%
true_output = np.array([
    [1, 0, 0],
    [0, 1, 0],
    [0, 1, 0]
])

nn_output = np.array([
    [0.7, 0.2, 0.1],
    [0.1, 0.5, 0.4],
    [0.02, 0.9, 0.08]
])

# Element-by-element multiplication "erases" the output terms whose expected value is 0
A = true_output * nn_output

# Sum along each row (axis=1), i.e. every element in row 0, then row 1, etc., because each row is one sample's output
B = np.sum(A, axis=1)

# Get the cross-entropy loss
C = -np.log(B)

print(f"Losses: {C}")
print(f"Average Loss: {np.mean(C)}")

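# %% [markdown]
# (Added note, not from the lecture) Both approaches pick out the same confidences for the correct
# classes (0.7, 0.5, and 0.9), so these losses match the ones computed with integer class targets above.
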
# %% [markdown]
# ## Implementing the Loss Class

# %%
# Base class for Loss functions
class Loss:
    '''Calculates the data and regularization losses given
    model output and ground truth values'''

    def calculate(self, output, y):
        # Average the per-sample losses returned by the subclass's forward()
        sample_losses = self.forward(output, y)
        data_loss = np.average(sample_losses)
        return data_loss

# %% [markdown]
# ## Implementing the Categorical Cross-Entropy Loss Class

# %%
class Loss_CategoricalCrossEntropy(Loss):
    def forward(self, y_pred, y_true):
        '''y_pred is the neural network output;
        y_true is the ideal output of the neural network'''
        samples = len(y_pred)

        # Clip the predicted values away from 0 and 1 so log() never sees exactly 0
        y_pred_clipped = np.clip(y_pred, 1e-7, 1 - 1e-7)

        if len(y_true.shape) == 1:    # Categorically labeled (sparse integer targets)
            correct_confidences = y_pred_clipped[range(samples), y_true]
        elif len(y_true.shape) == 2:  # One-hot encoded targets
            correct_confidences = np.sum(y_pred_clipped * y_true, axis=1)

        # Calculate the losses
        negative_log_likelihoods = -np.log(correct_confidences)
        return negative_log_likelihoods

# %%
nn_outputs = np.array([
    [0.7, 0.1, 0.2],
    [0.1, 0.5, 0.4],
    [0.02, 0.9, 0.08]])
class_targets = np.array([
    [1, 0, 0],
    [0, 1, 0],
    [0, 1, 0]])

loss_function = Loss_CategoricalCrossEntropy()

# calculate() already averages the per-sample losses, so it returns a single number
average_loss = loss_function.calculate(nn_outputs, class_targets)
print(f"Average Loss: {average_loss}")

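# %% [markdown]
# (Added sketch, not from the lecture) Sparse integer targets exercise the other branch of forward()
# and should give the same average loss as the one-hot targets above. The sparse_targets name is
# illustrative only.

# %%
sparse_targets = np.array([0, 1, 1])
print(f"Average Loss (sparse targets): {loss_function.calculate(nn_outputs, sparse_targets)}")
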
# %% [markdown]
# # Introducing Accuracy
# In this simple measure, if the highest value in a sample's output aligns with the correct classification, that sample's accuracy is 1. Even at 51% red and 49% blue, with red as the true class, the prediction is considered fully accurate.

# %%
nn_outputs = np.array([
    [0.7, 0.1, 0.2],
    [0.1, 0.5, 0.4],
    [0.02, 0.9, 0.08]])
class_targets = np.array([
    [1, 0, 0],
    [0, 1, 0],
    [0, 1, 0]])

# Calculate the loss (calculate() returns the average over the batch)
loss_function = Loss_CategoricalCrossEntropy()
average_loss = loss_function.calculate(nn_outputs, class_targets)
print(f"Average Loss: {average_loss}")

# Calculate the accuracy
predictions = np.argmax(nn_outputs, axis=1)
# If targets are one-hot encoded, convert them to class indices
if len(class_targets.shape) == 2:
    class_targets = np.argmax(class_targets, axis=1)
# True evaluates to 1; False to 0
accuracy = np.mean(predictions == class_targets)
print(f"Accuracy: {accuracy}")

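# %% [markdown]
# (Added sketch, not from the lecture) The same accuracy measure applied to the untrained network's
# output on the spiral data from the forward-pass section. y from spiral_data is already a vector of
# integer labels, so no argmax conversion of the targets is needed; with random initial weights the
# accuracy should hover around chance (about 1/3).

# %%
spiral_predictions = np.argmax(activation2.output, axis=1)
print(f"Untrained accuracy on spiral data: {np.mean(spiral_predictions == y)}")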