Othello GPT Notes

By: Ivan Vega with LLM support

Written entirely by Ivan Vega, with conversations and explanations supported by LLMs (ChatGPT-5, Claude, Gemini)

In [1]:
# libraries

import numpy as np
import torch
import torch.nn as nn
from scipy import stats
import matplotlib.pyplot as plt
%matplotlib inline

# Setting random seeds for reproducibility
np.random.seed(42)
torch.manual_seed(42)
Out[1]:
<torch._C.Generator at 0x7bdf17843e30>

Step 1: Understanding an Affine Transformation

First let's try to understand what an affine transformation is. I might be wrong, but the basic idea is that it is a linear transformation (map) with a shift. A simple example is: $$ f(x) = Wx + b $$ In this case the linear transformation of the input $x$ is performed by the weight matrix $W$ and the shift is done by the bias vector $b$.

While trying to understand the difference between linear and affine, a key point from talking with an LLM is that a linear transformation must satisfy two properties for any vectors $x$ and $y$ and any scalar $c$:

  • Additivity: $f(x + y) = f(x) + f(y)$
  • Homogeneity: $f(cx) = cf(x)$

A simple perceptron of the form $f(x) = Wx + b$ breaks the homogeneity rule, because it no longer maps the zero vector to the zero vector: $f(0) = b \neq 0$ instead of $f(0) = 0$.

In a way, the linear transformation scales, rotates, and shears, while the translation is done by the bias.
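To convince myself of these two rules, here is a quick check (my own sketch, not one of the notebook cells): with a nonzero bias $b$, the map $f(x) = Wx + b$ fails them.

# Quick check: an affine map with a nonzero bias is not a linear map
import torch
torch.manual_seed(0)
W = torch.rand(3, 3)
b = torch.rand(3)
f = lambda v: W @ v + b
x, y = torch.rand(3), torch.rand(3)
print(f(torch.zeros(3)))                      # equals b, not the zero vector
print(torch.allclose(f(x + y), f(x) + f(y)))  # False: additivity breaks
print(torch.allclose(f(2 * x), 2 * f(x)))     # False: homogeneity breaks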

Let's look at an example:

In [2]:
# Example of Affine Transformation
R = 3 # input dimension
D = 3 # output dimension
x = torch.rand(R) # create a random vector
W = torch.rand(D,R) # Weight matrix (output dim, input dim)
b = torch.rand(D) # Create random bias vector
h = W@x + b # Affine transformation

# print(f'input vector: {x}')
# print(f'weight matrix: {W}')
# print(f'weight bias vector: {b}')
# print(f'affine transformed vector:{h}')

# Transforming vectors to numpy format
x_np = x.numpy()
h_np = h.numpy()
print('***Visualization***')
print(f'numpy x:{x_np} and numpy h:{h_np}')

# Create the plot and plot the two points
from mpl_toolkits.mplot3d import Axes3D
fig = plt.figure()
ax = fig.add_subplot(111,projection='3d')
v1 = ax.scatter(x_np[0],x_np[1],x_np[2],color="blue",label="Input Vector x")
v2 = ax.scatter(h_np[0],h_np[1],h_np[2], color="red",label="Output Vector h")

# Add labels and legend
ax.set_xlabel('X axis')
ax.set_ylabel('Y axis')
ax.set_zlabel('Z axis')
ax.legend()
ax.set_title('Affine Transformation')

# Add arrows from the origin to each point
ax.plot([0, x_np[0]], [0, x_np[1]], [0, x_np[2]],
          color='blue', linewidth=2, alpha=0.7, linestyle='--')
ax.plot([0, h_np[0]], [0, h_np[1]], [0, h_np[2]],
          color='red', linewidth=2, alpha=0.7, linestyle='--')

plt.show()
***Visualization***
numpy x:[0.88226926 0.91500396 0.38286376] and numpy h:[2.303093  1.8804536 1.941021 ]

Step 2: Understanding nonlinearity

There is a great blog post written by Stephen Wolfram on how ChatGPT works, and it has a great explanation of non-linearity. The gist of it is to imagine a basic classification example. First let's consider an xy-plane where there are four sets of points with different characteristics, each described by a variable x and a variable y. If we plot these items in the xy-plane we could see something like the plot produced by the code cell below:


Now we want to find a way to classify any input (x,y) and figure out which cluster it is closest to in 2D space. Here is where you can see why a linear prediction model would not yield promising results. If we use a simple linear model $y = Wx + b$, it will fail to classify the input (x,y) into the four different clusters correctly, because it divides the (x,y) plane into two sub-spaces through one hyperplane, or in this case a single-line decision boundary, as shown in the plot below:


In this example the decision boundary will be the simple line $y = x$, which will be able to correctly separate the $[blue, red]$ pair of clusters but will fail to separate $[orange, green]$. This is the reason why we opt for a non-linear model through an activation function (ReLU is the best-known example), so that the network can partition the xy-plane into many regions.

In [3]:
#Create an xy plane without any plots
from matplotlib import pyplot as plt
fig, ax = plt.subplots(figsize=(5,4))
ax.axis((0,10,0,10))
ax.set_xlabel('X axis')
ax.set_ylabel('Y axis')
ax.set_title('Clustering example')


# Cluster of dots
def sample_cluster(center_xy, n=10, spread=0.3):
    """
    center_xy: (x,y) tuple for the cluster center
    n: number of points to be created
    spread: how tight the cluster is
    """
    cx,cy = center_xy
    pts = np.column_stack([
        np.random.normal(cx, spread, n),
        np.random.normal(cy, spread, n)
    ])
    return pts

# Choose the centers of the clusters
centers = [
    (2,8), # top left
    (8,8), # top right
    (2,2), # bottom left
    (8,2)  # bottom right
]

for c in centers:
    vectors = sample_cluster(c,n=10,spread=0.3)
    ax.scatter(vectors[:,0],vectors[:,1], s=30)

# Adding a trend line (decision boundary)

x_line = np.linspace(0,10,5)
y_line = x_line.copy()
ax.plot(x_line,y_line,'--',color='red', linewidth=2,label="Decision Boundary")

ax.legend()
plt.show()

Step 3: Implementing ReLU

Now let's learn about ReLU by implementing it. Without ReLU, creating multiple layers of networks would be pointless, as all of the layers would collapse into one overarching affine (or linear) transformation. This can be observed mathematically as follows:

Assume you have two neural network layers: $$(1)\hspace{0.1cm} z = W_{1}\textbf{x} + b_{1}$$
$$(2)\hspace{0.1cm} y = W_{2}\textbf{z} + b_{2}$$

Then the two formulas collapse into one affine transformation: $$y = W_{2}(W_{1}\textbf{x} + b_{1}) + b_{2} = (W_{2}W_{1})\textbf{x} + (W_{2}b_{1}+b_{2})$$
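As a quick numeric sanity check (my own sketch, not one of the original cells), we can verify that stacking two affine layers really does collapse into a single affine map:

# Verify numerically that two stacked affine layers collapse into one affine map
import numpy as np
rng = np.random.default_rng(0)
x = rng.random(3)
W1, b1 = rng.random((4, 3)), rng.random(4)
W2, b2 = rng.random((2, 4)), rng.random(2)
two_layers = W2 @ (W1 @ x + b1) + b2
one_layer = (W2 @ W1) @ x + (W2 @ b1 + b2)
print(np.allclose(two_layers, one_layer))  # True: the same affine transformation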

So to make this all work we need to add an activation function, ReLU, to introduce nonlinearity. In this case the activation formula is:

$$f(x) = \max(0, x) = \begin{cases} 0 & \text{for } x < 0 \\ x & \text{for } x \ge 0 \end{cases}$$

Let's build it from scratch to learn the intuition and then compare it with the PyTorch code later on.

In [4]:
# ReLU that works on both single values and arrays (vectors)

def relu_manual(x):
    """
    Implements ReLU: f(x) = max(0, x)
    Works for both single values and numpy arrays
    """
    # Handling scalar inputs
    if np.isscalar(x):
        return np.maximum(0,x)


    r_x = []
    for i in x:
        a = np.maximum(0,i)
        r_x.append(a)
    return np.array(r_x)

# Test on single values
test_values = [-2, -1, 0, 1, 2]
one_value = 56
print(f"ReLU({test_values}) = {relu_manual(test_values)}")
print(f"ReLU({one_value}) = {relu_manual(one_value)}")

# Lets create a scatter plot with the ReLU function

from matplotlib import pyplot as plt
fig, ax = plt.subplots(figsize=(5,4))
ax.axis((-10,10,-10,10))
ax.set_xlabel('X axis')
ax.set_ylabel('Y axis')
ax.set_title('ReLU function visualization')


# Add nice gridlines
ax.grid(True, linestyle='--', linewidth=0.5, alpha=0.3, color='gray')
ax.set_axisbelow(True)  # Put grid behind the plot

# ReLU values
x_values = np.linspace(-10,10,100)
y_values = relu_manual(x_values)
ax.plot(x_values,y_values,"-",color="blue",linewidth=1,label="ReLU")
ReLU([-2, -1, 0, 1, 2]) = [0 0 0 1 2]
ReLU(56) = 56
Out[4]:
[<matplotlib.lines.Line2D at 0x7bde328afef0>]
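As promised above, here is a quick comparison with PyTorch's built-in ReLU (a minimal sketch of my own, reusing the relu_manual function defined above):

# Compare the manual ReLU against PyTorch's built-in versions
import torch
import torch.nn as nn

t = torch.tensor([-2.0, -1.0, 0.0, 1.0, 2.0])
print(torch.relu(t))           # functional form: tensor([0., 0., 0., 1., 2.])
print(nn.ReLU()(t))            # module form, same result
print(relu_manual(t.numpy()))  # matches the from-scratch implementation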

Step 5: Building a Neural Network Layer

Now let's combine what we've learned about affine transformations and ReLU to create a simple neural network layer. A layer performs:

  1. Affine transformation: $h = Wx + b$
  2. Activation: $output = ReLU(h)$

This is the fundamental building block of neural networks.
In [8]:
# Building a Neural Network from scratch

class SimpleLayer:
  """
  A simple neural network layer with affine transformation and ReLU activation
  """
  def __init__(self, input_dim, output_dim):
    """
    Initialize the layer with random weights and biases
    input_dim: Number of input features/neurons feeding into this layer
    output_dim: Number of output neurons this layer will produce
    """
    # Initialize weights and biases with small random numbers
    # W here is created one row per output neuron (perceptron) --> SUPER IMPORTANT
    self.W = np.random.rand(output_dim, input_dim) * 0.1
    self.b = np.random.rand(output_dim) * 0.1

  def forward(self, x):
    """
    Forward pass through the neural network layer
    x: input vector (numpy array)
    returns: activated output
    """
    print(f"W:{self.W}")
    print(f"b:{self.b}")
    t = np.dot(self.W, x) + self.b # Perform transformation
    if np.isscalar(t):
        return np.maximum(0,t)
    r_t = []
    for i in t:
        a = np.maximum(0,i)
        r_t.append(a)
    return np.array(r_t)

# Test the layer
np.random.seed(42)
layer1 = SimpleLayer(input_dim=3, output_dim=4)
test_input = np.array([1.0,-0.5,2.0])
output = layer1.forward(test_input)
print(f"Input shape: {test_input.shape}")
print(f"Input values: {test_input}")
print(f"Output shape: {output.shape}")
print(f"Output values: {output}")
W:[[0.03745401 0.09507143 0.07319939]
 [0.05986585 0.01560186 0.01559945]
 [0.00580836 0.08661761 0.0601115 ]
 [0.07080726 0.00205845 0.09699099]]
b:[0.08324426 0.02123391 0.0181825  0.01834045]
Input shape: (3,)
Input values: [ 1.  -0.5  2. ]
Output shape: (4,)
Output values: [0.21956135 0.10449773 0.10090505 0.28210045]
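For comparison, here is a minimal sketch (my own, not part of the original cells) of the same 3-input, 4-output layer built with PyTorch modules. The weights come from PyTorch's own random initialization, so the numbers will differ from SimpleLayer above.

# The same affine + ReLU layer using PyTorch building blocks
import torch
import torch.nn as nn

torch_layer = nn.Sequential(
    nn.Linear(3, 4),  # affine transformation: h = Wx + b
    nn.ReLU()         # nonlinearity
)
x = torch.tensor([1.0, -0.5, 2.0])
print(torch_layer(x))  # output vector of shape (4,)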

Step 6: Building my first neuron from scratch

Above we have started working on some of the key components of a neural network, in this case the forward pass: building the perceptron with its weights, biases, and the ReLU activation.

Now let's go one more step and add two more features:

  1. Backward pass (a sketch of it follows after the cell below)
  2. Loss calculation
In [15]:
class Neuron:

  """
  Forward pass
  Backward pass (Backpropagation)
  Loss function
  """
  def __init__(self, input_dim):
    # initialize weights and bias with small random values
    self.W = np.random.randn(input_dim) * 0.1
    self.b = 0.0

    # Store values for backward pass
    self.last_input = None
    self.last_z = None # pre-activation value
    self.last_output = None

  def forward(self, x):
    """Compute output for input x"""
    # Store for backward pass
    self.last_input = x

    # Affine transformation
    z = np.dot(self.W,x) + self.b
    self.last_z = z

    # Activation: in this case a sigmoid (both branches of np.where are written
    # out, aiming at numerical stability for large |z|)
    h = np.where(z >= 0, 1/(1+np.exp(-z)), np.exp(z)/(1+np.exp(z)))
    self.last_output = h
    return self.last_output

  def compute_loss(self, y_true):
    """ Compute squared error loss """
    if self.last_output is None:
      raise ValueError("Must call forward() first")

    # Simple squared error: (prediction - target)^2
    loss = 0.5 * np.square(self.last_output - y_true)
    return loss

# Test the neuron
neuron = Neuron(input_dim=2)
test_x = np.array([1.0, -0.5])

# Inspect the initialized parameters (the forward pass and loss are exercised below)
print(f"Neuron created with weights:{neuron.W}")
Neuron created with weights:[-0.17249178 -0.05622875]
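The class above stops at the loss, so here is a minimal sketch of the missing backward pass (my own addition, derived with the chain rule for the squared-error loss through the sigmoid): $$\frac{\partial L}{\partial z} = (h - y)\,h\,(1-h), \qquad \frac{\partial L}{\partial W} = \frac{\partial L}{\partial z}\,x, \qquad \frac{\partial L}{\partial b} = \frac{\partial L}{\partial z}$$

# A standalone backward pass / gradient-descent step for the Neuron above
def backward(neuron, y_true, lr=0.1):
    h = neuron.last_output
    x = neuron.last_input
    dL_dz = (h - y_true) * h * (1 - h)  # chain rule: loss -> sigmoid -> pre-activation
    neuron.W -= lr * dL_dz * x          # gradient step on the weights
    neuron.b -= lr * dL_dz              # gradient step on the bias

# Example usage: one training step should reduce the loss
neuron.forward(test_x)
print(f"Loss before: {neuron.compute_loss(1.0)}")
backward(neuron, 1.0)
neuron.forward(test_x)
print(f"Loss after:  {neuron.compute_loss(1.0)}")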