Things we'll cover in today's lecture:
- Revisit computation graphs
- Assorted matrix operations
Motivation¶
What are we hoping to learn?
Let's think of a convolutional neural network like those we see in the literature. We input an image and get out the probability that the image belongs to one of several classes:

Of course, there is a ground truth that we need to compare against. The model seems off?

The output layer needs to be corrected according to the model's error.

This means the prior layer should also be adjusted according to the error in the output layer.

And so we keep adjusting backward, layer by layer.

How computation graphs work (in PyTorch)¶
Let's reconsider the simple network we talked about in the last lecture.
Remember we had a multi-function network:

Where the functions above are defined as follows:
$g(x) = x^2+1$, $h(g) = \log(g)$, $k(h) = \sin(h)$. Thus, $f(x) = k(h(g(x)))$
The resulting function is: $$f(x) = \sin(\log(x^2+1))$$
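Before handing this to PyTorch, we can differentiate $f$ by hand with the chain rule; this is exactly the expression computed as the manual gradient in the code below:
$$f'(x) = k'(h)\,h'(g)\,g'(x) = \cos(h)\cdot\frac{1}{g}\cdot 2x = \frac{2x\cos(\log(x^2+1))}{x^2+1}$$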
import torch
# Function to compute y = sin(log(x^2 + 1))
def func(x):
    g = x**2 + 1
    h = torch.log(g)
    k = torch.sin(h)
    return k
    # equivalently: return torch.sin(torch.log(x**2 + 1))
# Set up the initial guess for x (starting point for optimization)
x = torch.tensor([1.0], requires_grad=True) # x is a scalar, requires gradients
# Use an optimizer to minimize the difference between y and 0
optimizer = torch.optim.Adam([x], lr=0.1)
# Number of iterations for optimization
num_iterations = 10
for i in range(num_iterations):
    # Zero the gradients from the previous step
    optimizer.zero_grad()
    # Compute the function value
    y = func(x)
    print(x)
    # Squared error between y and 0 (computed for reference; we backpropagate through y directly below)
    loss = y**2
    # Manually computed gradient of y with respect to x, for comparison with autograd
    manual = 2*x*torch.cos(torch.log(x**2+1))/(x**2+1)
    # Perform backward propagation to compute the gradients
    y.backward()
    # Print the current value of x, y, and both gradients at every iteration
    if i % 1 == 0:
        print(f"Iteration {i}, x: {x.item():.4f}, y: {y.item():.6f}, Auto Gradient of x: {x.grad.item():.6f}, Manual Gradient of x: {manual.item():.6f}")
    # Update the value of x using the optimizer
    optimizer.step()
# Final value of x where y should be approximately 0
print(f"Final value of x: {x.item():.4f}")
tensor([1.], requires_grad=True)
Iteration 0, x: 1.0000, y: 0.638961, Auto Gradient of x: 0.769239, Manual Gradient of x: 0.769239
tensor([0.9000], requires_grad=True)
Iteration 1, x: 0.9000, y: 0.559122, Auto Gradient of x: 0.824505, Manual Gradient of x: 0.824505
tensor([0.7999], requires_grad=True)
Iteration 2, x: 0.7999, y: 0.474661, Auto Gradient of x: 0.858673, Manual Gradient of x: 0.858673
tensor([0.6996], requires_grad=True)
Iteration 3, x: 0.6996, y: 0.387947, Auto Gradient of x: 0.865841, Manual Gradient of x: 0.865841
tensor([0.5992], requires_grad=True)
Iteration 4, x: 0.5992, y: 0.301997, Auto Gradient of x: 0.840632, Manual Gradient of x: 0.840632
tensor([0.4989], requires_grad=True)
Iteration 5, x: 0.4989, y: 0.220408, Auto Gradient of x: 0.779257, Manual Gradient of x: 0.779257
tensor([0.3989], requires_grad=True)
Iteration 6, x: 0.3989, y: 0.147134, Auto Gradient of x: 0.680803, Manual Gradient of x: 0.680803
tensor([0.3000], requires_grad=True)
Iteration 7, x: 0.3000, y: 0.086076, Auto Gradient of x: 0.548428, Manual Gradient of x: 0.548428
tensor([0.2032], requires_grad=True)
Iteration 8, x: 0.2032, y: 0.040449, Auto Gradient of x: 0.389961, Manual Gradient of x: 0.389961
tensor([0.1100], requires_grad=True)
Iteration 9, x: 0.1100, y: 0.012033, Auto Gradient of x: 0.217409, Manual Gradient of x: 0.217409
Final value of x: 0.0226
So the major question is how does the computer keep track of the gradient calculation?
Through computation graphs! But how does PyTorch create computation graphs? Let's go through the prior example:
Starting off with x, we need to tell PyTorch to create a new computation graph. We do this by turning on the requires_grad option of the tensor:
x = torch.tensor([1.0], requires_grad=True)
x
tensor([1.], requires_grad=True)

Under the hood, what's happening is that the requires_grad option allocates an AutogradMeta object that stores the graph information. The graph stores derivative functions and values.
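We can check this directly (a minimal sanity check; these are standard tensor attributes). A freshly created leaf tensor requires a gradient but has no backward function of its own yet:
print(x.requires_grad)   # True: autograd will record operations involving x
print(x.is_leaf)         # True: x was created by the user, not produced by an operation
print(x.grad_fn)         # None: leaf tensors have no backward function of their own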
Next we define the next step in our composite function, g(x). The resulting tensor has a pointer to a field called grad_fn, which is the function that will be used to calculate the backward gradient.
g1 = x**2
print(g1)
g = g1+1
print(g)
tensor([1.], grad_fn=<PowBackward0>)
tensor([2.], grad_fn=<AddBackward0>)

Notice that even though g(x) is defined in one line, it contains two backward functions. A backward function is inserted into the graph whenever a new operation is performed on a tensor with a gradient activation flag.
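We can also peek at how these backward functions are chained together. Each grad_fn holds references to the grad_fns of its inputs in a field called next_functions (this is an internal detail, so the exact printout may vary between PyTorch versions):
print(g.grad_fn)                  # AddBackward0, from g = g1 + 1
print(g.grad_fn.next_functions)   # contains a reference to PowBackward0, from g1 = x**2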
PyTorch has a file called tools/autograd/derivatives.yaml that stores the derivatives of many (most?) functions you will see (you can also manually define a custom function and its derivative yourself!).
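If an operation you need is not covered, or you want your own derivative rule, you can subclass torch.autograd.Function and supply both passes yourself. A minimal sketch, reimplementing the log step from our example (the class and variable names are ours, not part of the lecture code):
import torch

class MyLog(torch.autograd.Function):
    @staticmethod
    def forward(ctx, inp):
        # Stash the input so the backward pass can reuse it
        ctx.save_for_backward(inp)
        return torch.log(inp)

    @staticmethod
    def backward(ctx, grad_output):
        # d/dx log(x) = 1/x, multiplied by the incoming gradient (chain rule)
        (inp,) = ctx.saved_tensors
        return grad_output / inp

t = torch.tensor([1.0], requires_grad=True)
out = MyLog.apply(t**2 + 1)   # behaves like torch.log, but with our own backward rule
out.backward()
print(t.grad)                 # 2t/(t^2+1) = 1.0 at t = 1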
Next we want to define the log function:
h = torch.log(g)
print(h)
tensor([0.6931], grad_fn=<LogBackward0>)

Finally we define the sin function:
k = torch.sin(h)
print(k)
tensor([0.6390], grad_fn=<SinBackward0>)
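Having built the graph forward, a single call to backward walks it in reverse and deposits the result in x.grad. The value should match the automatic and manual gradients printed at iteration 0 of the optimization loop above (about 0.7692 at x = 1):
k.backward()
print(x.grad)   # ~0.7692, i.e. 2x*cos(log(x^2+1))/(x^2+1) evaluated at x = 1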

As mentioned earlier, we can view the network using the tensorboard utility.
import torch
from torch.utils.tensorboard import SummaryWriter

writer = SummaryWriter('runs/experiment_2')

class OurNet(torch.nn.Module):
    def __init__(self):
        super(OurNet, self).__init__()

    def forward(self, x):
        g1 = x**2
        g = g1 + 1
        h = torch.log(g)
        k = torch.sin(h)
        return k

graph = OurNet()
writer.add_graph(graph, torch.randn((1)))
writer.close()
### use the tensorboard --logdir=runs command to view
Live tensorboard demo
So now that we understand computation graphs, how do we get from:

to:

Linear Algebra for Machine Learning¶
Linear algebra is a core mathematical foundation of machine learning, especially deep learning.
Scalar, vector, matrix and tensor (Review)¶
- Scalar - a single number
- Vector - 1-D list of numbers
- Matrix - 2-D list of numbers
- Tensor - N-D list of numbers
- We refer to anything with three or more dimensions as a tensor rather than a matrix (see the short example below).
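As a quick illustration (a minimal sketch; the particular values are arbitrary), each of these corresponds to a PyTorch tensor of increasing dimensionality:
import torch
scalar = torch.tensor(3.14)                   # 0-D: a single number
vector = torch.tensor([1., 2., 3.])           # 1-D: a list of numbers
matrix = torch.tensor([[1., 2.], [3., 4.]])   # 2-D: a grid of numbers
tensor3d = torch.zeros(2, 3, 4)               # 3-D and beyond we simply call a tensor
print(scalar.ndim, vector.ndim, matrix.ndim, tensor3d.ndim)   # 0 1 2 3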
Matrix Transpose¶
The transpose of a matrix is found by switching its rows with its columns. The transpose of the matrix can be thought of as a mirror image across the main diagonal.
$A=\left[\begin{matrix}a_{11} & a_{12} & \ldots & a_{1n}\\
a_{21} & a_{22} & \ldots & a_{2n}\\
\vdots & \vdots & \ddots & \vdots\\
a_{m1} & a_{m2} & \ldots & a_{mn}
\end{matrix}\right]$
__Transpose matrix:__ $A^{T}=\left[\begin{matrix}a_{11} & a_{21} & \ldots & a_{m1}\\
a_{12} & a_{22} & \ldots & a_{m2}\\
\vdots & \vdots & \ddots & \vdots\\
a_{1n} & a_{2n} & \ldots & a_{mn}
\end{matrix}\right]$
- In PyTorch you can transpose a matrix in two ways: torch.t() or torch.transpose()
import torch
a = torch.tensor([
[1, 2, 3],
[1, 2, 3]
])
transpose_a = torch.t(a)
print("Transpose matrix of a is",transpose_a)
Transpose matrix of a is tensor([[1, 1], [2, 2], [3, 3]])
transpose_a = torch.transpose(a,0,1)
print("Transpose matrix of a is",transpose_a)
Transpose matrix of a is tensor([[1, 1], [2, 2], [3, 3]])
Inner (dot) product of two vectors¶
- The inner product takes two vectors of equal size and returns a single number (scalar). This is calculated by multiplying the corresponding elements in each vector and adding up all of those products.
- For example: $\left[\begin{array}{c} 1\\ 2\\ 3 \end{array}\right]\cdot\left[\begin{array}{c} 4\\ 5\\ 6 \end{array}\right]=1\times4+2\times5+3\times6=32$
- In PyTorch we use torch.dot() to calculate the inner product of two vectors of the same size.
import torch
a = torch.tensor([1, 2, 3])
b = torch.tensor([4, 5, 6])
ab= torch.dot(a, b)
print (a)
print (b)
print ("Inner product of a and b is",ab)
tensor([1, 2, 3]) tensor([4, 5, 6]) Inner product of a and b is tensor(32)
- This operation is also commutative: $\boldsymbol{a}\cdot\boldsymbol{b}=\boldsymbol{b}\cdot\boldsymbol{a}$
ba= torch.dot(b, a)
print ("Inner product of b and a is",ba)
Inner product of b and a is tensor(32)
# What happens if the vectors are not the same size?
a = torch.tensor([1, 2])
c = torch.tensor([3, 2, 1])
ac = torch.dot(a, c)   # this raises a RuntimeError because the sizes differ
print ("Inner product of a and c is", ac)
Matrix-Vector dot product¶
Multiplication between a matrix $A$ and vector $x$ is given as:
$Ax = \left[ \begin{matrix} a_{11} & a_{12} & \ldots & a_{1n} \\ a_{21} & a_{22} & \ldots & a_{2n} \\ \vdots & \vdots & \ddots & \vdots \\ a_{m1} & a_{m2} & \ldots & a_{mn} \end{matrix} \right] \left[ \begin{matrix} x_{1} \\ x_{2} \\ \vdots \\ x_{n} \end{matrix} \right] = \left[ \begin{matrix} a_{11} x_{1} + a_{12} x_{2} + \ldots + a_{1n} x_{n} \\ a_{21} x_{1} + a_{22} x_{2} + \ldots + a_{2n} x_{n} \\ \vdots \\ a_{m1} x_{1} + a_{m2} x_{2} + \ldots + a_{mn} x_{n} \end{matrix} \right]$
This operation takes an $m \times n$ 2D tensor (matrix) and a 1D tensor (vector) of size $n$; the result is a 1D tensor (vector) of size $m$.
In PyTorch we use torch.mv() to calculate the dot product of a 2D matrix and a vector.
import torch
a = torch.randn(2, 3)
b = torch.randn(3)
print(a)
print(b)
c = torch.mv(a,b)
print("Matrix-vector dot product is",c)
tensor([[-1.0917, 0.6832, 1.5545],
        [-1.0927, 0.6571, 0.5402]])
tensor([-0.2527, -0.5882, -2.8065])
Matrix-vector dot product is tensor([-4.4887, -1.6265])
d = a@b
print("Matrix multiplication is", d)
Matrix multiplication is tensor([-4.4887, -1.6265])
Wait a minute: if torch.mm (or the @ operator) and torch.mv can both compute this product, why does torch.mv even exist?
Speed
import torch
import time
# Define the size of the matrix and vector
m, n = 1000, 1000
# Create a random matrix A (m x n) and a random vector v (n,)
A = torch.rand(m, n)
v = torch.rand(n)
# Time `torch.mv` (matrix-vector multiplication)
start_time = time.time()
result_mv = torch.mv(A, v)
mv_time = time.time() - start_time
# Time `torch.mm` (matrix-matrix multiplication)
start_time = time.time()
# We need to reshape v to be a matrix with shape (n, 1) for mm
result_mm = torch.mm(A, v.view(-1, 1))
mm_time = time.time() - start_time
# Print the results
print(f"Time taken by torch.mv: {mv_time:.6f} seconds")
print(f"Time taken by torch.mm: {mm_time:.6f} seconds")
Time taken by torch.mv: 0.009708 seconds
Time taken by torch.mm: 0.012335 seconds
Hadamard Product (Element Wise Multiplication)¶
- The Hadamard product of two vectors/matrices is very similar to matrix addition: elements at the same row and column of the two vectors/matrices are multiplied together to form a new vector/matrix.
- The two vectors/matrices must have the same order (shape), and the resulting matrix has that same order.
- Example: $\left[\begin{array}{cc} 1 & 2\\ 3 & 4 \end{array}\right]\circ\left[\begin{array}{cc} 5 & 6\\ 7 & 8 \end{array}\right]=\left[\begin{array}{cc} \left(1\times5\right) & \left(2\times6\right)\\ \left(3\times7\right) & \left(4\times8\right) \end{array}\right]=\left[\begin{array}{cc} 5 & 12\\ 21 & 32 \end{array}\right]$
import torch
a = torch.tensor([[1, 2],[3, 4]])
b = torch.tensor([[5, 6],[7, 8]])
ab = a*b
print (a)
print (b)
print ("Hadamard product of a and b is",ab)
tensor([[1, 2], [3, 4]]) tensor([[5, 6], [7, 8]]) Hadamard product of a and b is tensor([[ 5, 12], [21, 32]])
Matrix dot product¶
- The dot product of two matrices requires compatible sizes: the number of columns of the first matrix must equal the number of rows of the second matrix. Each entry of the result is the inner product of a row of the first matrix with a column of the second matrix, which is why that row and column must have the same length.
- For example:
$\left[\begin{array}{cc} 1 & 2\\ 3 & 4\\ 5 & 6 \end{array}\right]\cdot\left[\begin{array}{ccc} {\color{brown}1} & {\color{brown}2} & {\color{brown}3}\\ {\color{brown}4} & {\color{brown}5} & {\color{brown}6} \end{array}\right]=\left[\begin{array}{ccc} \left(1\times{\color{brown}1}+2\times{\color{brown}4}\right) & \left(1\times{\color{brown}2}+2\times{\color{brown}5}\right) & \left(1\times{\color{brown}3}+2\times{\color{brown}6}\right)\\ \left(3\times{\color{brown}1}+4\times{\color{brown}4}\right) & \left(3\times{\color{brown}2}+4\times{\color{brown}5}\right) & \left(3\times{\color{brown}3}+4\times{\color{brown}6}\right)\\ \left(5\times{\color{brown}1}+6\times{\color{brown}4}\right) & \left(5\times{\color{brown}2}+6\times{\color{brown}5}\right) & \left(5\times{\color{brown}3}+6\times{\color{brown}6}\right) \end{array}\right]=\left[\begin{array}{ccc} 9 & 12 & 15\\ 19 & 26 & 33\\ 29 & 40 & 51 \end{array}\right]$
- In PyTorch we use torch.mm() to calculate the dot product of two 2-dimensional matrices. This method takes an $m \times n$ tensor and an $n \times p$ tensor and returns an $m \times p$ tensor. It only works with two-dimensional matrices, not single-dimensional vectors, and it does not support broadcasting. (Broadcasting is how tensors with different shapes are handled in an operation: the smaller tensor is expanded to match the shape of the larger one.)
# Example of matrix dot product
a = torch.arange(1, 7).view(2, 3)
b = torch.arange(1, 7).view(3, 2)
print(a)
print(b)
adotb=torch.mm(a, b)
print ("Dot product of a and b is",adotb)
tensor([[1, 2, 3], [4, 5, 6]]) tensor([[1, 2], [3, 4], [5, 6]]) Dot product of a and b is tensor([[22, 28], [49, 64]])
# Example of matrix dot product
a = torch.arange(1, 7).view(3, 2)
b = torch.arange(1, 7).view(2, 3)
print(a)
print(b)
adotb=torch.mm(a, b)
print ("Dot product of a and b is")
print (adotb)
tensor([[1, 2], [3, 4], [5, 6]]) tensor([[1, 2, 3], [4, 5, 6]]) Dot product of a and b is tensor([[ 9, 12, 15], [19, 26, 33], [29, 40, 51]])
- Unlike the inner product, matrix multiplication is not commutative: in general $\boldsymbol{a}\cdot\boldsymbol{b}\neq\boldsymbol{b}\cdot\boldsymbol{a}$
# Matrix multiplication is not commutative,
bdota=torch.mm(b, a)
print ("Dot product of b and a is",bdota)
- The example below shows why it is important that the number of columns of the first matrix matches the number of rows of the second matrix.
# the dimensions of the matrices is important for matrix multiplication
adota=torch.mm(a, a)
print ("Dot product of a and a is",adota)
---------------------------------------------------------------------------
RuntimeError                              Traceback (most recent call last)
Cell In[34], line 2
      1 # the dimensions of the matrices is important for matrix multiplication
----> 2 adota=torch.mm(a, a)
      3 print ("Dot product of a and a is",adota)

RuntimeError: mat1 and mat2 shapes cannot be multiplied (3x2 and 3x2)
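One way to make the shapes compatible (shown only to illustrate the rule) is to transpose the second factor: with a of shape 3x2, multiplying a by its transpose (2x3) gives a valid 3x3 product.
# a is 3x2, so a x a fails, but a (3x2) times a.T (2x3) is a valid 3x3 product
aaT = torch.mm(a, a.t())
print("Dot product of a and a-transpose is")
print(aaT)   # tensor([[ 5, 11, 17], [11, 25, 39], [17, 39, 61]])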
Matrix product of two tensors (general form)¶
- In PyTorch we use torch.matmul(Tensor_1, Tensor_2, out=None) to compute the product of two 1D tensors (vectors), two 2D matrices, or a mix of the two. This method also supports broadcasting and batched operations. The operation performed depends on the dimensions of the input tensors.
- The table below lists the various possible dimensions of the arguments and the operations based on it.
Argument 1 | Argument 2 | Action taken |
---|---|---|
1-dimensional | 1-dimensional | The scalar product is calculated |
2-dimensional | 2-dimensional | General matrix multiplication is done |
1-dimensional | 2-dimensional | Tensor 1 is prepended with a '1' to match the dimension of tensor 2 |
2-dimensional | 1-dimensional | Matrix-vector product is calculated |
1/N-dimensional (N>2) | 1/N-dimensional (N>2) | Batched matrix multiplication is done |
# both arguments 1D
vec_1 = torch.tensor([3, 6, 2])
vec_2 = torch.tensor([4, 1, 9])
print("Single dimensional tensors :", torch.matmul(vec_1, vec_2))
Single dimensional tensors : tensor(36)
# both arguments 2D
mat_1 = torch.tensor([[1, 2, 3],
[4, 3, 8],
[1, 7, 2]])
mat_2 = torch.tensor([[2, 4, 1],
[1, 3, 6],
[2, 6, 5]])
out = torch.matmul(mat_1, mat_2)
print("\n3x3 dimensional tensors :\n", out)
3x3 dimensional tensors : tensor([[10, 28, 28], [27, 73, 62], [13, 37, 53]])
# Arguments of different dimensions
# first argument 1D and second argument 2D
mat1_1 = torch.tensor([3, 6, 2])
mat1_2 = torch.tensor([[1, 2, 3],
[4, 3, 8],
[1, 7, 2]])
out_1 = torch.matmul(mat1_1, mat1_2)
print("\n1D-2D multiplication :\n", out_1)
1D-2D multiplication : tensor([29, 38, 61])
# first argument 2D and second argument 1D
mat2_1 = torch.tensor([[2, 4, 1],
[1, 3, 6],
[2, 6, 5]])
mat2_2 = torch.tensor([4, 1, 9])
# assigning to output tensor
out_2 = torch.matmul(mat2_1, mat2_2)
print("\n2D-1D multiplication :\n", out_2)
2D-1D multiplication : tensor([21, 61, 59])
# N-dimensional argument (N>2)
# creating Tensors using randn()
mat_1 = torch.randn(2, 3, 3)
mat_2 = torch.randn(3)
# printing the matrices
print("matrix A :\n", mat_1)
print("\nmatrix B :\n", mat_2)
# output
print("\nOutput :\n", torch.matmul(mat_1, mat_2))
matrix A :
 tensor([[[ 1.9742, -0.3101, 0.9207],
         [-0.5845, 0.3964, 0.2774],
         [ 0.1423, -0.6356, -1.0601]],

        [[ 0.7488, 0.0633, -0.1190],
         [ 0.2655, -1.8284, -1.4647],
         [ 0.2355, -0.5253, 0.6223]]])

matrix B :
 tensor([ 0.7186, -1.4878, 1.3330])

Output :
 tensor([[ 3.1072, -0.6399, -0.3651],
        [ 0.2852, 0.9588, 1.7803]])
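The example above broadcasts a single vector across a batch of matrices. For a genuinely batched matrix product (a small sketch with random inputs, so the values will differ from run to run), both arguments carry a leading batch dimension and torch.matmul multiplies the trailing two dimensions batch by batch:
batch_1 = torch.randn(2, 3, 4)   # a batch of two 3x4 matrices
batch_2 = torch.randn(2, 4, 5)   # a batch of two 4x5 matrices
out_batched = torch.matmul(batch_1, batch_2)
print(out_batched.shape)         # torch.Size([2, 3, 5]): one 3x5 product per batch element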
That's it for today¶
Next time we will discuss more advanced linear algebra topics before moving onto auto-differentiation!