Recall from last time: Reverse-Mode AD¶
- Fix one scalar output $\ell \in \mathbb{R}$
- Compute the partial derivative $\frac{\partial \ell}{\partial y}$ for each intermediate value $y$
- Need to do this by going backward through the computation (chain-rule sketch below)
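As a one-step worked example: if $u = f(x)$ and $\ell = g(u)$, the backward pass first computes $\frac{\partial \ell}{\partial u} = g'(u)$ and then pushes it one step back with the chain rule, $\frac{\partial \ell}{\partial x} = \frac{\partial \ell}{\partial u} \cdot \frac{\partial u}{\partial x}$.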
"Deep Learning" ML Frameworks¶
Classical Core Components:
- Numerical linear algebra library
- Hardware support (e.g. GPU)
- Backpropagation engine
- Library for expressing deep neural networks
All embedded in a high-level language
- Usually Python.
In [1]:
import numpy
In [2]:
x = numpy.zeros(1024)
In [3]:
x
Out[3]:
array([0., 0., 0., ..., 0., 0., 0.])
In [4]:
x.dtype
Out[4]:
dtype('float64')
In [6]:
y = x
In [7]:
y[1] = 17
In [8]:
x
Out[8]:
array([ 0., 17., 0., ..., 0., 0., 0.])
In [9]:
import torch
In [10]:
x = torch.zeros(1024)
y = x
y[1] = 17
x
Out[10]:
tensor([ 0., 17., 0., ..., 0., 0., 0.])
In [13]:
z = x[1:5]
z[1] = 6
In [14]:
x
Out[14]:
tensor([ 0., 17., 6., ..., 0., 0., 0.])
In [15]:
a = [0,0,0,0,0]
b = a
b[1] = 4
a
Out[15]:
[0, 4, 0, 0, 0]
In [18]:
c = a[1:3]
c[1] = 5
In [20]:
c
Out[20]:
[4, 5]
In [19]:
a
Out[19]:
[0, 4, 0, 0, 0]
Numerical Linear Algebra¶
You've already seen and used this sort of thing: NumPy.
- Arrays are objects "owned" by the library
- Any arithmetic operation on these objects goes through the library
- The library calls an optimized function to compute the operation
- This happens outside the Python interpreter (see the timing sketch after this list)
- Control is returned to python when the function finishes
- By default you're only going to be running one such function at a time.
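To make the "outside the interpreter" point concrete, here is a quick sketch (not from the lecture; the timings are illustrative):

import time
import numpy

x = numpy.random.rand(1_000_000)

# Pure-Python loop: every element access goes back through the interpreter
begin = time.time()
total = 0.0
for v in x:
    total += v
print(f"python loop: {(time.time() - begin) * 1000:.1f} ms")

# One vectorized call: a single optimized routine runs outside the interpreter
begin = time.time()
total = x.sum()
print(f"numpy sum:   {(time.time() - begin) * 1000:.1f} ms")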
Numerical Linear Algebra: More Details¶
- Arrays are mutable
- Multiple references can exist! (see the copy sketch below)
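If you do want independent data, you have to copy explicitly; a minimal sketch (`.clone()` in PyTorch, `.copy()` in NumPy):

import torch

x = torch.zeros(8)
z = x[1:5].clone()   # clone() copies the data instead of creating a view
z[0] = 99
print(x)             # still all zeros: the original is untouched
# NumPy equivalent: x_np[1:5].copy()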
Numerical Linear Algebra On-Device¶
- The simplest version of this is essentially a "copy" of NumPy for each kind of hardware we want to run on: every function we want to support exists once per device type.
- e.g. one copy that runs on the CPU, one copy that runs on the GPU
- Arrays are located explicitly on one device
- in PyTorch, you move them with x.to("device_name")
- When we try to call a function, the library checks where the inputs are located
- if they're all on one device, it calls that device's version of the function
- if they're not all on the same device, it raises an exception (sketched after the next cell)
In [28]:
x = torch.randn(4,4)
y = torch.randn(4,4,device='mps')
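Trying to combine the two raises an error; a sketch (this needs an MPS-capable machine, and the exact message depends on the PyTorch version):

try:
    z = x + y          # x lives on the CPU, y on the MPS device
except RuntimeError as e:
    print("RuntimeError:", e)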
Eager Execution vs Graph Execution¶
When we manifest a node of the compute graph, we can either:
- (eager) compute and manifest the value at that node immediately
- (graph) just manifest the node
- need to call some function to compute the forward pass later
This was the classic distinction between TensorFlow and PyTorch
In [40]:
import torch
In [41]:
x = torch.ones((1,3,4))
In [45]:
x = torch.ones(())
x = x + x
In [46]:
x
Out[46]:
tensor(2.)
In [47]:
x = torch.ones(())
x.requires_grad = True
u = (x + 2)
y = u.square()  # y = (x + 2)^2, so dy/dx = 2 * (x + 2) = 6 at x = 1
y
Out[47]:
tensor(9., grad_fn=<PowBackward0>)
In [48]:
with torch.no_grad():
    v = x * x   # not recorded in the graph: v has no grad_fn and requires_grad=False
In [49]:
v
Out[49]:
tensor(1.)
In [51]:
y.backward()
In [54]:
x.grad
Out[54]:
tensor(6.)
In [56]:
def dumb_abs(a):
    if a >= 0:
        return a
    else:
        return -a
In [65]:
x = torch.tensor(-5.0)
x.requires_grad = True
In [66]:
y = dumb_abs(x)
y
Out[66]:
tensor(5., grad_fn=<NegBackward0>)
In [67]:
y.backward()
x.grad
Out[67]:
tensor(-1.)
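Since x was negative, only the `return -a` branch entered the graph (hence grad_fn=<NegBackward0> and a gradient of -1). Re-running with a positive input traces the other branch; a quick sketch (not in the original notebook):

x2 = torch.tensor(5.0, requires_grad=True)
y2 = dumb_abs(x2)      # this time the positive branch is taken
y2.backward()
print(x2.grad)         # tensor(1.)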
Advantages of eager mode (compute values & manifest graph at the same time):
- much better for value-based debugging!
- varying shapes
- less complicated
- condition on values (see the tracing sketch after these lists)
Advantages of lazy mode/graph mode (manifest graph first, then compute values):
- heavier static optimization
- better for shape-based debugging
- could use less memory
- graph overhead less/amortized
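To see why value-dependent control flow is awkward once you capture a graph first, here is a sketch using `torch.jit.trace` (one way PyTorch can capture a graph; not part of the original lecture). Tracing records only the ops that actually ran for the example input, so the branch taken gets baked into the graph:

# uses dumb_abs from above; tracing emits a warning about converting a tensor to a Python boolean
traced = torch.jit.trace(dumb_abs, torch.tensor(-5.0))
print(traced(torch.tensor(-5.0)))   # tensor(5.)
print(traced(torch.tensor(3.0)))    # tensor(-3.) -- the 'if' was not captured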
In [68]:
import time
In [70]:
N = 1024 * 16
X = torch.randn(N,N)
Y = torch.randn(N,N)
In [82]:
begin = time.time()
Z = X @ Y
print(Z[0,0])
end = time.time()
print(f"elapsed: {(end - begin) * 1000} ms")
tensor(111.4226)
elapsed: 4410.971879959106 ms
In [83]:
X_mps = X.to("mps")
Y_mps = Y.to("mps")
begin = time.time()
Z_mps = X_mps @ Y_mps
print(Z_mps[0,0])
end = time.time()
print(f"elapsed: {(end - begin) * 1000} ms")
tensor(111.4226, device='mps:0')
elapsed: 912.1642112731934 ms
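A side note (not from the lecture): MPS kernels are launched asynchronously, and the timing above is only meaningful because printing `Z_mps[0,0]` forces the result back to the CPU inside the timed region. An explicit alternative, assuming a PyTorch build where `torch.mps.synchronize()` is available:

begin = time.time()
Z_mps = X_mps @ Y_mps
torch.mps.synchronize()   # wait for the GPU to actually finish the matmul
end = time.time()
print(f"elapsed: {(end - begin) * 1000} ms")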
In [84]:
import torch
In [85]:
torch.nn
Out[85]:
<module 'torch.nn' from '/opt/anaconda3/lib/python3.10/site-packages/torch/nn/__init__.py'>
In [86]:
X = torch.nn.Linear(128,128)
In [98]:
X = torch.nn.Sequential(
    torch.nn.Linear(128,128),
    torch.nn.ReLU(),
    torch.nn.Linear(128,128),
    torch.nn.ReLU(),
    torch.nn.Linear(128,1)
)
In [99]:
X
Out[99]:
Sequential(
  (0): Linear(in_features=128, out_features=128, bias=True)
  (1): ReLU()
  (2): Linear(in_features=128, out_features=128, bias=True)
  (3): ReLU()
  (4): Linear(in_features=128, out_features=1, bias=True)
)
In [100]:
a = torch.randn(128)
In [103]:
X[0].weight
Out[103]:
Parameter containing:
tensor([[-0.0642,  0.0879, -0.0534,  ...,  0.0206,  0.0588, -0.0675],
        [-0.0641, -0.0230,  0.0114,  ...,  0.0265,  0.0713, -0.0848],
        [-0.0686,  0.0794,  0.0154,  ...,  0.0783,  0.0211,  0.0513],
        ...,
        [ 0.0850, -0.0019,  0.0655,  ..., -0.0470, -0.0641,  0.0205],
        [ 0.0141,  0.0150,  0.0432,  ...,  0.0211, -0.0118, -0.0345],
        [-0.0493,  0.0454,  0.0276,  ..., -0.0297,  0.0097,  0.0564]],
       requires_grad=True)
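A sketch of running the network forward on the `a` created above (not executed in the original notebook):

out = X(a)           # 128 -> 128 -> 128 -> 1
print(out.shape)     # torch.Size([1])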
In [99]:
U_mps = U.to("mps")
In [100]:
U
Out[100]:
tensor([1.])
In [101]:
U_mps[0] = 3
In [102]:
U
Out[102]:
tensor([1.])
In [103]:
U_mps
Out[103]:
tensor([3.], device='mps:0')
In [104]:
U_mps.cpu()
Out[104]:
tensor([3.])
In [105]:
U_mps.to("cpu")
Out[105]:
tensor([3.])
In [106]:
U = torch.ones((5,5,5),device="mps")
In [111]:
(N ** 3)/(1024**3)  # elements in an N x N x N tensor, in units of 2^30: 4096 Gi elements, ~16 TiB at float32
Out[111]:
4096.0
In [113]:
U = torch.ones((N,N,N),device="meta")  # ~16 TiB of float32 if it were real -- fine on the meta device
The meta device: a fake device that stores only metadata (shapes, dtypes). It can "hold" tensors of any size and run ops of any size, but you can't see the results!
In [38]:
torch.ones((1000000,2000000),device="meta") @ torch.ones((2000000,3000000),device="meta")
Out[38]:
tensor(..., device='meta', size=(1000000, 3000000))
In [39]:
torch.ones((10000,20000),device="meta") @ torch.ones((30000,30000),device="meta")
---------------------------------------------------------------------------
RuntimeError                              Traceback (most recent call last)
Cell In[39], line 1
----> 1 torch.ones((10000,20000),device="meta") @ torch.ones((30000,30000),device="meta")

File /opt/anaconda3/lib/python3.10/site-packages/torch/_meta_registrations.py:2100, in meta_mm(a, b)
   2098 N, M1 = a.shape
   2099 M2, P = b.shape
-> 2100 torch._check(
   2101     M1 == M2,
   2102     lambda: f"a and b must have same reduction dim, but got [{N}, {M1}] X [{M2}, {P}].",
   2103 )
   2104 return a.new_empty(N, P)

RuntimeError: a and b must have same reduction dim, but got [10000, 20000] X [30000, 30000].
In [119]:
torch.ones((1000000,2000000),device="meta")
Out[119]:
tensor(..., device='meta', size=(1000000, 2000000))
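What a meta tensor does keep is its metadata; a small sketch:

t = torch.ones((1000000, 2000000), device="meta")
print(t.shape, t.dtype, t.device)   # shape/dtype/device are available; the values are not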
In [ ]:
torch.ones((1000000,2000000)).to("meta")  # unlike creating directly on "meta", this would first allocate the full ~8 TB tensor on the CPU