import numpy as np
import random
import matplotlib.pyplot as plt
import imageio.v3 as imageio

# create a list
numbers = list(range(8))
numbers

[0, 1, 2, 3, 4, 5, 6, 7]

# turn it into a numpy array
arr = np.array(numbers)
arr

array([0, 1, 2, 3, 4, 5, 6, 7])

# index into the array
arr[4]

np.int64(4)

# check the shape of the array
arr.shape

(8,)

# slice a subarray
arr[2:4]

array([2, 3])

# implicit range start
arr[:4]

array([0, 1, 2, 3])

# implicit range end
arr[4:]

array([4, 5, 6, 7])

# slice the whole thing - unlike a list, this returns a view onto the same data, not a copy!
arr[:]

array([0, 1, 2, 3, 4, 5, 6, 7])

# array + scalar
arr + 4

array([ 4,  5,  6,  7,  8,  9, 10, 11])

# array + array
arr + arr

array([ 0,  2,  4,  6,  8, 10, 12, 14])

# scalar * array
2 * arr

array([ 0,  2,  4,  6,  8, 10, 12, 14])

# errors if shapes don't match
arr + arr[:4]

---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
Cell In[16], line 2
      1 # errors if shapes don't match
----> 2 arr + arr[:4]

ValueError: operands could not be broadcast together with shapes (8,) (4,)

# Build a list of 1 million random floats in [0, 1) to use as benchmark input.
N = 1_000_000
originals = [random.random() for _ in range(N)]

# Give each benchmark its own working copy up front, so the timed cells below
# measure only the arithmetic and not any allocation:
result_py = originals[:]         # independent Python list (shallow copy)
result_np = np.array(originals)  # np.array already copies the list's data

%%time
# how long does it take to subtract 0.5 from a million numbers, the pure python way?
for i in range(N):
    result_py[i] -= 0.5

CPU times: user 76.9 ms, sys: 11.4 ms, total: 88.3 ms
Wall time: 88 ms

%%time
# how long does it take to subtract 0.5 from a million numbers, the numpy way?
result_np -= 0.5

CPU times: user 1.82 ms, sys: 1.27 ms, total: 3.09 ms
Wall time: 3.07 ms

# seen before: np.array to turn an existing sequence (here a range) into an array
a = np.array(range(6))
a

array([0, 1, 2, 3, 4, 5])

# np.zeros - create an array filled with zeros
b = np.zeros((4,2))
b

array([[0., 0.],
       [0., 0.],
       [0., 0.],
       [0., 0.]])

b.dtype

dtype('float64')

# np.ones - fill with ones; specify data type
np.ones((3,3),dtype=np.int32)

array([[1, 1, 1],
       [1, 1, 1],
       [1, 1, 1]], dtype=int32)

# 2d arrays: np.zeros with a tuple shape, e.g. np.zeros((4,2)) as above

# create a 1d array and reshape it to 2d
a = np.array(range(6)).reshape((3, 2))
a

array([[0, 1],
       [2, 3],
       [4, 5]])

# indexing 2D arrays
a[0,1]

np.int64(1)

# slicing 2D arrays
a[:2,:2]

array([[0, 1],
       [2, 3]])

# make a 3D array
c = np.zeros((4,6,3))
c

array([[[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]],

       [[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]],

       [[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]],

       [[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]]])

# slice the 3D array
c[:4,2:3,0].shape

(4, 1)

b = np.array(range(6)).reshape(2, 3)
b

array([[0, 1, 2],
       [3, 4, 5]])

# elementwise comparison operator - array > scalar
b > 2

array([[False, False, False],
       [ True,  True,  True]])

# boolean indexing
b[b>=4]

array([4, 5])

# use the boolean mask as a multiplier: entries where b < 4 become 0
b * (b >= 4)

array([[0, 0, 0],
       [0, 4, 5]])

# Three small arrays reused in the examples that follow:
a = np.arange(6)                  # shape (6,):   [0, 1, 2, 3, 4, 5]
b = np.arange(6).reshape((2, 3))  # shape (2, 3): [[0, 1, 2], [3, 4, 5]]
c = np.array([1, 2])              # shape (2,)
b

array([[0, 1, 2],
       [3, 4, 5]])

# sum of a 2d array
b.sum()

np.int64(15)

# minimum of a 2d array
np.min(b)

np.int64(0)

# sum along one dimension of a 2d array
b.sum(axis=1)

array([ 3, 12])

b.shape, c.shape

((2, 3), (2,))

# shape mismatch
b * c

---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
Cell In[57], line 2
      1 # shape mismatch
----> 2 b * c

ValueError: operands could not be broadcast together with shapes (2,3) (2,)

b

array([[0, 1, 2],
       [3, 4, 5]])

c

array([1, 2])

np.reshape(c, (2, 1)).shape

(2, 1)

b.shape

(2, 3)

# unless the mismatched dimensions are singletons (size 1), which broadcast: (2,3) * (2,1) -> (2,3)
b * np.reshape(c, (2, 1))

array([[ 0,  1,  2],
       [ 6,  8, 10]])

# index with an integer array to pick out elements 0, 4 and 5 at once
a[np.array([0, 4, 5])]

array([0, 4, 5])

beans = imageio.imread("../data/beans.jpg")

plt.imshow(beans)

<matplotlib.image.AxesImage at 0x107d13710>

beans.shape

(600, 600, 3)

beans[0,0,:]

array([164, 150, 124], dtype=uint8)

beans_green = beans[:,:,1]
plt.imshow(beans_green, cmap="gray")
plt.colorbar()

<matplotlib.colorbar.Colorbar at 0x10f3f7e90>

plt.imshow(beans_green > 127, cmap="gray")
plt.colorbar()

<matplotlib.colorbar.Colorbar at 0x10f3260c0>

beans_green[beans_green > 127].mean()

np.float64(130.81223141203705)

beans_green.mean(axis=0).argmax()

np.int64(579)

Lecture 1A - `numpy` Crash Course

Goals

Code along!

Creating Arrays

Basic list-like slicing

Elementwise Operations

Demo: Speed Check

Multidimensional Arrays

ND arrays

Boolean Arrays, Masking

Aggregation / Projection

Broadcasting Basics

Exercise: Play with my cat

Lecture 1A - numpy Crash Course

Goals

Code along!

Creating Arrays

Basic list-like slicing

Elementwise Operations

Demo: Speed Check

Multidimensional Arrays

ND arrays

Boolean Arrays, Masking

Aggregation / Projection

Broadcasting Basics

Exercise: Play with my cat

Lecture 1A - `numpy` Crash Course¶