import numpy
numpy.__version__

'1.19.5'


import numpy as np


import array
L = list(range(10))
A = array.array('i', L)
A

array('i', [0, 1, 2, 3, 4, 5, 6, 7, 8, 9])


type(A)

array.array


[x ** 2 for x in range(10)]

[0, 1, 4, 9, 16, 25, 36, 49, 64, 81]


type(_)

list


np.array([1, 4, 2, 5, 3])

array([1, 4, 2, 5, 3])


np.array([3.14, 4, 2, 3])

array([3.14, 4.  , 2.  , 3.  ])


np.array([1, 2, 3, 4], dtype='float32')

array([1., 2., 3., 4.], dtype=float32)


np.zeros(10, dtype=int)

array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0])


np.ones((3, 5), dtype=float)

array([[1., 1., 1., 1., 1.],
       [1., 1., 1., 1., 1.],
       [1., 1., 1., 1., 1.]])


np.full((3, 5), 3.14)

array([[3.14, 3.14, 3.14, 3.14, 3.14],
       [3.14, 3.14, 3.14, 3.14, 3.14],
       [3.14, 3.14, 3.14, 3.14, 3.14]])


np.arange(0, 20, 2)

array([ 0,  2,  4,  6,  8, 10, 12, 14, 16, 18])


np.linspace(0, 1, 5)

array([0.  , 0.25, 0.5 , 0.75, 1.  ])


np.random.random((3, 3))

array([[0.49760049, 0.67705904, 0.59093804],
       [0.99268699, 0.42792808, 0.8336333 ],
       [0.44928886, 0.70924885, 0.1681015 ]])


np.random.normal(0, 1, (3, 3))

array([[-0.84044642,  1.54753956, -0.023514  ],
       [ 1.09749938,  0.70455525,  0.57204258],
       [ 0.47691043,  0.89482679, -2.07735954]])


np.eye(3)

array([[1., 0., 0.],
       [0., 1., 0.],
       [0., 0., 1.]])


[x**4 for i, x in enumerate(range(10, 0, -1))]

[10000, 6561, 4096, 2401, 1296, 625, 256, 81, 16, 1]

_

[10000, 6561, 4096, 2401, 1296, 625, 256, 81, 16, 1]


[ _**4 for (x, _, _) in [(1, 2, 3), (2, 3, 4)]]

[81, 256]


[ tuple([x**4, y**3]) for (x, y, _) in [(1, 2, 3), (2, 3, 4)]]

[(1, 8), (16, 27)]


a = (2, 3, 4)


a.append(5)

---------------------------------------------------------------------------
AttributeError                            Traceback (most recent call last)
<ipython-input-18-80c7c94d949c> in <module>
----> 1 a.append(5)

AttributeError: 'tuple' object has no attribute 'append'


b = a + (5,)
b

(2, 3, 4, 5)


assert a != b


(1,2,3), [1, 2, 3]

((1, 2, 3), [1, 2, 3])


tuple(range(100))

(0,
 1,
 2,
 3,
 4,
 5,
 6,
 7,
 8,
 9,
 10,
 11,
 12,
 13,
 14,
 15,
 16,
 17,
 18,
 19,
 20,
 21,
 22,
 23,
 24,
 25,
 26,
 27,
 28,
 29,
 30,
 31,
 32,
 33,
 34,
 35,
 36,
 37,
 38,
 39,
 40,
 41,
 42,
 43,
 44,
 45,
 46,
 47,
 48,
 49,
 50,
 51,
 52,
 53,
 54,
 55,
 56,
 57,
 58,
 59,
 60,
 61,
 62,
 63,
 64,
 65,
 66,
 67,
 68,
 69,
 70,
 71,
 72,
 73,
 74,
 75,
 76,
 77,
 78,
 79,
 80,
 81,
 82,
 83,
 84,
 85,
 86,
 87,
 88,
 89,
 90,
 91,
 92,
 93,
 94,
 95,
 96,
 97,
 98,
 99)


def A(a, b=0, c=1):
    """Return ``a + b + c``; *b* defaults to 0 and *c* defaults to 1."""
    partial = a + b
    return partial + c


A(1, 2,)

4


{1, 2, 23,}

{1, 2, 23}


L = [
    '/my/path/to/an/interesting/file0',
    '/my/path/to/an/interesting/file1',
    '/my/path/to/an/interesting/file2',
    '/my/path/to/an/interesting/file3',
    '/my/path/to/an/interesting/file4',
    '/my/path/to/an/interesting/file5',
]

L

['/my/path/to/an/interesting/file0',
 '/my/path/to/an/interesting/file1',
 '/my/path/to/an/interesting/file2',
 '/my/path/to/an/interesting/file3',
 '/my/path/to/an/interesting/file4',
 '/my/path/to/an/interesting/file5']


[object(), 3, 3.14, 'hello world']

[<object at 0x7fd9f964d760>, 3, 3.14, 'hello world']


np.random.seed(0)  # seed for reproducibility

x1 = np.random.randint(10, size=6)  # One-dimensional array
x2 = np.random.randint(10, size=(3, 4))  # Two-dimensional array
x3 = np.random.randint(10, size=(3, 4, 5))  # Three-dimensional array


print("x3 ndim: ", x3.ndim)
print("x3 shape:", x3.shape)
print("x3 size: ", x3.size)
print("dtype:", x3.dtype)

x3 ndim:  3
x3 shape: (3, 4, 5)
x3 size:  60
dtype: int64

x1

array([5, 0, 3, 3, 7, 9])


x1[0]

5


x1[-1] # To index from the end of the array, you can use negative indices.

9

x2

array([[3, 5, 2, 4],
       [7, 6, 8, 8],
       [1, 6, 7, 7]])


x2[0, 0]

3


x2[2, -1]

7


x2[0, 0] = 12
x2

array([[12,  5,  2,  4],
       [ 7,  6,  8,  8],
       [ 1,  6,  7,  7]])


x1[0] = 3.14159  # this will be truncated!
x1

array([3, 0, 3, 3, 7, 9])


x = np.arange(10)
x

array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9])


x[:5]  # first five elements

array([0, 1, 2, 3, 4])


x[5:]  # elements from index 5 onward (index 5 included)

array([5, 6, 7, 8, 9])


x[4:7]  # middle sub-array

array([4, 5, 6])


x[::2]  # every other element

array([0, 2, 4, 6, 8])


x[1::2]  # every other element, starting at index 1

array([1, 3, 5, 7, 9])


x[::-1]  # all elements, reversed

array([9, 8, 7, 6, 5, 4, 3, 2, 1, 0])


x[5::-2]  # reversed every other from index 5

array([5, 3, 1])

x2

array([[12,  5,  2,  4],
       [ 7,  6,  8,  8],
       [ 1,  6,  7,  7]])


x2[:2, :3]  # two rows, three columns

array([[12,  5,  2],
       [ 7,  6,  8]])


x2[:3, ::2]  # all rows, every other column

array([[12,  2],
       [ 7,  8],
       [ 1,  7]])


x2[::-1, ::-1]

array([[ 7,  7,  6,  1],
       [ 8,  8,  6,  7],
       [ 4,  2,  5, 12]])


print(x2[:, 0])  # first column of x2

[12  7  1]


print(x2[0, :])  # first row of x2

[12  5  2  4]


print(x2[0])  # equivalent to x2[0, :]

[12  5  2  4]

x2

array([[12,  5,  2,  4],
       [ 7,  6,  8,  8],
       [ 1,  6,  7,  7]])


x2_sub = x2[:2, :2]
x2_sub

array([[12,  5],
       [ 7,  6]])


x2_sub[0, 0] = 99 # if we modify this subarray, the original array is changed too
x2

array([[99,  5,  2,  4],
       [ 7,  6,  8,  8],
       [ 1,  6,  7,  7]])


np.arange(1, 10)

array([1, 2, 3, 4, 5, 6, 7, 8, 9])


_.shape

(9,)


__.reshape((3, 3))

array([[1, 2, 3],
       [4, 5, 6],
       [7, 8, 9]])


x = np.array([1, 2, 3])
x

array([1, 2, 3])


x.shape

(3,)


x.reshape((1, 3)) # row vector via reshape

array([[1, 2, 3]])


_.shape

(1, 3)


x.shape # therefore `reshape` doesn't modify in place the array we are working on

(3,)


x[np.newaxis, :] # row vector via newaxis

array([[1, 2, 3]])


_.shape

(1, 3)


x.shape

(3,)


x.reshape((3, 1)) # column vector via reshape

array([[1],
       [2],
       [3]])


_.shape

(3, 1)


x.shape

(3,)


x[:, np.newaxis] # column vector via newaxis

array([[1],
       [2],
       [3]])


_.shape

(3, 1)


x.shape

(3,)


x = np.array([1, 2, 3])
y = np.array([3, 2, 1])
np.concatenate([x, y])

array([1, 2, 3, 3, 2, 1])


z = [99, 99, 99]
np.concatenate([x, y, z])

array([ 1,  2,  3,  3,  2,  1, 99, 99, 99])


grid = np.array([[1, 2, 3],
                 [4, 5, 6]])


np.concatenate([grid, grid]) # concatenate along the first axis

array([[1, 2, 3],
       [4, 5, 6],
       [1, 2, 3],
       [4, 5, 6]])


np.concatenate([grid, grid], axis=1) # concatenate along the second axis (zero-indexed)

array([[1, 2, 3, 1, 2, 3],
       [4, 5, 6, 4, 5, 6]])


x = np.array([1, 2, 3])
grid = np.array([[9, 8, 7],
                 [6, 5, 4]])

np.vstack([x, grid]) # vertically stack the arrays

array([[1, 2, 3],
       [9, 8, 7],
       [6, 5, 4]])


y = np.array([[99],
              [99]])
np.hstack([grid, y]) # horizontally stack the arrays

array([[ 9,  8,  7, 99],
       [ 6,  5,  4, 99]])


x = [1, 2, 3, 99, 99, 3, 2, 1]
x1, x2, x3 = np.split(x, [3, 5])
print(x1, x2, x3)

[1 2 3] [99 99] [3 2 1]


grid = np.arange(16).reshape((4, 4))
grid

array([[ 0,  1,  2,  3],
       [ 4,  5,  6,  7],
       [ 8,  9, 10, 11],
       [12, 13, 14, 15]])


np.vsplit(grid, [2])

[array([[0, 1, 2, 3],
        [4, 5, 6, 7]]),
 array([[ 8,  9, 10, 11],
        [12, 13, 14, 15]])]


np.hsplit(grid, [2])

[array([[ 0,  1],
        [ 4,  5],
        [ 8,  9],
        [12, 13]]),
 array([[ 2,  3],
        [ 6,  7],
        [10, 11],
        [14, 15]])]


np.random.seed(0)

def compute_reciprocals(values):
    """Return the reciprocal of every element of *values* as a float array.

    The result is filled one element at a time in an explicit Python loop;
    the notebook times this against the vectorized ``1.0 / big_array``.
    """
    reciprocals = np.empty(len(values))
    for position, value in enumerate(values):
        reciprocals[position] = 1.0 / value
    return reciprocals
        
values = np.random.randint(1, 10, size=5)
compute_reciprocals(values)

array([0.16666667, 1.        , 0.25      , 0.25      , 0.125     ])


big_array = np.random.randint(1, 100, size=1000000)
%timeit compute_reciprocals(big_array)

2.63 s ± 29.4 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)


%timeit (1.0 / big_array)

2.97 ms ± 35.3 µs per loop (mean ± std. dev. of 7 runs, 100 loops each)


np.arange(5) / np.arange(1, 6)

array([0.        , 0.5       , 0.66666667, 0.75      , 0.8       ])


x = np.arange(9).reshape((3, 3))
2 ** x

array([[  1,   2,   4],
       [  8,  16,  32],
       [ 64, 128, 256]])


x = np.arange(4)
print("x     =", x)
print("x + 5 =", x + 5)
print("x - 5 =", x - 5)
print("x * 2 =", x * 2)
print("x / 2 =", x / 2)
print("x // 2 =", x // 2)  # floor division
print("-x     = ", -x)
print("x ** 2 = ", x ** 2)
print("x % 2  = ", x % 2)

x     = [0 1 2 3]
x + 5 = [5 6 7 8]
x - 5 = [-5 -4 -3 -2]
x * 2 = [0 2 4 6]
x / 2 = [0.  0.5 1.  1.5]
x // 2 = [0 0 1 1]
-x     =  [ 0 -1 -2 -3]
x ** 2 =  [0 1 4 9]
x % 2  =  [0 1 0 1]


-(0.5*x + 1) ** 2 # can be strung together also

array([-1.  , -2.25, -4.  , -6.25])


theta = np.linspace(0, np.pi, 3)


print("theta      = ", theta)
print("sin(theta) = ", np.sin(theta))
print("cos(theta) = ", np.cos(theta))
print("tan(theta) = ", np.tan(theta))

theta      =  [0.         1.57079633 3.14159265]
sin(theta) =  [0.0000000e+00 1.0000000e+00 1.2246468e-16]
cos(theta) =  [ 1.000000e+00  6.123234e-17 -1.000000e+00]
tan(theta) =  [ 0.00000000e+00  1.63312394e+16 -1.22464680e-16]


x = [1, 2, 3]
print("x     =", x)
print("e^x   =", np.exp(x))
print("2^x   =", np.exp2(x))
print("3^x   =", np.power(3, x))

x     = [1, 2, 3]
e^x   = [ 2.71828183  7.3890561  20.08553692]
2^x   = [2. 4. 8.]
3^x   = [ 3  9 27]


x = [1, 2, 4, 10]
print("x        =", x)
print("ln(x)    =", np.log(x))
print("log2(x)  =", np.log2(x))
print("log10(x) =", np.log10(x))

x        = [1, 2, 4, 10]
ln(x)    = [0.         0.69314718 1.38629436 2.30258509]
log2(x)  = [0.         1.         2.         3.32192809]
log10(x) = [0.         0.30103    0.60205999 1.        ]


x = np.arange(5)
y = np.empty(5)
np.multiply(x, 10, out=y)
print(y)

[ 0. 10. 20. 30. 40.]


y = np.zeros(10)
np.power(2, x, out=y[::2])
print(y)

[ 1.  0.  2.  0.  4.  0.  8.  0. 16.  0.]


x = np.arange(1, 6)
np.multiply.outer(x, x)

array([[ 1,  2,  3,  4,  5],
       [ 2,  4,  6,  8, 10],
       [ 3,  6,  9, 12, 15],
       [ 4,  8, 12, 16, 20],
       [ 5, 10, 15, 20, 25]])


L = np.random.random(100)
sum(L)

54.43983466916921


np.sum(L)

54.439834669169194


big_array = np.random.rand(1_000_000)
%timeit sum(big_array)
%timeit np.sum(big_array)

222 ms ± 6.88 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
791 µs ± 7.3 µs per loop (mean ± std. dev. of 7 runs, 1000 loops each)


min(big_array), max(big_array)

(7.071203171893359e-07, 0.9999997207656334)


np.min(big_array), np.max(big_array)

(7.071203171893359e-07, 0.9999997207656334)


%timeit min(big_array)
%timeit np.min(big_array)

118 ms ± 1.78 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)
656 µs ± 8 µs per loop (mean ± std. dev. of 7 runs, 1000 loops each)


big_array.min(), big_array.max(), big_array.sum()

(7.071203171893359e-07, 0.9999997207656334, 500216.8034810001)


M = np.random.random((3, 4))
M

array([[0.07452786, 0.41843762, 0.99939192, 0.66974416],
       [0.54717434, 0.82711104, 0.23097044, 0.16283152],
       [0.27950484, 0.58540569, 0.90657413, 0.18671025]])


M.sum() # By default, each NumPy aggregation function works on the whole array

5.888383818472106


M.min(axis=0) # specifying the axis along which the aggregate is computed

array([0.07452786, 0.41843762, 0.23097044, 0.16283152])


M.max(axis=1) # find the maximum value within each row

array([0.99939192, 0.82711104, 0.90657413])


a = np.array([0, 1, 2])
b = np.array([5, 5, 5])
a + b

array([5, 6, 7])


a + 5

array([5, 6, 7])


M = np.ones((3, 3))
M

array([[1., 1., 1.],
       [1., 1., 1.],
       [1., 1., 1.]])


M + a

array([[1., 2., 3.],
       [1., 2., 3.],
       [1., 2., 3.]])


a = np.arange(3)
b = np.arange(3)[:, np.newaxis]
a, b

(array([0, 1, 2]),
 array([[0],
        [1],
        [2]]))


a + b

array([[0, 1, 2],
       [1, 2, 3],
       [2, 3, 4]])


X = np.random.random((10, 3))


Xmean = X.mean(0)
Xmean

array([0.55965135, 0.52179051, 0.41008518])


X_centered = X - Xmean


X_centered.mean(0) # To double-check, we can check that the centered array has near 0 means.

array([-6.66133815e-17,  3.33066907e-17, -7.77156117e-17])


steps = 500
x = np.linspace(0, 5, steps) # x and y each hold `steps` evenly spaced values from 0 to 5
# y gets a trailing axis (shape (steps, 1)), so it broadcasts against the
# 1-D x below and z comes out as a (steps, steps) grid
y = np.linspace(0, 5, steps)[:, np.newaxis]
z = np.sin(x) ** 10 + np.cos(10 + y * x) * np.cos(x)


%matplotlib inline
import matplotlib.pyplot as plt
plt.imshow(z, origin='lower', extent=[0, 5, 0, 5], cmap='viridis')
plt.colorbar();


x = np.array([1, 2, 3, 4, 5])


x < 3  # less than

array([ True,  True, False, False, False])


x > 3  # greater than

array([False, False, False,  True,  True])


x != 3  # not equal

array([ True,  True, False,  True,  True])


(2 * x) == (x ** 2)

array([False,  True, False, False, False])


rng = np.random.RandomState(0)
x = rng.randint(10, size=(3, 4))
x

array([[5, 0, 3, 3],
       [7, 9, 3, 5],
       [2, 4, 7, 6]])


x < 6

array([[ True,  True,  True,  True],
       [False, False,  True,  True],
       [ True,  True, False, False]])


np.count_nonzero(x < 6) # how many values less than 6?

8


np.sum(x < 6)

8


np.sum(x < 6, axis=1) # how many values less than 6 in each row?

array([4, 2, 2])


np.any(x > 8) # are there any values greater than 8?

True


np.any(x < 0) # are there any values less than zero?

False


np.all(x < 10) # are all values less than 10?

True


np.all(x < 8, axis=1) # are all values in each row less than 8?

array([ True, False,  True])

x

array([[5, 0, 3, 3],
       [7, 9, 3, 5],
       [2, 4, 7, 6]])


x < 5

array([[False,  True,  True,  True],
       [False, False,  True, False],
       [ True,  True, False, False]])


x[x < 5]

array([0, 3, 3, 3, 2, 4])


rand = np.random.RandomState(42)

x = rand.randint(100, size=10)
x

array([51, 92, 14, 71, 60, 20, 82, 86, 74, 74])


[x[3], x[7], x[2]] # Suppose we want to access three different elements.

[71, 86, 14]


ind = [3, 7, 4]
x[ind] # Alternatively, we can pass a single list or array of indices

array([71, 86, 60])


ind = np.array([[3, 7],
                [4, 5]])
x[ind]

array([[71, 86],
       [60, 20]])


X = np.arange(12).reshape((3, 4))
X

array([[ 0,  1,  2,  3],
       [ 4,  5,  6,  7],
       [ 8,  9, 10, 11]])


row = np.array([0, 1, 2])
col = np.array([2, 1, 3])
X[row, col]

array([ 2,  5, 11])


X[row[:, np.newaxis], col]

array([[ 2,  1,  3],
       [ 6,  5,  7],
       [10,  9, 11]])


row[:, np.newaxis] * col

array([[0, 0, 0],
       [2, 1, 3],
       [4, 2, 6]])

X

array([[ 0,  1,  2,  3],
       [ 4,  5,  6,  7],
       [ 8,  9, 10, 11]])


X[2, [2, 0, 1]] # combine fancy and simple indices

array([10,  8,  9])


X[1:, [2, 0, 1]] # combine fancy indexing with slicing

array([[ 6,  4,  5],
       [10,  8,  9]])


mask = np.array([1, 0, 1, 0], dtype=bool)
X[row[:, np.newaxis], mask] # combine fancy indexing with masking

array([[ 0,  2],
       [ 4,  6],
       [ 8, 10]])


mean = [0, 0]
cov = [[1, 2],
       [2, 5]]
X = rand.multivariate_normal(mean, cov, 100)
X.shape

(100, 2)


plt.scatter(X[:, 0], X[:, 1]);


indices = np.random.choice(X.shape[0], 20, replace=False)
indices

array([22, 56, 83, 30, 58, 32, 78, 14, 36, 33,  8, 98, 25,  6, 41, 84, 13,
       92,  7, 34])


selection = X[indices]  # fancy indexing here
selection.shape

(20, 2)


plt.scatter(X[:, 0], X[:, 1], alpha=0.3);


x = np.arange(10)
i = np.array([2, 1, 8, 4])
x[i] = 99
x

array([ 0, 99, 99,  3, 99,  5,  6,  7, 99,  9])


x[i] -= 10 # use any assignment-type operator for this
x

array([ 0, 89, 89,  3, 89,  5,  6,  7, 89,  9])


x = np.zeros(10)
x[[0, 0]] = [4, 6]
x

array([6., 0., 0., 0., 0., 0., 0., 0., 0., 0.])


i = [2, 3, 3, 4, 4, 4]
x[i] += 1
x

array([6., 0., 1., 1., 1., 0., 0., 0., 0., 0.])


x = np.zeros(10)
np.add.at(x, i, 1)
x

array([0., 0., 1., 2., 3., 0., 0., 0., 0., 0.])


np.random.seed(42)
x = np.random.randn(100)

# compute a histogram by hand
bins = np.linspace(-5, 5, 20)
counts = np.zeros_like(bins)

# find the appropriate bin for each x
i = np.searchsorted(bins, x)

# add 1 to each of these bins
np.add.at(counts, i, 1)


# The counts now reflect the number of points 
# within each bin–in other words, a histogram:
line, = plt.plot(bins, counts);
line.set_drawstyle("steps")


print("NumPy routine:")
%timeit counts, edges = np.histogram(x, bins)

print("Custom routine:")
%timeit np.add.at(counts, np.searchsorted(bins, x), 1)

NumPy routine:
35.1 µs ± 209 ns per loop (mean ± std. dev. of 7 runs, 10000 loops each)
Custom routine:
18.5 µs ± 405 ns per loop (mean ± std. dev. of 7 runs, 100000 loops each)


x = np.random.randn(1000000)
print("NumPy routine:")
%timeit counts, edges = np.histogram(x, bins)

print("Custom routine:")
%timeit np.add.at(counts, np.searchsorted(bins, x), 1)

NumPy routine:
95.9 ms ± 1.17 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)
Custom routine:
142 ms ± 115 µs per loop (mean ± std. dev. of 7 runs, 10 loops each)


x = np.array([2, 1, 4, 3, 5])
np.sort(x)

array([1, 2, 3, 4, 5])

x

array([2, 1, 4, 3, 5])


i = np.argsort(x)
i

array([1, 0, 3, 2, 4])


x[i]

array([1, 2, 3, 4, 5])


rand = np.random.RandomState(42)
X = rand.randint(0, 10, (4, 6))
X

array([[6, 3, 7, 4, 6, 9],
       [2, 6, 7, 4, 3, 7],
       [7, 2, 5, 4, 1, 7],
       [5, 1, 4, 0, 9, 5]])


np.sort(X, axis=0) # sort each column of X

array([[2, 1, 4, 0, 1, 5],
       [5, 2, 5, 4, 3, 7],
       [6, 3, 7, 4, 6, 7],
       [7, 6, 7, 4, 9, 9]])


np.sort(X, axis=1) # sort each row of X

array([[3, 4, 6, 6, 7, 9],
       [2, 3, 4, 6, 7, 7],
       [1, 2, 4, 5, 7, 7],
       [0, 1, 4, 5, 5, 9]])


x = np.array([7, 2, 3, 1, 6, 5, 4])
np.partition(x, 3)

array([2, 1, 3, 4, 6, 5, 7])


np.partition(X, 2, axis=1)

array([[3, 4, 6, 7, 6, 9],
       [2, 3, 4, 7, 6, 7],
       [1, 2, 4, 5, 7, 7],
       [0, 1, 4, 5, 9, 5]])


X = rand.rand(50, 2)

---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-8-ffd1d8c0b963> in <module>
----> 1 X = rand.rand(50, 2)

NameError: name 'rand' is not defined


plt.scatter(X[:, 0], X[:, 1], s=100);

---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-9-68a4fcce3c3f> in <module>
----> 1 plt.scatter(X[:, 0], X[:, 1], s=100);

NameError: name 'plt' is not defined


# compute the distance between each pair of points
dist_sq = np.sum((X[:, np.newaxis, :] - X[np.newaxis, :, :]) ** 2, axis=-1)
dist_sq.shape, np.all(dist_sq.diagonal() == 0)

((50, 50), True)


nearest = np.argsort(dist_sq, axis=1)
nearest[:,0]

array([ 0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15, 16,
       17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33,
       34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49])


K = 2
nearest_partition = np.argpartition(dist_sq, K + 1, axis=1)


plt.scatter(X[:, 0], X[:, 1], s=100)
K = 2 # draw lines from each point to its two nearest neighbors
for i in range(X.shape[0]):
    # The first K+1 columns of row i in nearest_partition index the K+1
    # smallest squared distances from point i, in no particular order;
    # one of them is normally i itself (distance 0), leaving K neighbors.
    for j in nearest_partition[i, :K+1]:
        # zip pairs up the two x-coordinates and the two y-coordinates,
        # so each call draws one segment between point j and point i
        plt.plot(*zip(X[j], X[i]), color='black')


# Annotations may be arbitrary expressions: ``(3 if 0 else 4)`` evaluates
# to 4, which is the value reported under the 'return' key of
# ``A.__annotations__``. This definition rebinds the name ``A`` used earlier.
def A(a: int) -> (3 if 0 else 4):
    """Return the constant 4; the argument *a* is not used."""
    return 4


A(3)

4


A.__annotations__

{'a': int, 'return': 4}


type(_)

dict


def B(f):
    """Print the ``__annotations__`` mapping attached to *f*."""
    annotations = f.__annotations__
    print(annotations)


B(A)

{'a': <class 'int'>, 'return': <object object at 0x7fd9be16ccc0>}

Data type	Description
`bool_`	Boolean (True or False) stored as a byte
`int_`	Default integer type (same as C `long`; normally either `int64` or `int32`)
`intc`	Identical to C `int` (normally `int32` or `int64`)
`intp`	Integer used for indexing (same as C `ssize_t`; normally either `int32` or `int64`)
`int8`	Byte (-128 to 127)
`int16`	Integer (-32768 to 32767)
`int32`	Integer (-2147483648 to 2147483647)
`int64`	Integer (-9223372036854775808 to 9223372036854775807)
`uint8`	Unsigned integer (0 to 255)
`uint16`	Unsigned integer (0 to 65535)
`uint32`	Unsigned integer (0 to 4294967295)
`uint64`	Unsigned integer (0 to 18446744073709551615)
`float_`	Shorthand for `float64`.
`float16`	Half precision float: sign bit, 5 bits exponent, 10 bits mantissa
`float32`	Single precision float: sign bit, 8 bits exponent, 23 bits mantissa
`float64`	Double precision float: sign bit, 11 bits exponent, 52 bits mantissa
`complex_`	Shorthand for `complex128`.
`complex64`	Complex number, represented by two 32-bit floats
`complex128`	Complex number, represented by two 64-bit floats

Function Name	NaN-safe Version	Description
`np.sum`	`np.nansum`	Compute sum of elements
`np.prod`	`np.nanprod`	Compute product of elements
`np.mean`	`np.nanmean`	Compute mean of elements
`np.std`	`np.nanstd`	Compute standard deviation
`np.var`	`np.nanvar`	Compute variance
`np.min`	`np.nanmin`	Find minimum value
`np.max`	`np.nanmax`	Find maximum value
`np.argmin`	`np.nanargmin`	Find index of minimum value
`np.argmax`	`np.nanargmax`	Find index of maximum value
`np.median`	`np.nanmedian`	Compute median of elements
`np.percentile`	`np.nanpercentile`	Compute rank-based statistics of elements
`np.any`	N/A	Evaluate whether any elements are true
`np.all`	N/A	Evaluate whether all elements are true

Introduction to NumPy¶

Understanding Data Types in Python¶

Creating Arrays from Python Lists¶

Creating Arrays from Scratch¶

NumPy Standard Data Types¶

INTERMEZZO¶

The Basics of NumPy Arrays¶

NumPy Array Attributes¶

Array Indexing: Accessing Single Elements¶

Array Slicing: Accessing Subarrays¶

One-dimensional subarrays¶

Multi-dimensional subarrays¶

Accessing array rows and columns¶

Subarrays as no-copy views¶

Reshaping of Arrays¶

Concatenation of arrays¶

Splitting of arrays¶

Computation on NumPy Arrays: Universal Functions¶

The Slowness of Loops¶

Introducing UFuncs¶

Array arithmetic¶

Trigonometric functions¶

Exponents and logarithms¶

Specifying output¶

Outer products¶

Aggregations: Min, Max, and Everything In Between¶

Summing the Values in an Array¶

Minimum and Maximum¶

Multi-dimensional aggregates¶

Other aggregation functions¶

Computation on Arrays: Broadcasting¶

Introducing Broadcasting¶

Rules of Broadcasting¶

Centering an array¶

Plotting a two-dimensional function¶

Comparisons, Masks, and Boolean Logic¶

Comparison Operators as ufuncs¶

Counting entries¶

Boolean Arrays as Masks¶

Fancy Indexing¶

Combined Indexing¶

Example: Selecting Random Points¶

Modifying Values with Fancy Indexing¶

Example: Binning Data¶

Sorting Arrays¶

Fast Sorting in NumPy: np.sort and np.argsort¶

Sorting along rows or columns¶

Partial Sorts: Partitioning¶

Example: k-Nearest Neighbors¶

Fast Sorting in NumPy: `np.sort` and `np.argsort`¶