Disclaimer: This Jupyter Notebook contains content generated with the assistance of AI. While every effort has been made to review and validate the outputs, users should independently verify critical information before relying on it. The SELENE notebook repository is constantly evolving. We recommend downloading or pulling the latest version of this notebook from GitHub.

NumPy — Basic Tutorial¶

This notebook provides a basic tutorial on NumPy, one of the most essential libraries in the Python data science and machine learning ecosystem. NumPy (short for Numerical Python) provides powerful tools for working with numerical data, enabling efficient storage, manipulation, and computation on large arrays and matrices. Its performance and flexibility make it the foundation upon which many higher-level libraries such as Pandas, SciPy, and scikit-learn are built.

At its core, NumPy introduces the ndarray (n-dimensional array), a data structure that is both memory-efficient and fast. Unlike Python's built-in lists, NumPy arrays allow for vectorized operations, meaning that computations can be applied to entire arrays at once without writing explicit loops. This not only results in cleaner and more readable code but also achieves significant performance improvements due to optimized implementations in C and Fortran under the hood.

Learning NumPy is essential for anyone interested in data analysis, scientific computing, or machine learning. It provides the mathematical foundation for many algorithms and models, and understanding how to efficiently manipulate arrays is a skill that translates directly into better performance and cleaner implementations in applied projects. Even when working with more abstract or high-level frameworks, a solid grasp of NumPy concepts allows you to understand what happens behind the scenes.

Moreover, popular deep learning libraries such as PyTorch and TensorFlow adopt much of NumPy's naming conventions and array semantics. Functions like reshape, sum, or transpose behave very similarly in both NumPy and PyTorch, making the transition from NumPy to deep learning frameworks smooth and intuitive. For this reason, learning NumPy is not just about understanding one library but also about building a strong conceptual foundation for the entire Python scientific computing stack.

In this tutorial, we will explore the core features of NumPy, including array creation, indexing, slicing, reshaping, broadcasting, and basic mathematical operations. By the end, you will have a practical understanding of how to work efficiently with numerical data and be well-prepared to apply these concepts to more advanced libraries and real-world problems.

Setting up the Notebook¶

Make Required Imports¶

This notebook requires the import of different Python packages as well as additional Python modules that are part of the repository. If a package is missing, use your preferred package manager (e.g., conda or pip) to install it. If the code cell below runs without any errors, all required packages and modules have been successfully imported.

In [1]:
import numpy as np

from sklearn.metrics.pairwise import euclidean_distances
from sklearn.preprocessing import StandardScaler

Set Print Options¶

By default, NumPy prints multidimensional arrays with high precision and, where applicable, in scientific notation. To make the output easier to read, we limit it to 3 decimal places and suppress scientific notation. Feel free to remove this line and see how the output changes.

In [2]:
np.set_printoptions(precision=3, suppress=True)

Multidimensional Arrays¶

In NumPy, arrays are the core concept and the foundation of everything the library does. A NumPy array — officially called an ndarray (n-dimensional array) — is a powerful and efficient data structure that can represent data in one or more dimensions. For example, a 1D array is like a list of numbers, a 2D array represents a matrix with rows and columns, and higher-dimensional arrays (3D, 4D, etc.) can represent complex data such as images, time series, or tensors. Unlike regular Python lists, NumPy arrays are homogeneous (all elements share the same data type) and stored in contiguous memory blocks, allowing for extremely fast numerical computations.

Multidimensional arrays are so central to NumPy because they enable vectorized operations and allow performing computations on entire datasets at once without explicit Python loops. This leads to cleaner, more concise code and significant performance gains. Arrays also provide the foundation for many advanced operations such as reshaping, broadcasting, and matrix manipulation, which we will cover later. In fact, understanding how NumPy arrays work is essential for mastering not only NumPy itself but also other scientific and machine learning libraries like PyTorch and TensorFlow, which build upon the same array-based concepts.

Basic Usage¶

Creating Arrays¶

NumPy provides several ways to create arrays, but two of the most commonly used functions are array() and asarray(). Both functions can convert existing data such as Python lists, tuples, or nested sequences into NumPy arrays. The main difference lies in how they handle existing NumPy arrays: array() always creates a new copy of the data by default, while asarray() avoids making a copy when the input is already an ndarray. This distinction can be important for performance, especially when working with large datasets, as unnecessary copying can increase memory usage and slow down computations.

In practice, array() is generally used when you want to ensure that your data is fully independent of the original source, such as when you plan to modify the array without affecting the input. On the other hand, asarray() is useful when you want to safely convert inputs to arrays while preserving memory efficiency. For example, when passing data between functions that expect NumPy arrays, np.asarray() ensures the correct type without redundant copying. Understanding the difference between these two functions helps you write more efficient and predictable code when initializing and managing data in NumPy.
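The copy-vs-no-copy behavior described above is easy to verify directly. The following is a minimal sketch (the variable names are just for illustration):

```python
import numpy as np

original = np.array([1, 2, 3])

# asarray() returns the input unchanged if it is already an ndarray ...
no_copy = np.asarray(original)
print(no_copy is original)      # True -> same object, no copy made

# ... while array() creates an independent copy by default.
independent = np.array(original)
print(independent is original)  # False -> new array with its own data

# Modifying the copy leaves the original untouched.
independent[0] = 99
print(original[0])              # still 1
```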

Let's first consider the case of creating a NumPy array from a regular Python list (or tuple). In this case, both array() and asarray() behave the same way: they create a new NumPy array that is a copy of the input data. The difference between the two functions only matters when the input is already a NumPy array. Also, when creating a NumPy array from a Python list, the list must be well-structured and consistent. This means that all elements should be of the same data type (for example, all integers or all floats). Additionally, if the list contains nested lists, each inner list must have the same length, forming a regular grid of rows and columns. If these conditions are not met, NumPy will be unable to interpret the data as a proper multidimensional array and may either create an array of type object (which is inefficient and not truly numerical) or raise an error.

The code cell below shows several example definitions of a Python list, where the first two can be converted into proper NumPy arrays, while the other two will either throw an error or result in arrays that (arguably) do not contain the expected values. You should try each definition of py_list and run the code cell to see how NumPy behaves in each case.

In [3]:
py_list =  [[2, 0, 1], [1, 3, 2]]     ## Correct format: consistent sizes, same datatype (here: int)
#py_list =  [[2, 0, 1], [1, 3, 2.0]]   ## Acceptable format: consistent sizes, all entries treated as floats/double
#py_list =  [[2, 0, 1], [1, 3]]        ## Inconsistent sizes: result is not a 2D array but 1D array with lists as entries
#py_list =  [[2, 0, 1], [1, 3, '2']]   ## Different data types: all entries are treated as string

a = np.array(py_list)

print(a)
[[2 0 1]
 [1 3 2]]

It is also possible to specify the data type of the array elements using the dtype argument in both array() and asarray(). By default, NumPy automatically infers the most suitable type based on the input data (for example, integers, floats, or strings), but you can explicitly set dtype to control how the data is stored and interpreted. For instance, using dtype=float will convert all elements to floating-point numbers, even if the original data contains integers; see the code cell below. This flexibility is especially useful when you need to ensure consistent data types for mathematical operations, improve memory efficiency, or match the requirements of specific algorithms.

In [4]:
a = np.array([[2, 0, 1], [1, 3, 2]], dtype=float)

print(a)
[[2. 0. 1.]
 [1. 3. 2.]]

While 2D arrays are easier to print and interpret, NumPy arrays can have any number of dimensions (called axes). The following example creates a 3D array, so the input is a list of lists of lists.

In [5]:
a = np.array([[[2, 0, 1], [1, 3, 2]], [[4, 4, 6], [3, 5, 1]]])

print(a)
[[[2 0 1]
  [1 3 2]]

 [[4 4 6]
  [3 5 1]]]

Describing Arrays¶

NumPy provides several convenient attributes to describe the structure and contents of an array: ndim, shape, and dtype. The ndim attribute returns the number of dimensions (axes) in the array (for example, 1 for a vector, 2 for a matrix, or more for higher-dimensional arrays). The shape attribute gives a tuple describing the size of the array along each dimension, such as (3, 4) for an array with 3 rows and 4 columns. Finally, the dtype attribute specifies the data type of the array's elements, such as int32, float64, or bool, indicating how the data is stored in memory. Together, these attributes provide a complete description of a NumPy array's structure, helping you understand its dimensionality, layout, and element type; all of which are crucial for performing correct and efficient numerical computations.

To show some examples, let's first create a simple 3D array a. The various definitions of a below differ with respect to the specified data type. You are encouraged to try each definition of a to see how it affects the outputs of subsequent code cells.

In [6]:
a = np.array([[[2, 0, 1], [1, 3, 2]], [[4, 4, 6], [3, 5, 1]]], dtype=np.int64)
#a = np.array([[[2, 0, 1], [1, 3, 2]], [[4, 4, 6], [3, 5, 1]]], dtype=np.int32)
#a = np.array([[[2, 0, 1], [1, 3, 2]], [[4, 4, 6], [3, 5, 1]]], dtype=np.float32)

Using np.array.ndim we can now ask for the number of dimensions (axes) of our array a — of course, for this simple example where we created a manually, we already know that the array has 3 axes.

In [7]:
print(f"Number of axes: {a.ndim}")
Number of axes: 3

Similarly, we can use np.array.dtype to get the data type of the array. More information about NumPy data types can be found in the official NumPy documentation.

In [8]:
print(f"Data type: {a.dtype}")
Data type: int64

While ndim gives us the number of dimensions/axes, we also often need to know the size of each axis. This information comes from the shape of a NumPy array, represented as a tuple of integers. For example, a 1D array with 5 elements has a shape of (5,), while a 2D array with 3 rows and 4 columns has a shape of (3, 4). In terms of code, array.shape returns the shape of a NumPy array — as shown below for our array a.

In [9]:
print(a.shape)
(2, 2, 3)

The shape essentially tells you how the data is organized in memory and determines how operations like reshaping, broadcasting, or indexing can be applied. Understanding an array's shape is fundamental when working with NumPy, as many array operations require matching or compatible shapes to function correctly; we will cover concrete examples later in the notebook.

Side note: When working with higher-dimensional arrays in NumPy, the traditional terms "rows" and "columns" quickly become insufficient and even confusing. These terms are meaningful for 2D data, such as matrices, where we can visualize data arranged in rows and columns. However, once we move beyond two dimensions, there is no intuitive concept of rows or columns anymore. Instead, each additional dimension adds another level of structure to the data that cannot be accurately described using just "rows" and "columns". For this reason, it is more meaningful and precise to use the terms "dimensions" and "axes". This way of describing arrays scales naturally to any number of dimensions and provides a consistent framework for reasoning about multidimensional data operations such as slicing, reshaping, and broadcasting.

Auxiliary Methods for Array Creation¶

In addition to creating arrays from existing data using array() or asarray(), NumPy provides a variety of auxiliary methods that allow you to generate arrays of a specific form quickly and efficiently. These methods are especially useful for initializing arrays when the exact values are not yet important, or when you need arrays with predictable patterns for testing, prototyping, or mathematical operations. Examples include zeros() to create arrays filled with zeros, ones() for arrays filled with ones, arange() for sequences of evenly spaced values, linspace() for linearly spaced values over a range, and eye() for identity matrices. Using these specialized methods not only saves time but also ensures that the resulting arrays have the correct shape, data type, and structure, providing a solid foundation for further computation.

Let's start with np.zeros() to create an array with all entries being 0; a very common way to initialize an array. The main input parameter is the shape of the resulting array as a tuple.

In [10]:
a = np.zeros((3,5))

print(a) 
[[0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0.]]

Similarly, ones() creates an array with all entries being 1. The main input parameter is again the shape of the resulting array as a tuple.

In [11]:
a = np.ones((3,5))

print(a) 
[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]]

Instead of creating an array with all entries being 0 or 1, with full() we can create arrays where all entries have a specified value of our choice. Here, apart from the shape of the resulting array as a tuple, we also need to specify the fill value.

In [12]:
a = np.full((3,5), 5.8)

print(a) 
[[5.8 5.8 5.8 5.8 5.8]
 [5.8 5.8 5.8 5.8 5.8]
 [5.8 5.8 5.8 5.8 5.8]]

Lastly, instead of fixed values, NumPy also provides auxiliary methods to initialize arrays with random values. In the code cell below, random.rand creates an array with all entries being random values between $0$ and $1$. The main input parameter is the shape of the resulting array. There are several related methods to generate random values, e.g., random.randint, random.randn, and many more.

In [13]:
a = np.random.rand(3,5)

print(a)  
[[0.959 0.723 0.926 0.416 0.106]
 [0.064 0.577 0.915 0.6   0.473]
 [0.241 0.434 0.46  0.743 0.107]]
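The related random methods mentioned above differ mainly in the distribution they sample from. The following is a brief sketch of two of them:

```python
import numpy as np

# randint(low, high, size): uniformly distributed integers in [low, high)
ints = np.random.randint(0, 10, size=(2, 3))
print(ints)

# randn(d0, d1, ...): samples from the standard normal distribution
# (note: the shape is given as separate arguments, not as a tuple)
normals = np.random.randn(2, 3)
print(normals)
```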

The arange() method in NumPy is used to create arrays with evenly spaced values within a specified range. It works similarly to Python's built-in range() function but returns a NumPy array instead of a list, which allows for efficient numerical computations. The method typically takes three arguments:

  • start (the first value, inclusive)
  • stop (the end value, exclusive)
  • step (the spacing between values, defaulting to 1).

For example, arange(0, 10, 2) creates the array [0, 2, 4, 6, 8]. Because it returns a NumPy array, the resulting values can be directly used in mathematical operations, indexing, and broadcasting, making arange() a convenient tool for generating sequences of numbers for computations or simulations.

In [14]:
a = np.arange(0, 10, 2)

print(a)
[0 2 4 6 8]

The linspace() method in NumPy is used to create arrays of evenly spaced numbers over a specified interval, similar to arange(), but with a key difference: instead of specifying the step size, you specify the number of values you want in the array. For example, linspace(0, 1, 5) generates the array [0., 0.25, 0.5, 0.75, 1.], producing exactly 5 equally spaced values between 0 and 1, inclusive.

In [15]:
a = np.linspace(0, 1, 5)

print(a)
[0.   0.25 0.5  0.75 1.  ]

The main difference from arange() is that arange() requires a fixed step size, which may result in a number of elements that depends on the interval and step, and may sometimes exclude the end point due to floating-point rounding. In contrast, linspace() guarantees a specific number of points, and by default includes the end point, making it particularly useful for creating arrays for plotting, interpolation, or any scenario where a fixed number of samples over a range is desired.
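The endpoint behavior can be seen directly by comparing the two methods over the same interval:

```python
import numpy as np

# arange() with a float step excludes the stop value ...
a = np.arange(0, 1, 0.25)
print(a)    # [0.   0.25 0.5  0.75]

# ... while linspace() includes it by default and guarantees the count.
b = np.linspace(0, 1, 5)
print(b)    # [0.   0.25 0.5  0.75 1.  ]

# linspace(..., endpoint=False) mimics the arange() behavior.
c = np.linspace(0, 1, 4, endpoint=False)
print(c)    # [0.   0.25 0.5  0.75]
```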

The last auxiliary method we look at is eye(), which creates an array representing an identity matrix. The main input parameter is the size of the matrix. Note that an identity matrix is a square 2D matrix, so a single integer value is sufficient.

In [16]:
a = np.eye(3)

print(a)  
[[1. 0. 0.]
 [0. 1. 0.]
 [0. 0. 1.]]

In short, NumPy provides a variety of auxiliary methods for creating arrays that serve common and practical purposes. These methods allow you to quickly generate arrays with specific patterns, fixed values, or random numbers without manually specifying each element. They are especially useful for initializing arrays for computations, testing, or simulations, ensuring that arrays have the desired shape, size, and data type from the start. By using these methods, you can write cleaner, more efficient code and focus on the operations and algorithms rather than manually constructing arrays.

Views of Arrays¶

Once we have an array, we typically want to manipulate it either by changing its shape or its values — as we will see in subsequent sections. When manipulating arrays, we need to consider the concept of a view. A view of an array is a new array object that shares the same data as the original array but may have a different shape, type, or indexing. This means that a view does not copy the underlying data but provides a different way of looking at (or "viewing") the same data in memory.

As a consequence, when you modify the elements of a view, the changes are reflected in the original array, and vice versa, because both arrays refer to the same data buffer. However, since the view is a separate object, you can modify its metadata (like shape or strides) independently. It is therefore important to keep in mind that some array manipulation methods return a view, while others return a copy, depending on whether the operation can safely share the same underlying data. Methods like reshaping, slicing, or transposing often return views, meaning they create a new array object that references the same data in memory without duplication. In contrast, operations that require rearranging or modifying the actual data layout, such as fancy indexing, concatenation, or copy(), return copies that have their own independent memory. Understanding this distinction is important for writing memory-efficient and predictable code. We will see examples for both cases throughout the notebook.
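A minimal sketch of this difference: slicing returns a view, while fancy indexing returns a copy.

```python
import numpy as np

a = np.arange(6)       # [0 1 2 3 4 5]

view = a[1:4]          # slicing -> view on the same data
view[0] = 99
print(a)               # [ 0 99  2  3  4  5] -> change is visible in a

copy = a[[1, 2, 3]]    # fancy indexing -> independent copy
copy[0] = -1
print(a)               # unchanged by the modification of the copy
```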


Array Manipulation¶

NumPy provides a series of useful methods to manipulate arrays, where the manipulation does not involve changing individual elements but rather the shape of the array. Some of the most common array manipulation methods in NumPy are those that allow you to reshape, combine, split, or otherwise reorganize arrays. Key methods include:

  • transpose(): swaps or permutes the axes of an array, commonly used for matrices.

  • reshape(): changes the shape of an array without altering its data, useful for converting between different dimensions.

  • flatten() / ravel(): convert a multidimensional array into a 1D array.

  • concatenate() / stack() / hstack() / vstack(): combine multiple arrays along a specified axis.

  • split() / hsplit() / vsplit(): divide arrays into smaller sub-arrays.

  • resize(): changes the size of an array, which may alter its contents if expanded or truncated.

These methods are essential for preparing data, adjusting array layouts for computations, and ensuring arrays are compatible for operations such as broadcasting, mathematical calculations, or machine learning workflows. They form the backbone of array manipulation in NumPy and are widely used in scientific computing and data processing.

Transposing Arrays¶

Transposing a multidimensional array in NumPy means rearranging its axes, effectively changing the order in which data is indexed. For two-dimensional arrays (matrices), this operation swaps rows and columns — for example, an element at position (i, j) becomes (j, i). However, in higher-dimensional arrays, transposition generalizes this idea by permuting the array's axes according to a specified order. NumPy provides the transpose() method (or the shorthand .T for 2D arrays) to perform this transformation efficiently without copying the data in memory.

The example in the code cell below transposes a 2D array (i.e., a matrix), as should be familiar from your Linear Algebra classes. Notice the different ways to express this operation.

In [17]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

a_transposed = a.T
#a_transposed = a.transpose()
#a_transposed = np.transpose(a)
print(f"Transposed array (shape: {a_transposed.shape}):\n{a_transposed}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Transposed array (shape: (4, 3)):
[[ 1  5  9]
 [ 2  6 10]
 [ 3  7 11]
 [ 4  8 12]]

This idea generalizes to arrays with more than 2 dimensions/axes. Let's create a 4D array and transpose it; since we do not care about the actual values but only about the shape of the array, we can simply use ones() for this example.

In [18]:
a = np.ones((2,3,4,5))
print(f"Shape of original array:\n{a.shape}\n")

a_transposed = a.transpose()
print(f"Shape of transposed array:\n{a_transposed.shape}")
Shape of original array:
(2, 3, 4, 5)

Shape of transposed array:
(5, 4, 3, 2)

In simple terms, by default, transposing an array reverses the order of all axes. However, we can also explicitly specify the new order of the axes by providing a tuple. To give an example, in the code cell below, we again first create a 4D array (containing only $1$s) but then swap only the first axis (Index 0) and the last axis (Index 3).

In [19]:
a = np.ones((2,3,4,5))
print(f"Shape of original array:\n{a.shape}\n")

a_transposed = a.transpose((3,1,2,0))
print(f"Shape of transposed array:\n{a_transposed.shape}")
Shape of original array:
(2, 3, 4, 5)

Shape of transposed array:
(5, 3, 4, 2)

Transposing multidimensional arrays is important because it allows you to change the orientation of data, which is often required to perform mathematical operations or align arrays with different shapes. Many algorithms, especially in linear algebra, data processing, and machine learning, assume that data follows a specific axis order (for example, treating rows as samples and columns as features). Transposing helps ensure the data fits these expected formats without duplicating or reshaping the underlying data in memory, making it both efficient and flexible.

In practice, common use cases include preparing data for matrix multiplication (where dimensions must align), converting between row-major and column-major formats, manipulating images or tensors in deep learning (e.g., changing from channel-first to channel-last layouts), and performing operations like dot products or broadcasting that require specific dimension orders. It is also essential in scientific computing when handling multidimensional datasets such as time-series, spatial grids, or simulation data, where axis alignment determines how computations are applied.
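For instance, converting an image from a channel-first to a channel-last layout, a common step in deep learning pipelines, is a single axis permutation. A sketch with a dummy image (the sizes are arbitrary):

```python
import numpy as np

# Dummy RGB image in channel-first layout: (channels, height, width)
img_chw = np.zeros((3, 32, 64))

# Permute the axes to channel-last layout: (height, width, channels)
img_hwc = img_chw.transpose((1, 2, 0))

print(img_chw.shape)  # (3, 32, 64)
print(img_hwc.shape)  # (32, 64, 3)
```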

Reshaping Arrays¶

Reshaping multidimensional arrays in NumPy means changing the way data is organized into dimensions (or axes) without altering the underlying elements. In other words, the total number of elements in the array remains the same, but their arrangement into rows, columns, or higher dimensions changes. This is done using the reshape() method, which allows you to specify a new shape that is compatible with the original number of elements. For example, an array with shape (4, 3) can be reshaped into (3, 4) or (3, 2, 2), (6, 2), etc. since all those configurations still contain $12$ elements — in other words, the product of all axis sizes results in $12$.

To illustrate this, let's first create a (4, 3) array and reshape it to shape (3, 4); see below.

In [20]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

a_reshaped = a.reshape(4,3)
#a_reshaped = np.reshape(a, (4,3))
print(f"Reshaped array (shape: {a_reshaped.shape}):\n{a_reshaped}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Reshaped array (shape: (4, 3)):
[[ 1  2  3]
 [ 4  5  6]
 [ 7  8  9]
 [10 11 12]]

Important: Notice that the shape of the reshaped array is the same as after using transpose() on the same input array. However, the two resulting arrays differ with respect to their elements. This means that these are not equivalent operations, and you should never use np.reshape() to swap the axes of an array.

The reshape() method returns a view of the original array whenever possible, meaning it does not copy the underlying data if the new shape is compatible with the array's memory layout. However, if a view cannot be created (for example, when the desired shape would require elements to be stored in a different memory order) then the method returns a copy instead.
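Whether reshape() returned a view or a copy can be checked by modifying the result and inspecting the original array; a short sketch:

```python
import numpy as np

a = np.arange(12).reshape(3, 4)

# Contiguous case: reshape() returns a view, so changes propagate.
b = a.reshape(2, 6)
b[0, 0] = 99
print(a[0, 0])   # 99 -> b shares memory with a

# Non-contiguous case: reshaping a transposed array forces a copy.
c = a.T.reshape(-1)
c[0] = -1
print(a[0, 0])   # still 99 -> c has its own data
```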

As mentioned above, as long as the product of the axis sizes matches, the number of dimensions of the new shape does not matter. All the examples in the code below are valid ways to reshape our (3, 4) array, as the product of all new axis sizes is $12$. Of course, in practice, reshaping should result in meaningful new arrays.

In [21]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

# All the commands below will work just fine.
a_reshaped = a.reshape(6,2)
#a_reshaped = a.reshape(2,6)
#a_reshaped = a.reshape(3,2,2)
#a_reshaped = a.reshape(1,1,6,1,1,2,1,1)
#a_reshaped = a.reshape(2,1,3,2,1)
#a_reshaped = a.reshape(1,12)
#a_reshaped = a.reshape(1,1,12)
#a_reshaped = a.reshape(1,1,1,12)
#a_reshaped = a.reshape(1,1,1,1,12)
#...

print(f"Reshaped array (shape: {a_reshaped.shape}):\n{a_reshaped}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Reshaped array (shape: (6, 2)):
[[ 1  2]
 [ 3  4]
 [ 5  6]
 [ 7  8]
 [ 9 10]
 [11 12]]

Just to give an example, the following reshaping attempts fail since the product of the dimensions of the new shape is not 12.

In [22]:
#a.reshape(2, 1, 5)  # <-- This will fail (product is 10)
#a.reshape(8, 2)  # <-- That will fail (product is 16)

In practice, the size of an array may not be known ahead of time, making it difficult to guarantee that a new shape will be valid. reshape() therefore accepts the special dimension size -1, telling the method to calculate the size of that dimension automatically. A very common use case is to flatten a multidimensional array into a 1D array, where we do not really care about the number and sizes of the original dimensions. We can do this for our example array a as follows:

In [23]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

a_reshaped = a.reshape(-1)
print(f"Reshaped array (shape: {a_reshaped.shape}):\n{a_reshaped}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Reshaped array (shape: (12,)):
[ 1  2  3  4  5  6  7  8  9 10 11 12]

The -1 parameter can also be used in different parts of the new shape. For example, let's assume we need to reshape our (3, 4) array into another 3D array with the first and last axis being of size $2$. This means we can use -1 to automatically calculate the size of the remaining dimensions; which here is $3$ since $2\times 3\times 2 = 12$.

In [24]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

a_reshaped = a.reshape(2,-1,2)
print(f"Reshaped array (shape: {a_reshaped.shape}):\n{a_reshaped}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Reshaped array (shape: (2, 3, 2)):
[[[ 1  2]
  [ 3  4]
  [ 5  6]]

 [[ 7  8]
  [ 9 10]
  [11 12]]]

It is easy to see that -1 can only be used once; otherwise the calculation of the missing dimensions would generally be ambiguous. Also, it must be possible to find a missing dimension size such that the product of all dimensions matches. As such, the following two examples will fail:

In [25]:
#a.reshape(-1, 3, -1)   # ValueError: can only specify one unknown dimension
#a.reshape(-1, 3, 3)    # ValueError: cannot reshape array of size 12 into shape (3,3) -- 3*3*?=12 does not work out

Reshaping multidimensional arrays is important because it allows you to reorganize data into the structure required for specific computations, algorithms, or machine learning models; all without changing the actual data values. Many operations in scientific computing, linear algebra, or deep learning expect data in a particular shape (for example, 2D matrices for matrix multiplication or 4D tensors for image batches). Reshaping makes it easy to convert between these representations efficiently, helping ensure compatibility between different processing steps while maintaining performance.

In practice, common use cases include preparing input data for machine learning models (e.g., reshaping flat vectors into 2D or 4D tensors), converting between batches and single samples, flattening arrays before feeding them into fully connected neural network layers, or organizing data for broadcasting operations. It is also widely used in image and signal processing, where reshaping helps handle multidimensional data such as color channels, time steps, or spatial dimensions in a structured and meaningful way.

Apart from the general-purpose reshape() method, NumPy also has the two single-purpose methods flatten() and ravel() to convert a multidimensional array into a 1D array. We already saw that we can achieve this with reshape(-1); the code cell below gives us the same result using flatten().

In [26]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

a_flattened = a.flatten()
print(f"Flattened array (shape: {a_flattened.shape}):\n{a_flattened}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Flattened array (shape: (12,)):
[ 1  2  3  4  5  6  7  8  9 10 11 12]

Alternatively, we can use np.ravel() as shown below.

In [27]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

a_raveled = a.ravel()
print(f"Raveled array (shape: {a_raveled.shape}):\n{a_raveled}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Raveled array (shape: (12,)):
[ 1  2  3  4  5  6  7  8  9 10 11 12]

NumPy provides both flatten() and ravel() because they serve slightly different purposes regarding memory handling and performance: flatten() always returns a copy of the original array's data, and ravel() returns a view of the array whenever possible. In short, NumPy includes both because flatten() prioritizes safety and data integrity, while ravel() prioritizes efficiency and low memory use.
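This difference is easy to demonstrate by modifying the results and checking the original array:

```python
import numpy as np

a = np.arange(6).reshape(2, 3)

flat = a.flatten()   # always a copy
flat[0] = 99
print(a[0, 0])       # 0 -> the original is unaffected

rav = a.ravel()      # a view when possible (here: contiguous input)
rav[0] = 77
print(a[0, 0])       # 77 -> the change is visible in a
```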

Combining Arrays¶

Combining arrays in NumPy using functions like concatenate() or stack() means joining multiple arrays together into a single, larger array along a specified axis. The concatenate() function joins existing arrays along an existing dimension, while stack() creates a new dimension in the result, effectively adding another level of depth to the data structure. Both methods are used to organize and unify data stored in separate arrays for more convenient computation and analysis. The main purpose of using these functions is to efficiently assemble data without copying or manually iterating over elements. This is especially useful in scientific computing and machine learning, where data often comes in parts (such as batches, features, or samples) that need to be merged for processing.

Let's first consider the concatenate() method. It provides a flexible way to combine arrays that share the same shape in all dimensions except the one along which concatenation takes place — specified by the axis parameter. For example, assuming a 2D array (i.e., a matrix), if you concatenate along axis=0 (rows), all arrays must have the same number of columns. Also, the arrays must have compatible data types (e.g., all numeric, or all strings) so that NumPy can store them in a single resulting array. The code cell below shows an example. Since both 2D arrays a and b have the same shape, we can concatenate them along either of the two axes.

In [28]:
a = np.array([[1,1,1,1], [2,2,2,2], [3,3,3,3]])
b = np.array([[4,4,4,4], [5,5,5,5], [6,6,6,6]])
print(f"Original array a (shape: {a.shape}):\n{a}\n")
print(f"Original array b (shape: {b.shape}):\n{b}\n")

ab_concat = np.concatenate((a,b), axis=0)
print(f"Concatenated array along 1st axis (shape: {ab_concat.shape}):\n{ab_concat}\n")

ab_concat = np.concatenate((a,b), axis=1)
print(f"Concatenated array along 2nd axis (shape: {ab_concat.shape}):\n{ab_concat}\n")
Original array a (shape: (3, 4)):
[[1 1 1 1]
 [2 2 2 2]
 [3 3 3 3]]

Original array b (shape: (3, 4)):
[[4 4 4 4]
 [5 5 5 5]
 [6 6 6 6]]

Concatenated array along 1st axis (shape: (6, 4)):
[[1 1 1 1]
 [2 2 2 2]
 [3 3 3 3]
 [4 4 4 4]
 [5 5 5 5]
 [6 6 6 6]]

Concatenated array along 2nd axis (shape: (3, 8)):
[[1 1 1 1 4 4 4 4]
 [2 2 2 2 5 5 5 5]
 [3 3 3 3 6 6 6 6]]

The stack() method differs from concatenate() in that it joins arrays by adding a new dimension, while concatenate() joins arrays along an existing dimension. In other words, stack() increases the dimensionality of the output array by one, whereas concatenate() preserves the original number of dimensions. For instance, stacking two 1D arrays creates a 2D array, while concatenating them keeps the result 1D. Additionally, stack() requires that all input arrays have exactly the same shape, since it cannot merge arrays of different sizes along any axis. Let's see how this works using the same two 2D arrays a and b as before.
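To make the 1D case concrete first: concatenating two 1D arrays keeps the result 1D, while stacking them adds a new axis and yields a 2D array.

```python
import numpy as np

x = np.array([1, 2, 3])
y = np.array([4, 5, 6])

print(np.concatenate((x, y)))  # [1 2 3 4 5 6], shape (6,)
print(np.stack((x, y)))        # [[1 2 3], [4 5 6]], shape (2, 3)
```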

In [29]:
a = np.array([[1,1,1,1], [2,2,2,2], [3,3,3,3]])
b = np.array([[4,4,4,4], [5,5,5,5], [6,6,6,6]])
print(f"Original array a (shape: {a.shape}):\n{a}\n")
print(f"Original array b (shape: {b.shape}):\n{b}\n")

ab_stacked = np.stack((a,b), axis=0)
print(f"Stacked array along 1st axis (shape: {ab_stacked.shape}):\n{ab_stacked}\n")

ab_stacked = np.stack((a,b), axis=1)
print(f"Stacked array along 2nd axis (shape: {ab_stacked.shape}):\n{ab_stacked}\n")
Original array a (shape: (3, 4)):
[[1 1 1 1]
 [2 2 2 2]
 [3 3 3 3]]

Original array b (shape: (3, 4)):
[[4 4 4 4]
 [5 5 5 5]
 [6 6 6 6]]

Stacked array along 1st axis (shape: (2, 3, 4)):
[[[1 1 1 1]
  [2 2 2 2]
  [3 3 3 3]]

 [[4 4 4 4]
  [5 5 5 5]
  [6 6 6 6]]]

Stacked array along 2nd axis (shape: (3, 2, 4)):
[[[1 1 1 1]
  [4 4 4 4]]

 [[2 2 2 2]
  [5 5 5 5]]

 [[3 3 3 3]
  [6 6 6 6]]]

Notice that the stacked arrays are now 3D arrays. The stack() method is commonly needed when you want to combine multiple arrays into a single higher-dimensional array — that is, when each input array should become a distinct "slice" or layer along a new axis. This is especially useful when you have multiple arrays of identical shape that represent related data samples, channels, or time steps, and you want to treat them as a single structured dataset. Typical use cases include:

  • Creating batches of data for machine learning, where each input array represents one sample and you want a 3D array with shape (batch_size, height, width) or (batch_size, features).
  • Combining color channels in image processing (e.g., stacking red, green, and blue arrays to form an RGB image).
  • Building multi-dimensional datasets such as time series or volumetric data, where each array corresponds to a time frame or depth slice.

In short, stack() is used whenever you need to group multiple arrays of the same shape into a single, higher-dimensional structure for easier collective processing. Beyond stack(), NumPy also provides several additional methods to make common stacking tasks more convenient.
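The color-channel use case from the list above can be sketched as follows. The three 2x2 channel arrays here are made-up values for illustration; stacking them along a new last axis produces an array in the common (height, width, channels) image layout:

```python
import numpy as np

# Hypothetical 2x2 single-channel images (values chosen for illustration)
red   = np.array([[255, 0], [0, 0]])
green = np.array([[0, 255], [0, 0]])
blue  = np.array([[0, 0], [255, 0]])

rgb = np.stack((red, green, blue), axis=-1)  # the new axis becomes the last one
print(rgb.shape)   # (2, 2, 3)
print(rgb[0, 0])   # [255 0 0], i.e., the top-left pixel is pure red
```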

The methods vstack(), hstack(), and dstack() are specialized forms of stack() that simplify stacking arrays along specific, commonly used axes. Despite their names, their behavior is often closer to concatenate() with a preset axis value; they are designed to make code more readable and intuitive for particular stacking directions.

  • vstack() (vertical stack): Stacks arrays vertically, meaning along axis=0 for 1D arrays and along the first axis (rows) for higher-dimensional arrays. It is equivalent to stack(arrays, axis=0) when working with 1D data but behaves like concatenation along rows for 2D arrays.
  • hstack() (horizontal stack): Stacks arrays horizontally, meaning along axis=1 for 2D arrays (columns). For 1D arrays, it is equivalent to concatenation since they only have one axis.
  • dstack() (depth stack): Stacks arrays along the third dimension, i.e., axis=2, creating a depth-wise combination. It is commonly used for stacking 2D arrays (like image channels) into a 3D array.

The code cell below shows an example for using vstack(), hstack(), and dstack().

In [30]:
a = np.array([[1,1,1,1], [2,2,2,2], [3,3,3,3]])
b = np.array([[4,4,4,4], [5,5,5,5], [6,6,6,6]])
print(f"Original array a (shape: {a.shape}):\n{a}\n")
print(f"Original array b (shape: {b.shape}):\n{b}\n")

ab_vstacked = np.vstack((a,b))
print(f"Stacked array along 1st axis (shape: {ab_vstacked.shape}):\n{ab_vstacked}\n")

ab_hstacked = np.hstack((a,b))
print(f"Stacked array along 2nd axis (shape: {ab_hstacked.shape}):\n{ab_hstacked}\n")

ab_dstacked = np.dstack((a,b))
print(f"Stacked array along 3rd axis (shape: {ab_dstacked.shape}):\n{ab_dstacked}\n")
Original array a (shape: (3, 4)):
[[1 1 1 1]
 [2 2 2 2]
 [3 3 3 3]]

Original array b (shape: (3, 4)):
[[4 4 4 4]
 [5 5 5 5]
 [6 6 6 6]]

Stacked array along 1st axis (shape: (6, 4)):
[[1 1 1 1]
 [2 2 2 2]
 [3 3 3 3]
 [4 4 4 4]
 [5 5 5 5]
 [6 6 6 6]]

Stacked array along 2nd axis (shape: (3, 8)):
[[1 1 1 1 4 4 4 4]
 [2 2 2 2 5 5 5 5]
 [3 3 3 3 6 6 6 6]]

Stacked array along 3rd axis (shape: (3, 4, 2)):
[[[1 4]
  [1 4]
  [1 4]
  [1 4]]

 [[2 5]
  [2 5]
  [2 5]
  [2 5]]

 [[3 6]
  [3 6]
  [3 6]
  [3 6]]]

Notice how the results for vstack() and hstack() match the ones for concatenate() using axis=0 and axis=1, since we stack along an existing axis in both cases. However, since a and b are 2D arrays, dstack() stacks them along a new 3rd axis.

Splitting Arrays¶

Instead of combining multiple arrays into one, we can also split an array into multiple smaller arrays. The general purpose of splitting multidimensional arrays is to divide large datasets into smaller, manageable sub-arrays for easier processing, analysis, or computation. By breaking an array into parts, you can apply different operations to each segment, parallelize computations, or selectively manipulate sections of the data without affecting the whole array. Splitting is particularly useful when working with high-dimensional data, such as images, time series, or multi-channel signals, where processing the entire dataset at once may be inefficient or unnecessary.

Common use cases include batch processing in machine learning, where a large dataset is split into smaller batches for training; image processing, where an image array may be divided into patches for filtering or feature extraction; and data analysis, where a 2D table of data can be split into separate columns or row groups for statistical computations. Splitting is also useful for parallel computation, enabling different parts of an array to be processed concurrently across multiple cores or machines. In essence, splitting arrays allows more flexible, memory-efficient, and modular handling of multidimensional data.

Let's first consider the split() method, which is used to divide an array into multiple sub-arrays along a specified axis. It allows you to partition an array either into equal-sized sections or at specific index positions, depending on the argument provided. The basic form is split(array, indices_or_sections, axis=0), where indices_or_sections can be an integer (for equal splits) or a list of indices (to split at certain points). The axis parameter determines the direction of the split — rows (axis=0), columns (axis=1), or higher dimensions. In the code cell below we split our previous (3, 4) array row-wise (axis=0) into 3 equal parts. Naturally, since we only have 3 rows, the resulting subarrays will have only 1 row each.

In [31]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

for idx, subarray in enumerate(np.split(a, 3, axis=0)):
    print(f"Subarray {idx} (shape: {subarray.shape}):\n{subarray}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray 0 (shape: (1, 4)):
[[1 2 3 4]]

Subarray 1 (shape: (1, 4)):
[[5 6 7 8]]

Subarray 2 (shape: (1, 4)):
[[ 9 10 11 12]]

Using a value of 3 works here since the number of rows (i.e., the size of the first axis) is divisible by $3$. Instead of splitting row-wise, we can also split the same array column-wise. Let's first do this such that all resulting subarrays have only a single column. For this we have to use the value 4 and axis=1.

In [32]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

for idx, subarray in enumerate(np.split(a, 4, axis=1)):
    print(f"Subarray {idx} (shape: {subarray.shape}):\n{subarray}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray 0 (shape: (3, 1)):
[[1]
 [5]
 [9]]

Subarray 1 (shape: (3, 1)):
[[ 2]
 [ 6]
 [10]]

Subarray 2 (shape: (3, 1)):
[[ 3]
 [ 7]
 [11]]

Subarray 3 (shape: (3, 1)):
[[ 4]
 [ 8]
 [12]]

Since the original array a has four columns (i.e., the size of the 2nd axis is $4$), we can also split it so that we get two subarrays with $2$ columns each. For this, we only need to change the parameter value from 4 to 2 — which works since $4$ is divisible by $2$ and therefore ensures subarrays of equal size.

In [33]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

for idx, subarray in enumerate(np.split(a, 2, axis=1)):
    print(f"Subarray {idx} (shape: {subarray.shape}):\n{subarray}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray 0 (shape: (3, 2)):
[[ 1  2]
 [ 5  6]
 [ 9 10]]

Subarray 1 (shape: (3, 2)):
[[ 3  4]
 [ 7  8]
 [11 12]]

When we want to split an array into subarrays that are not of equal size, we need to specify a 1D array of sorted integers whose entries indicate where along the axis the array is split. Of course, these entries must be valid indices into the array along the specified axis. For example, in the code cell below we split our array a along axis=1 (columns) at indices 1 and 3. As a result, we get $3$ subarrays with $1$, $2$, and $1$ columns.

In [34]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

for idx, subarray in enumerate(np.split(a, [1,3], axis=1)):
    print(f"Subarray {idx} (shape: {subarray.shape}):\n{subarray}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray 0 (shape: (3, 1)):
[[1]
 [5]
 [9]]

Subarray 1 (shape: (3, 2)):
[[ 2  3]
 [ 6  7]
 [10 11]]

Subarray 2 (shape: (3, 1)):
[[ 4]
 [ 8]
 [12]]

Recall that split() with an integer value $k$ specifying the number of subarrays will throw an error if the size of the specified axis is not divisible by $k$. However, in practice, we often want to relax this constraint and accept that the last subarray might be smaller in case the size of the axis is not divisible by $k$. In this case, we can use array_split(). This allows us, for example, to split array a row-wise into $2$ subarrays even though it has only $3$ rows.

In [35]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

for idx, subarray in enumerate(np.array_split(a, 2, axis=0)):
    print(f"Subarray {idx} (shape: {subarray.shape}):\n{subarray}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray 0 (shape: (2, 4)):
[[1 2 3 4]
 [5 6 7 8]]

Subarray 1 (shape: (1, 4)):
[[ 9 10 11 12]]

Analogous to stack(), NumPy also provides the axis-specific splitting methods vsplit(), hsplit(), and dsplit() for convenience. For example, instead of writing split(a, 2, axis=1) we can also use hsplit(a, 2) to get the same result; just run the code cell below and compare its output with the corresponding result above.

In [36]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

for idx, subarray in enumerate(np.hsplit(a, 2)):
    print(f"Subarray {idx} (shape: {subarray.shape}):\n{subarray}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray 0 (shape: (3, 2)):
[[ 1  2]
 [ 5  6]
 [ 9 10]]

Subarray 1 (shape: (3, 2)):
[[ 3  4]
 [ 7  8]
 [11 12]]

Side note: All split methods ultimately use array slicing under the hood to create the resulting subarrays. When you split an array, NumPy does not copy the data for each piece; instead, it typically creates views that reference portions of the original array's memory using slice indices. This slicing-based approach makes splitting operations very efficient, since no new data is allocated. However, if the input array is not contiguous in memory or requires reshaping for the split, NumPy may create copies instead of views. In general, though, NumPy's split methods rely on index-based slicing as their core mechanism for partitioning arrays. We cover slicing in more detail when we talk about array indexing in a later section.
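This view behavior can be checked directly: modifying a subarray returned by split() also changes the original array. A minimal sketch:

```python
import numpy as np

a = np.array([[1, 2, 3, 4], [5, 6, 7, 8], [9, 10, 11, 12]])
top, bottom = np.split(a, [1], axis=0)  # split after the first row

top[0, 0] = 99        # modify the first subarray...
print(a[0, 0])        # ...and the original array changes as well: 99
print(np.shares_memory(top, a))  # True, the subarray is a view
```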

Resizing Arrays¶

The np.resize() function is used to change the shape and size of an array. Unlike the reshape() method, which requires the total number of elements to stay the same, np.resize() can alter the total number of elements, truncating or repeating data as needed, and returns a new array with the requested shape. It is especially useful when you need a quick way to ensure consistent array sizes, though it should be used carefully since it may lead to unintended repetition or truncation of data.

The slightly more intuitive behavior of resize() is when the size and shape of the new array are smaller than those of the original array. In this case, the method simply truncates data from the original array to fit the new shape and size. The code cell below shows an example of this, where a (3, 4) array is resized to shape (2, 2), which of course can no longer hold all the entries of the original array.

In [37]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

a_resized = np.resize(a, (2,2))
print(f"Resized array (shape: {a_resized.shape}):\n{a_resized}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Resized array (shape: (2, 2)):
[[1 2]
 [3 4]]

Important: Notice how the truncation of the data is not along both axes at the same time, as you might expect. In other words, resize() does not truncate the data by simply "cutting away" the entries that are not included in the new shape, which would result in the following array:

[[1 2]
 [5 6]]

Instead, for multidimensional arrays, the method fills data in row-major (C-style) order. In simple terms, this means you can assume that the original array first gets flattened into a 1D array, which for our example array a would look as follows:

[ 1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12]

Then, the resize() method truncates this flattened array to the maximum number of entries the new array can hold. Since we resize a to a (2, 2) array, it can only hold 4 values, which will be the first 4 values of the flattened version of a. In the last step, we only need to reshape the 1D array containing the 4 remaining entries into the (2, 2) output, giving us the output from the previous code cell.
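This flatten-truncate-reshape mental model can be reproduced step by step; the sketch below rebuilds the (2, 2) result by hand and compares it to np.resize():

```python
import numpy as np

a = np.array([[1, 2, 3, 4], [5, 6, 7, 8], [9, 10, 11, 12]])

manual = a.flatten()[:4].reshape(2, 2)   # flatten, keep the first 4, reshape
print(manual)                            # [[1 2] [3 4]]
print(np.array_equal(manual, np.resize(a, (2, 2))))  # True
```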

resize() also allows us to resize an array to any larger shape and size (in terms of the number of entries). If the new size is larger than the original, the method automatically repeats the data to fill the new array. The code cell below shows how this works.

In [38]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

a_resized = np.resize(a, (4,5))
print(f"Resized array (shape: {a_resized.shape}):\n{a_resized}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Resized array (shape: (4, 5)):
[[ 1  2  3  4  5]
 [ 6  7  8  9 10]
 [11 12  1  2  3]
 [ 4  5  6  7  8]]

While maybe not as intuitive, this repetition of entries is consistent with the behavior when truncating entries. Again, first assume a gets flattened into a 1D array containing all $3\times 4 = 12$ entries (see above). However, now the size of the output array is larger, since we specify a shape of (4, 5), which holds $20$ entries. Therefore, the method simply starts repeating entries from the beginning, giving us the following new 1D array:

[ 1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 1, 2, 3, 4, 5, 6, 7, 8]

Reshaping this new 1D array to (4, 5) then gives us the final output of the resize() method.
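Again, this flatten-repeat-reshape model can be reproduced by hand; the sketch below uses np.tile() to repeat the flattened entries before truncating to 20 values and reshaping:

```python
import numpy as np

a = np.array([[1, 2, 3, 4], [5, 6, 7, 8], [9, 10, 11, 12]])

flat = a.ravel()                  # the 12 original entries
repeated = np.tile(flat, 2)[:20]  # repeat from the beginning, keep 20 entries
manual = repeated.reshape(4, 5)
print(np.array_equal(manual, np.resize(a, (4, 5))))  # True
```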

Note that in both previous examples, we kept the number of axes the same — the original array a and both resized versions were 2D arrays. However, this is not a mandatory requirement, and basically any output shape and size is possible. Based on the idea of first flattening the input array to a 1D array, truncating or repeating entries, and then reshaping the 1D array to the specified target shape, you should easily see how this works in the general case. Still, let's consider one more example:

In [39]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Original array (shape: {a.shape}):\n{a}\n")

a_resized = np.resize(a, (4,2,5))
print(f"Resized array (shape: {a_resized.shape}):\n{a_resized}\n")
Original array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Resized array (shape: (4, 2, 5)):
[[[ 1  2  3  4  5]
  [ 6  7  8  9 10]]

 [[11 12  1  2  3]
  [ 4  5  6  7  8]]

 [[ 9 10 11 12  1]
  [ 2  3  4  5  6]]

 [[ 7  8  9 10 11]
  [12  1  2  3  4]]]

Just looking at these examples, it should be obvious that resizing should be used with care, since it can change the total number of elements, potentially leading to data loss or unintended duplication. If the new size is smaller, excess elements are discarded, and if it is larger, the function repeats existing data to fill the new shape, which can produce misleading or meaningless values. Also note the difference between the np.resize() function used above, which returns a new array, and the ndarray.resize() method, which modifies the original array in place, pads with zeros instead of repeating data, and will raise an error if the array's memory is shared (e.g., if it is referenced by a view). For these reasons, resizing is powerful but potentially destructive, so best use it only when you are sure that altering the data and its shape will not cause inconsistencies.
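The difference between the function and the method can be seen in a small sketch: np.resize() returns a new array and repeats data to fill it, while the ndarray.resize() method changes the array in place and pads with zeros (refcheck=False is passed here to sidestep reference checks in interactive environments):

```python
import numpy as np

a = np.arange(1, 7)                # [1 2 3 4 5 6]

grown = np.resize(a, (2, 4))       # function: new array, data is repeated
print(grown)                       # [[1 2 3 4] [5 6 1 2]]

b = np.arange(1, 7)
b.resize((2, 4), refcheck=False)   # method: in place, padded with zeros
print(b)                           # [[1 2 3 4] [5 6 0 0]]
```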


Array Indexing¶

Array indexing refers to the process of accessing or modifying specific elements, axes, or subarrays within a larger array using indices. It allows users to retrieve or manipulate data efficiently without the need for explicit loops. The main purpose of array indexing is to enable efficient data manipulation and analysis by providing direct, fine-grained control over array elements. It is essential for tasks like filtering, reshaping, or updating values in large datasets. Array indexing in NumPy can be done using different methods:

  • Integer indexing: Integer indexing allows you to access individual elements or subsets of an array by specifying the indices explicitly. You can use a single integer to access a specific element or use an array of integers to access multiple elements simultaneously.

  • Slicing: Slicing is a common indexing technique that allows you to extract a contiguous portion of an array. It involves specifying a range of indices using the colon (:) symbol. Slicing can be used to retrieve rows, columns, or sub-arrays from a larger array.

  • Boolean indexing: Boolean indexing enables you to select elements from an array based on a given condition or a boolean mask. You can create a boolean mask by applying a logical condition to the array, and then use the mask to extract elements that satisfy the condition.

  • Fancy indexing: Fancy indexing refers to indexing an array using an array of indices or a boolean mask. It allows for advanced indexing operations, such as selecting specific rows or columns in a specific order or combining multiple indexing techniques.

Array indexing in NumPy is highly flexible and allows for both read and write operations. You can access and modify individual elements, extract subsets, or assign new values to specific locations within an array. This versatility makes array indexing a powerful tool for data manipulation and analysis.
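As a quick preview of the write side, the same index expressions can appear on the left-hand side of an assignment:

```python
import numpy as np

a = np.array([[1, 2, 3, 4], [5, 6, 7, 8], [9, 10, 11, 12]])

a[0, 0] = 99   # overwrite a single element
a[1] = 0       # overwrite an entire row (the scalar is broadcast)
print(a)
```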

Integer Indexing¶

The most basic way to access array elements is by using scalar values to express the array indices. This is similar to indexing basic lists of lists in Python but also provides a simplified and more convenient notation. In the example below, we extract the value located at the 3rd entry (Index 2) with respect to the first axis and the 2nd entry (Index 1) with respect to the second axis.

In [40]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

#value = a[2][1]  # Notation for basic Python lists of lists; valid notation for NumPy arrays as well but less common
value = a[2,1]  # More common and more convenient notation for NumPy arrays
#value = a[3,1]  # Will throw an out-of-bounds error

print(f"Value: {value}")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Value: 10

Note that we do not necessarily have to specify an index for every axis. For example, if we specify only a single integer index for our 2D array, we get the complete entry along that axis (i.e., all values with respect to the remaining axes), which in the simple example below using our common 2D array a is simply the first row.

In [41]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

print(f"Values: {a[0]}")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Values: [1 2 3 4]

If we want to get the first column instead of the first row of a, we first have to understand slicing.

Slicing¶

Slicing in NumPy is a technique used to access a contiguous subset of elements from an array by specifying index ranges along one or more dimensions. It uses the familiar Python slice notation start:stop:step, allowing you to extract rows, columns, or subarrays efficiently without copying data. Because slicing typically returns a view rather than a copy, it provides a lightweight way to work with portions of large datasets while maintaining memory efficiency. The main purpose of slicing in multidimensional arrays is to simplify data selection and manipulation. It enables you to focus on specific regions of an array, such as subsets of images, time windows in signals, or particular features in datasets, without looping through elements manually.

Each slice indexes the elements with respect to only one axis (dimension). So an $n$-dimensional array may require the definition of $n$ slices. For example, if we want to get the first $2$ rows from our 2D array a, we can do this in two different ways:

In [42]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[0:2]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")

subarray = a[0:2,:]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (2, 4)):
[[1 2 3 4]
 [5 6 7 8]]

Subarray (shape: (2, 4)):
[[1 2 3 4]
 [5 6 7 8]]

Since we are only interested in slicing along the first axis, we can actually omit the slice for the second axis. However, we can also add the slice for the second axis, which is just : (or ::), since we want all entries with respect to the second axis. In contrast, if we want to, say, get the first $2$ columns (axis=1), we have to specify the slice for the first axis (axis=0) to avoid any ambiguity.

In [43]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[:,0:2]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (3, 2)):
[[ 1  2]
 [ 5  6]
 [ 9 10]]

Of course, we can use restrictive slices regarding all dimensions. For example, in the code cell below, we extract all values that refer to the first $2$ entries with respect to both axes.

In [44]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[0:2,0:2]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (2, 2)):
[[1 2]
 [5 6]]

As it is already common for standard Python lists, the indexing can also be done with respect to the end of arrays.

In [45]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[-2:,-2:]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (2, 2)):
[[ 7  8]
 [11 12]]

Slicing is a very powerful and flexible way to index multidimensional arrays. These different ways of slicing can be arbitrarily combined to extract the relevant elements from an array. To show a last example, the code cell below uses slicing to access every other column of the first $2$ rows of our 2D array a.

In [46]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[0:2,::2]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (2, 2)):
[[1 3]
 [5 7]]

Since slicing uses only start, stop, and step for indexing, the result will always be a regular subarray of the original array. That means, for example, it is not possible to return an array with an arbitrary order of the elements for each dimension. In more detail, slicing can only extract regular, evenly spaced regions of an array, defined by continuous ranges and constant step sizes, so it cannot directly select arbitrary or non-contiguous elements. In such cases, advanced indexing methods like integer array indexing or boolean indexing are required (see below).

Another limitation is that slicing typically returns a view rather than a copy, meaning changes to the sliced array will modify the original data. While this improves memory efficiency, it can lead to unintended side effects if you modify slices unintentionally. Additionally, slices cannot change the shape or structure of the array beyond simple subsetting, and using negative steps or complex slice combinations may sometimes produce confusing results if not handled carefully.
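The side-effect behavior is easy to demonstrate: writing into a slice modifies the original array, while an explicit .copy() decouples the two. A minimal sketch:

```python
import numpy as np

a = np.array([[1, 2, 3, 4], [5, 6, 7, 8], [9, 10, 11, 12]])

s = a[0:2, 0:2]   # a view onto a
s[0, 0] = 99      # writes through to the original
print(a[0, 0])    # 99

c = a[0:2, 0:2].copy()  # an independent copy
c[0, 0] = -1
print(a[0, 0])    # still 99, the original is unaffected
```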

Integer Array Indexing¶

Integer array indexing in NumPy is an advanced form of indexing that allows you to select arbitrary elements from an array using arrays of integer indices. Unlike slicing, which only extracts contiguous regions, integer array indexing can pick elements from any positions in any order. The purpose of integer array indexing is to enable non-contiguous, selective, and repeatable access to array elements, which is especially useful in data manipulation, sampling, or reshaping tasks. Because NumPy evaluates integer indexing efficiently, it allows complex element selection without the need for explicit loops, making it both concise and performant.

To give a simple example, the code cell below shows how to extract the last and the first row from our input array a. Notice how integer array indexing now allows us to change the order of the rows (compared to just slicing).

In [47]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[[-1,0]]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (2, 4)):
[[ 9 10 11 12]
 [ 1  2  3  4]]

To get the last and the first columns (Axis 1) instead of the rows (Axis 0) from a, we can combine integer array indexing with slicing to specify that we want all entries with respect to the first axis.

In [48]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[:,[-1,0]]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (3, 2)):
[[ 4  1]
 [ 8  5]
 [12  9]]

Of course, we can now also use integer arrays for more than just one dimension. In the example below, we combine the two previous examples by using the index array [-1,0] for both rows and columns (i.e., Axis 0 and Axis 1). Before looking at the output, first think about what result you would expect from this operation.

In [49]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[[-1,0], [-1,0]]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (2,)):
[12  1]

This result is arguably not that intuitive. However, it becomes clearer when the integer array indexing is rewritten as multiple basic integer indexing operations — which is what is going on under the hood when using multiple index arrays for different axes. In short, when multiple integer index arrays are used for different axes, the arrays are combined element-wise to select elements from the array. This means that NumPy pairs elements from each index array based on their position in the arrays: the first elements of each index array select one element, the second elements select another, and so on. The code cell below illustrates this.

In [50]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = np.array([a[-1,-1], a[0,0]])
print(f"Subarray (shape: {subarray.shape}):\n{subarray}\n")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (2,)):
[12  1]

Of course, this implies that each index array must have the same shape (or be broadcastable to a common shape — we talk about broadcasting further below), and the resulting selection corresponds to the combination of all positions according to that shape. For example, the following statement would throw an error since no element-wise combination is possible:

In [51]:
#subarray = a[[2,1], [0,3,1]]   # np.array([a[2,0], a[1,3], a[?,1]])
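When the index arrays are broadcastable rather than identically shaped, NumPy first broadcasts them to a common shape and then pairs the entries element-wise. For example, a (2, 1) row index combined with a (2,) column index yields a (2, 2) selection:

```python
import numpy as np

a = np.array([[1, 2, 3, 4], [5, 6, 7, 8], [9, 10, 11, 12]])

rows = np.array([[0], [2]])   # shape (2, 1)
cols = np.array([1, 3])       # shape (2,), broadcast against rows

print(a[rows, cols])          # shape (2, 2): rows 0 and 2, columns 1 and 3
# [[ 2  4]
#  [10 12]]
```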

Boolean Indexing¶

Boolean indexing is an advanced indexing technique that uses boolean arrays (arrays of True and False values) to select elements from another array. Each boolean value indicates whether the element at the same position should be included in the result, where True means "select this element" and False means "skip it". The main purpose of boolean indexing is to filter or extract elements that satisfy specific conditions without writing explicit loops.

A boolean index is an array of the same shape as the input array — or one broadcastable to it (discussed later) — with all elements being True (element fulfills condition) or False (element does not fulfill condition). For example, given our 2D array a and a condition a > 5, the resulting boolean index looks as follows:

In [52]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

boolean_index = (a > 5)

print(f"Boolean index (shape: {boolean_index.shape}):\n{boolean_index}")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Boolean index (shape: (3, 4)):
[[False False False False]
 [False  True  True  True]
 [ True  True  True  True]]

Now this boolean index can be used to get all the elements from the array a where the respective element in the boolean index is True:

In [53]:
subarray = a[boolean_index]

print(f"Subarray (shape: {subarray.shape}): {subarray}")
Subarray (shape: (7,)): [ 6  7  8  9 10 11 12]

Important: Note that the resulting array is a 1D-array since the distribution of True and False values generally does not induce a valid multidimensional array structure (see the example boolean_index above). In practice, the two statements above can be combined into one to make the code more concise:

In [54]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[a > 5]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (7,)):
[ 6  7  8  9 10 11 12]

Like other advanced indexing methods, boolean indexing is quite powerful. For example, we can combine multiple logical conditions to find values of interest. Below we use two conditions to find all values in a that are larger than 5 and also even — to check if a value is even, we can check whether the value modulo $2$ is $0$.

In [55]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[(a > 5) & (a % 2 == 0)]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (4,)):
[ 6  8 10 12]
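Boolean indexing can also appear on the left-hand side of an assignment to modify the selected elements in place — a handy pattern for clipping or cleaning data. A minimal sketch:

```python
import numpy as np

a = np.array([[1, 2, 3, 4], [5, 6, 7, 8], [9, 10, 11, 12]])

# Set every element greater than 5 to 0 in place.
a[a > 5] = 0
print(a)
# [[1 2 3 4]
#  [5 0 0 0]
#  [0 0 0 0]]
```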

Another example defines the condition on only a subset of the array. In the code cell below we again check whether the values are larger than $5$, but only in the first column of a using slicing. The result will be the last row of a; see below. Before reading the explanation of this behavior, first try to see if you can figure it out yourself.

In [56]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

subarray = a[a[:,0] > 5]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Subarray (shape: (1, 4)):
[[ 9 10 11 12]]
In [57]:
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
print(f"Array (shape: {a.shape}):\n{a}\n")

boolean_index = (a[:, 0] > 5)

print(f"Boolean index (shape: {boolean_index.shape}):\n{boolean_index}")
Array (shape: (3, 4)):
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Boolean index (shape: (3,)):
[False False  True]

The boolean index is now only a 1D array since we only consider the first column of a. This means that the shape of the boolean index and the shape of a are now different. However, both shapes are broadcast-compatible, which still allows us to use this boolean index to get the relevant values from a. More specifically, since the boolean index is of shape (3,) and a is of shape (3, 4), the index gets broadcast across all $4$ columns of a. And since the index has a True only in the last entry, we get the last entry of each column, which is simply the last row of a.

In [58]:
subarray = a[boolean_index]
print(f"Subarray (shape: {subarray.shape}):\n{subarray}")
Subarray (shape: (1, 4)):
[[ 9 10 11 12]]

We will cover the concept of broadcasting in much more detail later. However, this first example of broadcasting should already give you the basic idea.


Array Math¶

Mathematical operations in NumPy provide powerful tools to manipulate and analyze numerical data efficiently. They allow you to perform complex computations directly on arrays without the need for explicit loops. The main types of mathematical operations in NumPy include:

  • Element-wise operations perform arithmetic computations such as addition, subtraction, multiplication, division, or exponentiation on corresponding elements of arrays. These operations are fast, vectorized, and can also leverage broadcasting to work with arrays of different shapes.

  • Aggregate operations compute summary statistics or reductions over arrays, such as sum(), mean(), min(), max(), or std(). These operations condense large datasets into meaningful numerical insights.

  • Linear algebra operations go beyond element-wise computations to include operations like the dot product, matrix multiplication, transposition, and determinant calculation. These are essential for advanced numerical analysis, data transformations, and machine learning algorithms.

Let's look at these three types of operations in more detail by showing some examples.

Elementwise Operations¶

Element-wise operations in NumPy are arithmetic computations that are applied independently to each corresponding element of one or more arrays. This means that when two arrays of the same shape are combined with operators like +, -, *, /, or **, NumPy performs the operation on each pair of elements at the same position and returns a new array with the results. These operations are implemented in a vectorized manner, allowing them to execute very efficiently in compiled code without explicit Python loops. Element-wise operations form the foundation for most numerical computations in NumPy, enabling fast and expressive manipulation of large datasets.

For element-wise operations between two arrays to be valid, both arrays either have to have the same shape or the two shapes must be broadcast-compatible. We cover broadcasting in more detail later, so in the following we assume that the two arrays indeed have the same shape. With this assumption in mind, let's go through the basic math operations using two simple example arrays a and b.

In [59]:
a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])
b = np.array([[4, 1, 1, 2], [1, 4, 2, 2]])

print(f"Input array a:\n{a}\n")
print(f"Input array b:\n{b}\n")

print(f"Addition (a+b):\n{a+b}\n")
print(f"Subtraction (a-b):\n{a-b}\n")
print(f"Multiplication (a*b):\n{a*b}\n")
print(f"Division (a/b):\n{a/b}\n")
print(f"Modulo (a%b):\n{a%b}\n")
Input array a:
[[1 2 3 4]
 [2 2 3 3]]

Input array b:
[[4 1 1 2]
 [1 4 2 2]]

Addition (a+b):
[[5 3 4 6]
 [3 6 5 5]]

Subtraction (a-b):
[[-3  1  2  2]
 [ 1 -2  1  1]]

Multiplication (a*b):
[[4 2 3 8]
 [2 8 6 6]]

Division (a/b):
[[0.25 2.   3.   2.  ]
 [2.   0.5  1.5  1.5 ]]

Modulo (a%b):
[[1 0 0 0]
 [0 2 1 1]]

NumPy also provides a wide range of unary operators that perform element-wise operations on arrays, meaning each operation is applied independently to every element. Unary operators involve only one array (or operand) and include mathematical operations such as negation (-a), absolute value (np.abs(a)), square root (np.sqrt(a)), exponential (np.exp(a)), and trigonometric functions like np.sin(a) or np.cos(a). Each of these operations returns a new array where every element is the result of applying the operation to the corresponding element of the original array. The code cell below shows a few examples.

In [60]:
a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])

print(f"Input array a:\n{a}\n")

print(f"Negation:\n{-a}\n")
print(f"Absolute:\n{np.abs(a)}\n")
print(f"Square root:\n{np.sqrt(a)}\n")
print(f"Sine:\n{np.sin(a)}\n")
Input array a:
[[1 2 3 4]
 [2 2 3 3]]

Negation:
[[-1 -2 -3 -4]
 [-2 -2 -3 -3]]

Absolute:
[[1 2 3 4]
 [2 2 3 3]]

Square root:
[[1.    1.414 1.732 2.   ]
 [1.414 1.414 1.732 1.732]]

Sine:
[[ 0.841  0.909  0.141 -0.757]
 [ 0.909  0.909  0.141  0.141]]

Of course, NumPy has many more such unary operations; check out the documentation. Note that the element-wise arithmetic operations mentioned above can also be expressed using built-in functions. For example, a + b yields the same result as np.add(a, b); see below.

In [61]:
a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])
b = np.array([[4, 1, 1, 2], [1, 4, 2, 2]])

print(f"Input array a:\n{a}\n")
print(f"Input array b:\n{b}\n")

print(f"Addition (np.add(a, b)):\n{np.add(a, b)}\n")
Input array a:
[[1 2 3 4]
 [2 2 3 3]]

Input array b:
[[4 1 1 2]
 [1 4 2 2]]

Addition (np.add(a, b)):
[[5 3 4 6]
 [3 6 5 5]]

Aggregation Operations¶

Aggregation operations are operations that compute a single summary value (or a smaller set of values) from an entire array or along specific axes. Instead of operating element by element, these functions reduce an array's data into meaningful statistics or summaries. Common aggregate functions include np.sum() for summation, np.mean() for the average, np.min() and np.max() for finding extreme values, np.std() and np.var() for measuring variability, and np.median() for determining central tendency. These functions can be applied to an entire array or along a chosen axis, allowing users to summarize data across rows, columns, or higher dimensions.

In the following, let's consider np.sum() for our examples; the other aggregation operations behave the same way. First, we can sum up all the elements in an array (i.e., without specifying any axis):

In [62]:
a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])

print(f"Input array a:\n{a}\n")

print(f"Sum of all elements:\n{np.sum(a)}\n")
Input array a:
[[1 2 3 4]
 [2 2 3 3]]

Sum of all elements:
20

By specifying axis=0, we can sum elements along the first axis. This means we sum the first elements of all rows, the second elements of all rows, and so on. Hence, the result is not a single number but an array with all the sums:

In [63]:
a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])

print(f"Input array a:\n{a}\n")

print(f"Sums along Axis 0:\n{np.sum(a, axis=0)}\n")
Input array a:
[[1 2 3 4]
 [2 2 3 3]]

Sums along Axis 0:
[3 4 6 7]

Of course, we can do the same along the rows with axis=1, summing up all elements of the first row, all elements of the second row, and so on... well, our example array a has only 2 rows.

In [64]:
a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])

print(f"Input array a:\n{a}\n")

print(f"Sums along Axis 1:\n{np.sum(a, axis=1)}\n")
Input array a:
[[1 2 3 4]
 [2 2 3 3]]

Sums along Axis 1:
[10 10]

We can also sum the array entries along multiple axes at the same time. Since our example array a is of shape (2, 4) and therefore has only $2$ axes, we can only sum along Axes 0 and 1. And since a has only these two axes, summing the entries along both (i.e., all) axes simply yields the sum of all entries again, as shown in the code cell below.

In [65]:
a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])

print(f"Input array a:\n{a}\n")

print(f"Sums along Axis 0 & 1:\n{np.sum(a, axis=(0,1))}\n")
Input array a:
[[1 2 3 4]
 [2 2 3 3]]

Sums along Axis 0 & 1:
20
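The other aggregation functions follow exactly the same axis semantics. A small sketch below also shows the keepdims parameter, which preserves the reduced axis with size 1 so the result stays broadcast-compatible with the original array:

```python
import numpy as np

a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])

# Other aggregations use the same axis semantics as np.sum().
print(np.mean(a, axis=0))   # [1.5 2.  3.  3.5]
print(np.max(a, axis=1))    # [4 3]

# keepdims=True keeps the reduced axis with size 1.
print(np.sum(a, axis=1, keepdims=True).shape)  # (2, 1)
```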

Linear Algebra Operations¶

Linear algebra operations in NumPy extend array manipulation to include mathematical computations involving vectors, matrices, and higher-dimensional tensors. These operations go beyond simple element-wise arithmetic and include functions such as dot products, matrix multiplication, transposition, determinants, eigenvalue decomposition, and solving systems of linear equations. NumPy provides a dedicated module, numpy.linalg, which contains optimized routines for performing these calculations efficiently, often using highly optimized BLAS and LAPACK libraries under the hood.

To show an example, let's assume we want to calculate the following matrix-vector multiplication:

$$ \begin{bmatrix} 1 & 2 & 3 & 4 \\ 2 & 2 & 3 & 3 \end{bmatrix} * \begin{bmatrix} 1 \\ 2 \\ 3 \\ 4 \end{bmatrix} = \begin{bmatrix} 30 \\ 27 \end{bmatrix} $$

For this operation, NumPy provides the dot() method to compute the dot product.

In [66]:
matrix = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])
vector = np.array([[1], [2], [3], [4]])

print(f"Matrix:\n{matrix}\n")
print(f"Vector:\n{vector}\n")

print(f"Dot product:\n{np.dot(matrix, vector)}\n")
#print(f"Dot product:\n{matrix.dot(vector)}\n")   # Same effect
Matrix:
[[1 2 3 4]
 [2 2 3 3]]

Vector:
[[1]
 [2]
 [3]
 [4]]

Dot product:
[[30]
 [27]]

Of course, this example can easily be extended to a product between two matrices. For example, assume we now want to compute the following:

$$ \begin{bmatrix} 1 & 2 & 3 & 4 \\ 2 & 2 & 3 & 3 \end{bmatrix} * \begin{bmatrix} 4 & 1 \\ 1 & 4 \\ 1 & 2 \\ 2 & 2 \end{bmatrix} = \begin{bmatrix} 17 & 23 \\ 19 & 22 \end{bmatrix} $$

Again, we can easily compute this using the dot() method.

In [67]:
matrix1 = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])
matrix2 = np.array([[4, 1, 1, 2], [1, 4, 2, 2]]).T

print(f"Matrix 1:\n{matrix1}\n")
print(f"Matrix 2:\n{matrix2}\n")

print(f"Matrix product:\n{np.dot(matrix1, matrix2)}\n")
Matrix 1:
[[1 2 3 4]
 [2 2 3 3]]

Matrix 2:
[[4 1]
 [1 4]
 [1 2]
 [2 2]]

Matrix product:
[[17 23]
 [19 22]]

When performing matrix multiplication on arrays with more than two dimensions, the operation is applied in a batch-wise or broadcasted manner. This means that NumPy treats the last two dimensions of each array as matrices to be multiplied, while all preceding dimensions are considered as batch dimensions that are broadcasted according to standard broadcasting rules.

For example, if you have an array A of shape (2, 3, 4) and another array B of shape (2, 4, 5), NumPy will interpret each pair of $3\times 4$ and $4\times 5$ matrices as a separate multiplication for each of the two batches, producing an output of shape (2, 3, 5). This behavior allows efficient computation of multiple matrix products in parallel without using explicit loops. Here is the same example implemented using NumPy — let's ignore the exact values and focus only on the shapes:

In [68]:
A = np.random.rand(2, 3, 4)
B = np.random.rand(2, 4, 5)

C = np.matmul(A, B)
#C = A @ B  # Same effect
print(C.shape)
(2, 3, 5)

The matmul() method, available as np.matmul() or via the @ operator, is used to perform matrix multiplication. matmul() is particularly powerful for higher-dimensional arrays. For 2D arrays, it behaves like standard matrix multiplication. For arrays with more than two dimensions, it performs batch matrix multiplication, treating the last two dimensions as matrices and broadcasting over the leading dimensions. This makes it ideal for operations on batches of matrices, which are common in machine learning, physics simulations, and other applications involving multidimensional data. Here's a comparison table showing the difference between dot() and matmul() for different array dimensions:

| Array Dimensions | np.dot() Behavior | np.matmul() Behavior |
|---|---|---|
| 1D · 1D | Returns inner product (scalar) | Returns inner product (scalar) |
| 1D · 2D | Sum-product over the 1D array and the second-to-last axis of the 2D array $\rightarrow$ returns 1D vector | Treats 1D as row vector $\rightarrow$ returns 1D vector |
| 2D · 1D | Treats 1D as column vector $\rightarrow$ returns 1D vector | Treats 1D as column vector $\rightarrow$ returns 1D vector |
| 2D · 2D | Standard matrix multiplication | Standard matrix multiplication |
| ND (N>2) · ND (N>2) | No broadcasting; sum-product over last axis of A and second-to-last axis of B | Batch matrix multiplication with broadcasting over leading dimensions |
| ND · 2D / 2D · ND | Limited support; may require reshaping | Supports batch operations consistently |

This table highlights that the main advantage of matmul() is its consistent handling of higher-dimensional arrays and batch operations, whereas dot() is more limited to 1D and 2D arrays.
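The difference in the ND · ND row is easy to verify by comparing output shapes. A short sketch: for 3D inputs, matmul() batches over the leading axis, while dot() combines all leading axes of both operands:

```python
import numpy as np

A = np.random.rand(2, 3, 4)
B = np.random.rand(2, 4, 5)

# matmul() treats the leading dimension as a batch dimension.
print(np.matmul(A, B).shape)  # (2, 3, 5)

# dot() combines ALL leading axes of both operands instead:
# result shape = A.shape[:-1] + B.shape[:-2] + B.shape[-1:]
print(np.dot(A, B).shape)     # (2, 3, 2, 5)
```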


Broadcasting¶

Broadcasting in NumPy is a powerful mechanism that allows arithmetic operations to be performed on arrays of different shapes without explicitly reshaping or replicating data. The concept relies on "stretching" the smaller array along the axis where its size is 1 (or missing) so that it matches the shape of the larger array. This enables element-wise operations between arrays that would otherwise be incompatible, without consuming extra memory for repeated copies. Broadcasting is applicable whenever the shapes of two arrays are compatible according to specific rules: starting from the trailing axes, the axes must either be equal, or one of them must be $1$.

To better understand this, let's look at a concrete example where we add a (2, 4) array a and a (2, 1) array b. Although both arrays differ in the size of the second axis, the size of the second axis of b is $1$, so both shapes are broadcast-compatible. If we add both arrays, b is added to each entry of a along the second axis. Or in simple terms, since b represents a column vector, we add b to all $4$ columns of a; here is the corresponding code:

In [69]:
a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])
b = np.array([[1], [3]])

print(f"Array a (shape: {a.shape}):\n{a}\n")
print(f"Array b (shape: {b.shape}):\n{b}\n")

print(f"Sum a+b:\n{a+b}\n")
Array a (shape: (2, 4)):
[[1 2 3 4]
 [2 2 3 3]]

Array b (shape: (2, 1)):
[[1]
 [3]]

Sum a+b:
[[2 3 4 5]
 [5 5 6 6]]

We can do the same with a row vector, i.e., an array of shape (4,) or (1, 4) (both work here). Broadcasting works in this case because both arrays now match with respect to the second axis, differ with respect to the first axis, and the size of the first axis of b is $1$. This makes both shapes broadcast-compatible once again.

In [70]:
a = np.array([[1, 2, 3, 4], [2, 2, 3, 3]])
b = np.array([[1, 1, 1, 1]])  # Shape: (1, 4)
#b = np.array([1, 1, 1, 1])   # Shape: (4,) — works as well


print(f"Array a (shape: {a.shape}):\n{a}\n")
print(f"Array b (shape: {b.shape}):\n{b}\n")

print(f"Sum a+b:\n{a+b}\n")
Array a (shape: (2, 4)):
[[1 2 3 4]
 [2 2 3 3]]

Array b (shape: (1, 4)):
[[1 1 1 1]]

Sum a+b:
[[2 3 4 5]
 [3 3 4 4]]

Broadcasting also works for multidimensional arrays with more than $2$ axes, following the exact same rules. For more details, check out the documentation on broadcasting.
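As a quick sketch of the higher-dimensional case: the shapes are compared from the trailing axes backwards, and a missing leading axis is treated as size 1:

```python
import numpy as np

# Shapes (2, 3, 4) and (3, 1): compared from the trailing axes,
# 4 vs 1 -> stretch b, 3 vs 3 -> match, 2 vs (missing) -> stretch b.
a = np.ones((2, 3, 4))
b = np.arange(3).reshape(3, 1)

print((a + b).shape)  # (2, 3, 4)
```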


Arg* Methods¶

The arg* methods are functions that return the indices of elements in an array that satisfy certain conditions, rather than the values themselves. The most commonly used methods are np.argmax() and np.argmin(), which return the index of the maximum or minimum element in an array, respectively. These methods can operate on the entire array or along a specified axis in multidimensional arrays, making it easy to identify the location of extreme values in large datasets.

For a concrete example, let's consider np.argmax(). The method returns the index of the first occurrence of the maximum value in an array. It works by scanning the array (or along a specified axis for multidimensional arrays) to identify the element with the largest value and then returning its position rather than the value itself. By default, the returned index refers to the flattened version of the array, which implies that the index is always a single value. This also means that, if we want to use the index to actually get the maximum value, we need to either

  • Flatten the array so that the index/position match, or
  • Convert the scalar index to the corresponding multidimensional index with respect to the shape of the input array.

The code below shows a simple example using both approaches.

In [71]:
np.random.seed(1)
a = np.random.randint(1, 20, size=(3, 5))

print(f"Input array a:\n{a}\n")

max_idx = np.argmax(a)
max_val = a.ravel()[max_idx]
print(f"Index of the first maximum value: {max_idx} (value: {max_val})")

max_idx_multi = np.unravel_index(max_idx, a.shape)
max_val = a[max_idx_multi]
print(f"Multidimensional index of the first maximum value: {max_idx_multi} (value: {max_val})")
Input array a:
[[ 6 12 13  9 10]
 [12  6 16  1 17]
 [ 2 13  8 14  7]]

Index of the first maximum value: 9 (value: 17)
Multidimensional index of the first maximum value: (1, 4) (value: 17)

As mentioned above, we can also get the indices of the maximum values along individual axes instead of the complete array. In this case, we get multiple indices:

In [72]:
np.random.seed(1)
a = np.random.randint(1, 20, size=(3, 5))

print(f"Input array a:\n{a}\n")

print(f"Indices of maximum values for each column:\n{np.argmax(a, axis=0)}\n")
print(f"Indices of maximum values for each row:\n{np.argmax(a, axis=1)}\n")
Input array a:
[[ 6 12 13  9 10]
 [12  6 16  1 17]
 [ 2 13  8 14  7]]

Indices of maximum values for each column:
[1 2 1 2 1]

Indices of maximum values for each row:
[2 4 3]

For example, the result [1 2 1 2 1] shows the indices of the 5 maximum values for the 5 columns of a. Since the first column is [6 12 2], the maximum value is at Index 1, represented by [1 ...] and so on. Naturally, np.argmin() works exactly the same just for finding the indices of the minimum values.

Another common method is np.argsort(), which returns the indices that would sort an array. That is, the method sorts the elements of the array but returns the indices rather than the actual values. In contrast to np.argmax() and np.argmin(), np.argsort() sorts with respect to the last axis (axis=-1) by default. So to sort regardless of any axis — i.e., over the flattened array — one has to explicitly set axis=None.

In [73]:
np.random.seed(1)
a = np.random.randint(1, 20, size=(3, 5))

print(f"Input array a:\n{a}\n")

print(f"Indices of sorted array entries:\n{np.argsort(a, axis=None)}\n")
Input array a:
[[ 6 12 13  9 10]
 [12  6 16  1 17]
 [ 2 13  8 14  7]]

Indices of sorted array entries:
[ 8 10  0  6 14 12  3  4  1  5 11  2 13  7  9]

Again, the order of indices refers to a flattened version of the input array. For example, in our example array a, the smallest value is 1 and can be found at index/position 8 with respect to the flattened version of a. Thus, 8 is the first entry in the returned array of indices; see the output of the previous code cell.
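Since the indices refer to the flattened array, indexing a flattened view with them recovers the values in sorted order — a quick sanity check:

```python
import numpy as np

np.random.seed(1)
a = np.random.randint(1, 20, size=(3, 5))

# The indices from argsort(axis=None) refer to the flattened array,
# so applying them to a.ravel() yields the values in sorted order.
idx = np.argsort(a, axis=None)
print(a.ravel()[idx])
```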

When setting axis=-1 or any other valid value — here either 0 or 1 since a has only 2 axes — we get the indices that would sort the values with respect to the chosen dimension/axis. For example:

In [74]:
np.random.seed(1)
a = np.random.randint(1, 20, size=(3, 5))

print(f"Input array a:\n{a}\n")

print(f"Indices of sorted array entries (axis=1):\n{np.argsort(a, axis=1)}\n")
# np.argsort(a, axis=-1)  # Same effect since a has only the two axes 0 and 1.
Input array a:
[[ 6 12 13  9 10]
 [12  6 16  1 17]
 [ 2 13  8 14  7]]

Indices of sorted array entries (axis=1):
[[0 3 4 1 2]
 [3 1 0 2 4]
 [0 4 2 1 3]]

This result tells us that, e.g., for the first row, the smallest value (here: $6$) is at Index $0$ and the largest value (here: $13$) at Index $2$.
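To turn such per-row index arrays back into values, NumPy provides np.take_along_axis(), which applies the indices along the chosen axis — effectively sorting each row. A small sketch:

```python
import numpy as np

np.random.seed(1)
a = np.random.randint(1, 20, size=(3, 5))

# Apply the per-row index arrays from argsort() along axis 1,
# which reorders (sorts) each row of a.
idx = np.argsort(a, axis=1)
print(np.take_along_axis(a, idx, axis=1))
```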


Practical Example Use Cases¶

When you're new to NumPy (or data science with Python in general), the usefulness and power of indexing, slicing, broadcasting, and so on are unlikely to be obvious from just going through this notebook and running the basic examples. The benefits of NumPy really begin to shine when you actually use it to solve problems and perform computations on NumPy arrays. Therefore, in the last part of the notebook, we go through some concrete use cases to see how NumPy can make our lives easier. The two use cases are still very simple, but you should still be able to appreciate that solving them using NumPy yields a shorter and cleaner implementation — in practice, typically also a much faster one, although given the toy data we use here, you won't see a noticeable difference.

Finding the K-Nearest Neighbors¶

The k-nearest neighbors (k-NN) are data points in a dataset that are most similar or closest to a given query point in a feature space. In the k-NN algorithm, the k nearest neighbors are identified based on a distance metric, such as Euclidean distance or cosine similarity. These neighbors play a crucial role in making predictions or determining the similarity of the query point. The k-nearest neighbor (k-NN) problem is a widely used algorithm in machine learning and data mining. It is a non-parametric method used for classification and regression tasks. Some common applications of the k-NN problem include:

  • Classification: k-NN can be used for classifying data points into different categories. Given a new data point, the algorithm identifies the k nearest neighbors based on a distance metric (such as Euclidean distance) and assigns the class label that is most common among its k nearest neighbors.

  • Regression: In addition to classification, k-NN can also be used for regression tasks. Instead of assigning class labels, the algorithm estimates the value of a target variable based on the average or weighted average of the target values of its k nearest neighbors.

  • Recommender systems: k-NN can be applied to recommend items to users based on their similarity to other users or items. For example, in collaborative filtering, the algorithm can find similar users and recommend items that those similar users have liked or purchased.

  • Anomaly detection: k-NN can be used to identify outliers or anomalies in a dataset. The algorithm measures the distance of a data point to its k nearest neighbors, and if a point is significantly distant from its neighbors, it can be considered as an anomaly.

  • Image recognition: k-NN can be used in image recognition tasks. Given an input image, the algorithm can compare it with a set of labeled images to determine the class label of the input image based on the labels of its k nearest neighbors.

  • Text classification: k-NN can be applied to classify text documents based on their similarity. By representing documents as vectors, such as using the term frequency-inverse document frequency (TF-IDF) representation, the algorithm can find the k most similar documents and assign a class label based on those neighbors.

These are just a few examples of the many applications of the k-nearest neighbor problem. Its simplicity and effectiveness make it a popular choice in various fields where pattern recognition and similarity-based analysis are required. For the following example, we create a random dataset D of $10$ data points, each featuring $5$ attributes/features/coordinates. This means that D can be represented as a matrix (2D array) of shape (10, 5). We also need a data point x for which we want to find the k-nearest neighbors. Naturally, x must have the same $5$ attributes/features/coordinates.

In [75]:
np.random.seed(10) # Just to ensure that we get the same random numbers

D = np.random.rand(10, 5)
x = np.random.rand(5)

print('Dataset D:')
print(D) 
print()
print('Data point x:')
print(x)
Dataset D:
[[0.771 0.021 0.634 0.749 0.499]
 [0.225 0.198 0.761 0.169 0.088]
 [0.685 0.953 0.004 0.512 0.813]
 [0.613 0.722 0.292 0.918 0.715]
 [0.543 0.142 0.373 0.674 0.442]
 [0.434 0.618 0.513 0.65  0.601]
 [0.805 0.522 0.909 0.319 0.09 ]
 [0.301 0.114 0.829 0.047 0.626]
 [0.548 0.819 0.199 0.857 0.352]
 [0.755 0.296 0.884 0.326 0.165]]

Data point x:
[0.393 0.093 0.821 0.151 0.384]

Given x, we now want to find the, say, $3$ most similar data points, i.e., its $3$-nearest neighbors. Since we have numerical features, we can directly apply the Euclidean distance to measure the similarity between two data points. Given two multidimensional data points p and q with n features each, the Euclidean distance d(p, q) is defined as:

$$\large d(p, q) = \sqrt{\sum_{i=1}^n (p_i - q_i)^2} = \sqrt{(p_1 - q_1)^2 + (p_2 - q_2)^2 + \dots + (p_n - q_n)^2 } $$

Since we have $10$ data points, we will get $10$ distances from which we then pick the $3$ shortest ones. So let's first compute all the $10$ distances between x and the data points in D. Using the built-in methods and the concept of broadcasting, NumPy makes this step very straightforward. In a sense, we can directly implement the formula given above — particularly notice the first line where we use broadcasting to subtract x from all points in D; no loop or anything else required!

In [76]:
# Use broadcasting to subtract x from all data points in D
R = D - x

# Square all elements
R = np.square(R)

# Sum up all squared elements for each row
distances = np.sum(R, axis=1)

# Calculate the final square roots
distances = np.sqrt(distances)

# Print the 10 distances
print(distances)
[0.744 0.361 1.344 1.192 0.709 0.817 0.69  0.28  1.199 0.504]

Now that we have all $10$ distances, we only need to find the $3$ shortest ones. In fact, we want to find the positions/indices of the smallest values in distances as they correspond to the $3$ most similar data points. Again, NumPy has us covered.

In [77]:
# Get the indices of the 3 most similar data points
top_i = np.argsort(distances)[:3]

print(top_i)
[7 1 9]

Now we know which data points in D are the ones most similar to x. Of course, we can also print those $3$ data points:

In [78]:
D[top_i]
Out[78]:
array([[0.301, 0.114, 0.829, 0.047, 0.626],
       [0.225, 0.198, 0.761, 0.169, 0.088],
       [0.755, 0.296, 0.884, 0.326, 0.165]])
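The whole pipeline — distances, ranking, selection — can be condensed even further using np.linalg.norm(), which computes the Euclidean norm along a chosen axis and thus replaces the square/sum/sqrt steps:

```python
import numpy as np

np.random.seed(10)  # Same seed as above for reproducibility
D = np.random.rand(10, 5)
x = np.random.rand(5)

# Broadcasting subtracts x from every row; norm() reduces each row to its
# Euclidean distance; argsort() ranks them; [:3] picks the 3 nearest.
top_i = np.argsort(np.linalg.norm(D - x, axis=1))[:3]
print(top_i)  # [7 1 9]
```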

Side note: Calculating Euclidean distances between vectors is such a common task that packages such as scikit-learn provide ready-made methods for it. But note that under the hood, scikit-learn itself relies heavily on NumPy! The code cell below computes the Euclidean distances between x and all data points in D using the method euclidean_distances() provided by scikit-learn.

In [79]:
from sklearn.metrics.pairwise import euclidean_distances

euclidean_distances(D, x.reshape(1, -1))
Out[79]:
array([[0.744],
       [0.361],
       [1.344],
       [1.192],
       [0.709],
       [0.817],
       [0.69 ],
       [0.28 ],
       [1.199],
       [0.504]])

Of course, this result matches our distances array, where we "manually" computed all Euclidean distances.

Feature Scaling: Standardization¶

Feature scaling or standardization is an important preprocessing step in data mining and machine learning. It involves transforming the features or variables of a dataset to a common scale or range. Here are the key reasons why feature scaling is important:

  • Avoiding bias due to different scales: Features in a dataset often have different scales and units of measurement. For example, one feature might have values ranging from 0 to 100, while another feature could range from 0 to 1000. These differences in scales can introduce bias in certain machine learning algorithms that are sensitive to the magnitude of features. Scaling the features ensures that they are on a similar scale, preventing certain features from dominating the learning process solely because of their larger values.

  • Enhancing convergence and performance: Many optimization algorithms used in machine learning, such as gradient descent, rely on the assumption that features are on a similar scale. When features have vastly different scales, the convergence of these algorithms can be slow or inefficient. By scaling the features, optimization algorithms can converge more quickly, leading to faster and more accurate models.

  • Facilitating distance-based algorithms: Algorithms that utilize distances or similarities between data points, such as k-nearest neighbors (k-NN) or clustering algorithms, are sensitive to the scale of features. Without proper scaling, features with larger scales can dominate the distance calculations and influence the results disproportionately. Scaling the features ensures that all features contribute fairly to the distance calculations and allows for more reliable and meaningful comparisons.

  • Improving model performance and interpretation: Feature scaling can positively impact the performance of various machine learning models. Models such as support vector machines (SVMs), k-NN, and neural networks often benefit from feature scaling, as it aids in finding optimal hyperplanes, improving decision boundaries, and ensuring efficient model training. Furthermore, feature scaling can make the coefficients or weights in linear models more interpretable and comparable, as they represent the importance or contribution of each feature on a common scale.

Common methods of feature scaling include normalization (scaling features to a specific range, e.g., [0, 1]) and standardization (scaling features to have zero mean and unit variance). The choice of scaling method depends on the specific requirements and characteristics of the dataset and the machine learning algorithms being used. Overall, feature scaling or standardization is crucial in data mining as it promotes fairness, efficiency, and effectiveness in various machine learning algorithms, improves model performance, and aids in meaningful interpretation of results.

To illustrate the purpose of feature scaling, take a second look at the formula for calculating the Euclidean distance; here for just 2 features:

$$\large d(p, q) = \sqrt{(p_1 - q_1)^2 + (p_2 - q_2)^2 } $$

As you can see, the Euclidean Distance depends on the differences between the respective feature values. This can cause a problem if the two features are of very different magnitudes. For example, assume that the values of Feature 1 are around $0.0001$ while the values of Feature 2 are around $1,000$. In that case, the values of Feature 1 will hardly affect the Euclidean Distance between two data points, since $(p_1 - q_1)^2$ will be negligible compared to $(p_2 - q_2)^2$.
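The numbers below make this concrete. The two data points are hypothetical, with values chosen to mirror the magnitudes mentioned above ($0.0001$ vs. $1,000$): the Euclidean distance over both features is essentially identical to the distance computed from Feature 2 alone.

```python
import numpy as np

# Two hypothetical data points with features of very different magnitudes
p = np.array([0.0001, 1000.0])
q = np.array([0.0009, 1250.0])

d = np.sqrt(np.sum((p - q) ** 2))    # Euclidean distance over both features
d_feature2_only = abs(p[1] - q[1])   # "distance" using Feature 2 alone

# Both values are approximately 250; Feature 1 barely contributes
print(d, d_feature2_only)
```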

Feature scaling aims to remedy this issue by bringing all features to a common order of magnitude. One approach for feature scaling is standardization (scaling features to have zero mean and unit variance). If $x$ is a feature with mean $\mu$ and standard deviation $\sigma$, and $x_i$ is the feature value for data point $i$, each feature value gets standardized by subtracting the feature mean and dividing by the feature standard deviation.

$$\large x_i = \frac{x_i - \mu}{\sigma} $$

Let's see how this looks in an example. First, we create another random dataset; in this case, however, we artificially scale the values of the different features up or down. For example, the first feature will be of magnitude $0.01$, while the third feature will be of magnitude $100$.

In [80]:
np.random.seed(10) # Just to ensure that we get the same random numbers

D = np.random.rand(10, 5) * np.array([0.05, 10, 500, 0.1, 50])

print('Dataset D:')
print(D)
Dataset D:
[[  0.039   0.208 316.824   0.075  24.925]
 [  0.011   1.981 380.265   0.017   4.417]
 [  0.034   9.534   1.974   0.051  40.631]
 [  0.031   7.218 145.938   0.092  35.729]
 [  0.027   1.422 186.67    0.067  22.092]
 [  0.022   6.178 256.569   0.065  30.052]
 [  0.04    5.216 454.324   0.032   4.523]
 [  0.015   1.14  414.341   0.005  31.314]
 [  0.027   8.193  99.474   0.086  17.583]
 [  0.038   2.96  441.968   0.033   8.251]]

Without feature scaling, calculating the Euclidean Distance would typically be dominated by Feature 3. This would make Feature 3 more important than the other features, which in practice is usually not a justified assumption. Using the built-in methods np.mean() and np.std(), we can easily calculate the mean and standard deviation for each feature. Note that we need to specify the axis parameter; otherwise, we would calculate the mean and standard deviation over all values in D.

In [81]:
col_mean = np.mean(D, axis=0)
col_std = np.std(D, axis=0)

print(col_mean, "<= Means for all features")
print(col_std, "<= Standard deviations for all features")
[  0.028   4.405 269.835   0.052  21.952] <= Means for all features
[  0.009   3.123 149.052   0.028  12.324] <= Standard deviations for all features

With the $5$ means and $5$ standard deviations for all $5$ features, we can again use broadcasting to update each feature value with respect to its "own" mean and standard deviation.

In [82]:
D_standardized = (D - col_mean) / col_std

print(D_standardized)
[[ 1.078 -1.344  0.315  0.807  0.241]
 [-1.817 -0.776  0.741 -1.256 -1.423]
 [ 0.622  1.643 -1.797 -0.035  1.516]
 [ 0.237  0.901 -0.831  1.408  1.118]
 [-0.134 -0.955 -0.558  0.541  0.011]
 [-0.709  0.568 -0.089  0.457  0.657]
 [ 1.257  0.26   1.238 -0.722 -1.414]
 [-1.415 -1.046  0.969 -1.691  0.76 ]
 [-0.107  1.213 -1.143  1.191 -0.355]
 [ 0.989 -0.463  1.155 -0.699 -1.112]]

As you can see, now all features are roughly in the same ballpark, with no features standing out and potentially dominating the calculation of Euclidean Distances.
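We can verify this claim directly by rebuilding the dataset from above (same seed and scaling factors) and checking how much of the squared distance between the first two data points is due to Feature 3, before and after standardization.

```python
import numpy as np

# Recreate the dataset from above (same seed and per-feature scaling)
np.random.seed(10)
D = np.random.rand(10, 5) * np.array([0.05, 10, 500, 0.1, 50])
D_std = (D - D.mean(axis=0)) / D.std(axis=0)

# Distance between the first two data points, before and after scaling
d_raw = np.linalg.norm(D[0] - D[1])
d_scaled = np.linalg.norm(D_std[0] - D_std[1])

# Fraction of the squared distance contributed by Feature 3 (index 2)
share_f3_raw = (D[0, 2] - D[1, 2]) ** 2 / d_raw ** 2
share_f3_scaled = (D_std[0, 2] - D_std[1, 2]) ** 2 / d_scaled ** 2

print(f"Raw data:          Feature 3 share = {share_f3_raw:.1%}")
print(f"Standardized data: Feature 3 share = {share_f3_scaled:.1%}")
```

In the raw data, Feature 3 accounts for roughly 90% of the squared distance; after standardization, its share drops to a small fraction, so all features contribute on comparable terms.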

Side note: Again, standardization or normalization of the data is a very common task, and as such there are off-the-shelf solutions available to accomplish this. The code below uses the method provided by scikit-learn; the results should of course be identical. You can check out the StandardScaler class of scikit-learn.

In [83]:
from sklearn.preprocessing import StandardScaler

scaler = StandardScaler()

D_standardized_sklearn = scaler.fit_transform(D)

print(D_standardized_sklearn)
[[ 1.078 -1.344  0.315  0.807  0.241]
 [-1.817 -0.776  0.741 -1.256 -1.423]
 [ 0.622  1.643 -1.797 -0.035  1.516]
 [ 0.237  0.901 -0.831  1.408  1.118]
 [-0.134 -0.955 -0.558  0.541  0.011]
 [-0.709  0.568 -0.089  0.457  0.657]
 [ 1.257  0.26   1.238 -0.722 -1.414]
 [-1.415 -1.046  0.969 -1.691  0.76 ]
 [-0.107  1.213 -1.143  1.191 -0.355]
 [ 0.989 -0.463  1.155 -0.699 -1.112]]
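To confirm that the manual computation and scikit-learn agree, we can compare the two result arrays with np.allclose(). (Both use the population standard deviation, i.e., ddof=0, so the values match up to floating-point precision.)

```python
import numpy as np
from sklearn.preprocessing import StandardScaler

# Recreate the dataset from above (same seed and per-feature scaling)
np.random.seed(10)
D = np.random.rand(10, 5) * np.array([0.05, 10, 500, 0.1, 50])

# Manual standardization vs. scikit-learn's StandardScaler
manual = (D - D.mean(axis=0)) / D.std(axis=0)
sklearn_result = StandardScaler().fit_transform(D)

print(np.allclose(manual, sklearn_result))  # True
```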

Summary¶

NumPy is a fundamental Python library for numerical computing that provides support for efficient manipulation of large arrays and matrices, along with a wide range of mathematical operations. At its core, NumPy introduces the ndarray, a high-performance multidimensional array object, which allows for fast, vectorized operations on large datasets. Unlike Python's native lists, NumPy arrays are memory-efficient, support element-wise arithmetic, and integrate seamlessly with low-level optimized code, making them ideal for computationally intensive tasks.

One of the key strengths of NumPy is its comprehensive set of array manipulation and mathematical functions, including element-wise operations, aggregate functions, and linear algebra routines. Its support for broadcasting allows arithmetic between arrays of different shapes without explicit loops, enabling concise and readable code. Additionally, NumPy's arg* methods, matrix operations, and random number generation utilities make it invaluable for data preprocessing, statistical analysis, and simulation tasks, which are common in data science and scientific computing.

Another major advantage of NumPy is its efficiency and speed. Because most operations are implemented in optimized C and Fortran code under the hood, array computations are often orders of magnitude faster than equivalent Python code using loops. This performance is crucial when working with large datasets, performing numerical simulations, or training machine learning models, where computational bottlenecks can otherwise slow down workflows significantly.

Being proficient in NumPy is particularly important for machine learning and deep learning because it forms the foundation for more advanced frameworks such as PyTorch and TensorFlow. These frameworks use concepts like multidimensional tensors, broadcasting, and vectorized operations that are directly inspired by NumPy. A solid understanding of NumPy not only helps in writing efficient code but also makes it easier to learn and understand the behavior of these libraries, enabling faster experimentation and model development.

In summary, NumPy is more than just a library for arrays; it is a cornerstone of modern data science and scientific computing. Its strengths in efficient array manipulation, fast mathematical operations, and support for linear algebra make it indispensable for tasks ranging from data analysis to machine learning. Mastering NumPy provides a strong foundation for working with other Python-based computational frameworks and is an essential skill for anyone pursuing careers in data science, machine learning, artificial intelligence, or scientific research.

In [ ]: