Library: NumPy¶

Installation¶

#conda install numpy
#pip install numpy

import numpy as np

Numpy Arrays¶

A homogeneous container of numerical elements, all of a single type.
Arrays can have 1 dimension (similar to a Python list), 2 dimensions (similar to a nested Python list, i.e. a matrix), or more.
Axes are defined for arrays with more than one dimension: the first running vertically downwards across rows (axis 0), and the second running horizontally across columns (axis 1).

Creating NumPy Arrays¶

#From a Python list

my_list = [1,2,3]
my_list

[1, 2, 3]

arr = np.array(my_list)
arr

array([1, 2, 3])

#From a nested Python list (one inner list per row)

my_matrix = [
    [1, 2, 3],
    [4, 5, 6],
    [7, 8, 9],
]
my_matrix

[[1, 2, 3], [4, 5, 6], [7, 8, 9]]

mat = np.array(my_matrix)
mat

array([[1, 2, 3],
       [4, 5, 6],
       [7, 8, 9]])

Array¶

np.array(object [, dtype=None, copy=True, order='K', subok=False, ndmin=0])

#create an array 1 dimension
arr = np.array([2,4,6]) 
arr

array([2, 4, 6])

#create an array 2 dimensions (matrix)
mat = np.array([[2,4,6], [8,10,12], [14,16,18]]) 
mat

array([[ 2,  4,  6],
       [ 8, 10, 12],
       [14, 16, 18]])

zeros and ones¶

#arrays filled with zeros: an int gives a 1-D length, a tuple gives (rows, columns)
arr0 = np.zeros(shape=3)
mat0 = np.zeros(shape=(5, 5))
mat0

array([[0., 0., 0., 0., 0.],
       [0., 0., 0., 0., 0.],
       [0., 0., 0., 0., 0.],
       [0., 0., 0., 0., 0.],
       [0., 0., 0., 0., 0.]])

#arrays filled with ones: an int gives a 1-D length, a tuple gives (rows, columns)
arr1 = np.ones(shape=3)
mat1 = np.ones(shape=(3, 3))
mat1

array([[1., 1., 1.],
       [1., 1., 1.],
       [1., 1., 1.]])

arange array¶

np.arange([start, ]stop, [step, ]dtype=None)

#evenly spaced integers: start=0, stop=10 (excluded), step=2
arr = np.arange(0, 10, 2, dtype=int) #np.arange([start,] stop [, step, dtype])
arr

array([0, 2, 4, 6, 8])

arr = np.arange( 0, 2, 0.3 ) #accepts a float step; with non-integer steps np.linspace is usually the safer choice
arr

array([0. , 0.3, 0.6, 0.9, 1.2, 1.5, 1.8])

arr = np.arange(12).reshape((3, 4)) #12 consecutive integers laid out as 3 rows x 4 columns
arr

array([[ 0,  1,  2,  3],
       [ 4,  5,  6,  7],
       [ 8,  9, 10, 11]])

linspace¶

np.linspace(start, stop, num=50[, endpoint=True, retstep=False, dtype=None, axis=0])

#Return evenly spaced numbers over a specified interval
np.linspace(0,10,21)

array([ 0. ,  0.5,  1. ,  1.5,  2. ,  2.5,  3. ,  3.5,  4. ,  4.5,  5. ,
        5.5,  6. ,  6.5,  7. ,  7.5,  8. ,  8.5,  9. ,  9.5, 10. ])

eye¶

#creates an identity matrix
np.eye(4)

array([[1., 0., 0., 0.],
       [0., 1., 0., 0.],
       [0., 0., 1., 0.],
       [0., 0., 0., 1.]])

Random¶

#Create an array of the given shape and populate it with random samples from a uniform distribution over [0, 1) (0 included, 1 excluded).
np.random.rand(2)
np.random.rand(5,5)

array([[0.9797668 , 0.94586434, 0.36524117, 0.19784975, 0.15176004],
       [0.09277052, 0.90938651, 0.52618724, 0.62981716, 0.5111796 ],
       [0.96197826, 0.48489467, 0.14034696, 0.69334539, 0.33582117],
       [0.69485323, 0.93141817, 0.03266454, 0.1680806 , 0.49473144],
       [0.19240705, 0.50925566, 0.07623005, 0.34016356, 0.66179273]])

#Return a sample (or samples) from the "standard normal" distribution. Unlike rand which is uniform:
np.random.randn(2)
np.random.randn(5,5)

array([[-1.58666343,  0.85040663, -0.27919152,  0.01841439,  0.75435485],
       [ 0.89726612,  0.69130702, -1.13555545, -0.66225676,  0.70258642],
       [ 1.44323687, -0.34104132,  0.83226325, -1.37563275,  2.36230149],
       [-0.20648663,  1.00273908, -0.56658769, -1.49940631,  2.05278195],
       [-0.80371781,  0.59568719, -1.63747353, -1.14329534, -0.69771396]])

#Return random integers from `low` (inclusive) to `high` (exclusive).
np.random.randint(1,100)
np.random.randint(1,100,10)

array([76,  9, 67, 24, 16, 89, 54, 23, 31, 87])

Array Attributes and Methods¶

arr = np.arange(25)
arr #show

array([ 0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15, 16,
       17, 18, 19, 20, 21, 22, 23, 24])

ranarr = np.random.randint(0,50,10)
ranarr #show

array([11, 49, 21,  5, 45, 32, 36, 41, 16, 28])

ranarr.reshape(5,2) #returns the same values arranged as 5 rows x 2 columns; ranarr itself keeps its shape

array([[11, 49],
       [21,  5],
       [45, 32],
       [36, 41],
       [16, 28]])

ranarr.max() #max value

49

ranarr.argmax() #max value position

1

ranarr.min()#min value

5

ranarr.argmin() #min value position

3

ranarr.ndim #number of axes(dimensions)

1

ranarr.size #number of elements

10

ranarr.shape #dimensions

(10,)

ranarr.dtype #data type

dtype('int32')

ranarr.itemsize #size in bytes

4

ranarr.reshape(5,2).shape

(5, 2)

Indexing and Selection¶

Bracket Indexing and Selection¶

#Get a value at an index
arr[8]

8

#Get values in a range (start included, end excluded)
arr[1:5]

array([1, 2, 3, 4])

#References vs. copies
arr1 = arr #plain assignment: arr1 is just another name for the same array object
arr2 = arr.copy() #copy() has to be called (with parentheses) to get a new, independent array
arr is arr1 #True, same object
arr is arr2 #False, different object

False

Indexing a 2D array (matrices)¶

#Build a 3x3 array from nested rows
arr_2d = np.array([[5, 10, 15], [20, 25, 30], [35, 40, 45]])
arr_2d

array([[ 5, 10, 15],
       [20, 25, 30],
       [35, 40, 45]])

#Indexing rows
arr_2d[1] #one row
arr_2d[[0,2]] #list of rows

array([[ 5, 10, 15],
       [35, 40, 45]])

#Getting individual element value
arr_2d[1, 0] #single [row, column] index; arr_2d[1][0] gives the same value but builds a temporary row first

20

#Getting multiple element values
arr_2d[:2,1:] #rows 0 and 1 (stop index 2 excluded), columns from index 1 to the end

array([[10, 15],
       [25, 30]])

#Filtering with a boolean mask
arr = np.arange(1, 11)
bool_arr = arr > 4 #element-wise comparison: True where the value is greater than 4
bool_arr #the mask itself
arr[bool_arr] #keeps only the elements whose mask entry is True

array([ 5,  6,  7,  8,  9, 10])

arr[arr>4] #direct filter

array([ 5,  6,  7,  8,  9, 10])

x = 4 #filter condition
arr[arr>x] #filter using condition

array([ 5,  6,  7,  8,  9, 10])

NumPy Operations¶

arr = np.arange(1, 13).reshape((3, 4)) #values 1..12 arranged as 3 rows x 4 columns
print(arr)

[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]

Basic Operations¶

arr + arr #sum

array([[ 2,  4,  6,  8],
       [10, 12, 14, 16],
       [18, 20, 22, 24]])

arr - arr #subtraction

array([[0, 0, 0, 0],
       [0, 0, 0, 0],
       [0, 0, 0, 0]])

arr * arr #product

array([[  1,   4,   9,  16],
       [ 25,  36,  49,  64],
       [ 81, 100, 121, 144]])

arr/arr #division

array([[1., 1., 1., 1.],
       [1., 1., 1., 1.],
       [1., 1., 1., 1.]])

1/arr #element-wise reciprocal (1 divided by each value)

array([[1.        , 0.5       , 0.33333333, 0.25      ],
       [0.2       , 0.16666667, 0.14285714, 0.125     ],
       [0.11111111, 0.1       , 0.09090909, 0.08333333]])

arr**2 #power

array([[  1,   4,   9,  16],
       [ 25,  36,  49,  64],
       [ 81, 100, 121, 144]], dtype=int32)

np.sqrt(arr) #square root

array([[1.        , 1.41421356, 1.73205081, 2.        ],
       [2.23606798, 2.44948974, 2.64575131, 2.82842712],
       [3.        , 3.16227766, 3.31662479, 3.46410162]])

np.exp(arr) #exponential (e raised to each value)

array([[2.71828183e+00, 7.38905610e+00, 2.00855369e+01, 5.45981500e+01],
       [1.48413159e+02, 4.03428793e+02, 1.09663316e+03, 2.98095799e+03],
       [8.10308393e+03, 2.20264658e+04, 5.98741417e+04, 1.62754791e+05]])

np.sin(arr) #sin

array([[ 0.84147098,  0.90929743,  0.14112001, -0.7568025 ],
       [-0.95892427, -0.2794155 ,  0.6569866 ,  0.98935825],
       [ 0.41211849, -0.54402111, -0.99999021, -0.53657292]])

np.log(arr) #natural logarithm

array([[0.        , 0.69314718, 1.09861229, 1.38629436],
       [1.60943791, 1.79175947, 1.94591015, 2.07944154],
       [2.19722458, 2.30258509, 2.39789527, 2.48490665]])

np.sum(arr) #total sum

78

np.sum(arr, axis = 0) #column sum

array([15, 18, 21, 24])

np.sum(arr, axis = 1) #row sum

array([10, 26, 42])

np.cumsum(arr, axis = 0) #cumulative column sum

array([[ 1,  2,  3,  4],
       [ 6,  8, 10, 12],
       [15, 18, 21, 24]], dtype=int32)

np.cumsum(arr, axis = 1) #cumulative row sum

array([[ 1,  3,  6, 10],
       [ 5, 11, 18, 26],
       [ 9, 19, 30, 42]], dtype=int32)

np.diff(arr) #difference between each value and the one before it, computed along each row

array([[1, 1, 1],
       [1, 1, 1],
       [1, 1, 1]])

np.prod(arr) #total product

479001600

np.cumprod(arr) #cumulative product over the flattened array (no axis given)

array([        1,         2,         6,        24,       120,       720,
            5040,     40320,    362880,   3628800,  39916800, 479001600],
      dtype=int32)

Basic Statistics¶

np.max(arr) #maximum

12

np.min(arr) #minimum

1

np.average(arr) #average

6.5

np.mean(arr) #mean

6.5

np.median(arr) #median

6.5

np.var(arr) #variance

11.916666666666666

np.std(arr) #standard deviation

3.452052529534663

np.bincount(arr[0]) #number of occurrences of each integer value, starting from 0, in the first row

array([0, 1, 1, 1, 1], dtype=int64)

np.corrcoef(arr) #Pearson correlation coefficients between the rows (each row is treated as one variable)

array([[1., 1., 1.],
       [1., 1., 1.],
       [1., 1., 1.]])

np.cov(arr) #covariance matrix

array([[1.66666667, 1.66666667, 1.66666667],
       [1.66666667, 1.66666667, 1.66666667],
       [1.66666667, 1.66666667, 1.66666667]])

Rounding Methods¶

arrdem = np.arange(0,8,0.23)
arrdem

array([0.  , 0.23, 0.46, 0.69, 0.92, 1.15, 1.38, 1.61, 1.84, 2.07, 2.3 ,
       2.53, 2.76, 2.99, 3.22, 3.45, 3.68, 3.91, 4.14, 4.37, 4.6 , 4.83,
       5.06, 5.29, 5.52, 5.75, 5.98, 6.21, 6.44, 6.67, 6.9 , 7.13, 7.36,
       7.59, 7.82])

np.rint(arrdem) #to the nearest integer

array([0., 0., 0., 1., 1., 1., 1., 2., 2., 2., 2., 3., 3., 3., 3., 3., 4.,
       4., 4., 4., 5., 5., 5., 5., 6., 6., 6., 6., 6., 7., 7., 7., 7., 8.,
       8.])

np.round(arrdem, 1) #to the nearest number for the precision defined (decimals)

array([0. , 0.2, 0.5, 0.7, 0.9, 1.2, 1.4, 1.6, 1.8, 2.1, 2.3, 2.5, 2.8,
       3. , 3.2, 3.4, 3.7, 3.9, 4.1, 4.4, 4.6, 4.8, 5.1, 5.3, 5.5, 5.8,
       6. , 6.2, 6.4, 6.7, 6.9, 7.1, 7.4, 7.6, 7.8])

np.ceil(arrdem) #rounds up to the nearest integer

array([0., 1., 1., 1., 1., 2., 2., 2., 2., 3., 3., 3., 3., 3., 4., 4., 4.,
       4., 5., 5., 5., 5., 6., 6., 6., 6., 6., 7., 7., 7., 7., 8., 8., 8.,
       8.])

np.floor(arrdem) #rounds down to the nearest integer

array([0., 0., 0., 0., 0., 1., 1., 1., 1., 2., 2., 2., 2., 2., 3., 3., 3.,
       3., 4., 4., 4., 4., 5., 5., 5., 5., 5., 6., 6., 6., 6., 7., 7., 7.,
       7.])

np.trunc(arrdem) #truncates to integer

array([0., 0., 0., 0., 0., 1., 1., 1., 1., 2., 2., 2., 2., 2., 3., 3., 3.,
       3., 4., 4., 4., 4., 5., 5., 5., 5., 5., 6., 6., 6., 6., 7., 7., 7.,
       7.])

np.clip(arrdem, 2, 6) #clips lower and upper values according to the boundaries

array([2.  , 2.  , 2.  , 2.  , 2.  , 2.  , 2.  , 2.  , 2.  , 2.07, 2.3 ,
       2.53, 2.76, 2.99, 3.22, 3.45, 3.68, 3.91, 4.14, 4.37, 4.6 , 4.83,
       5.06, 5.29, 5.52, 5.75, 5.98, 6.  , 6.  , 6.  , 6.  , 6.  , 6.  ,
       6.  , 6.  ])

Shape manipulation¶

np.sort(arr) #returns a sorted copy, ascending along the last axis (here: within each row)

array([[ 1,  2,  3,  4],
       [ 5,  6,  7,  8],
       [ 9, 10, 11, 12]])

-np.sort(-arr) #descending within each row: negate, sort ascending, then negate back

array([[ 4,  3,  2,  1],
       [ 8,  7,  6,  5],
       [12, 11, 10,  9]])

np.ravel(arr) #flattens the values into a 1-D array, row by row

array([ 1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12])

arr.T #transposes the matrix

array([[ 1,  5,  9],
       [ 2,  6, 10],
       [ 3,  7, 11],
       [ 4,  8, 12]])

arr.resize(4,3) #changes the shape of arr in place (unlike reshape, nothing is returned to display)
arr

array([[ 1,  2,  3],
       [ 4,  5,  6],
       [ 7,  8,  9],
       [10, 11, 12]])

np.vstack((arr, arr)) #joins vertically (rows)

array([[ 1,  2,  3],
       [ 4,  5,  6],
       [ 7,  8,  9],
       [10, 11, 12],
       [ 1,  2,  3],
       [ 4,  5,  6],
       [ 7,  8,  9],
       [10, 11, 12]])

np.hstack((arr,arr)) #joins horizontally (columns)

array([[ 1,  2,  3,  1,  2,  3],
       [ 4,  5,  6,  4,  5,  6],
       [ 7,  8,  9,  7,  8,  9],
       [10, 11, 12, 10, 11, 12]])

np.split(arr, 2) #splits the rows into 2 equal parts, returned as a list of arrays

[array([[1, 2, 3],
        [4, 5, 6]]), array([[ 7,  8,  9],
        [10, 11, 12]])]

np.hsplit(arr, 3) #splits the columns into 3 equal parts, returned as a list of arrays

[array([[ 1],
        [ 4],
        [ 7],
        [10]]), array([[ 2],
        [ 5],
        [ 8],
        [11]]), array([[ 3],
        [ 6],
        [ 9],
        [12]])]

Broadcasting¶

arr[0:3,0] = 100 #updates values
arr

array([[100,   2,   3],
       [100,   5,   6],
       [100,   8,   9],
       [ 10,  11,  12]])

slice_of_arr = arr[:2, :3] #selects rows 0-1 and columns 0-2; basic slicing gives a view onto arr, not a copy
slice_of_arr

array([[100,   2,   3],
       [100,   5,   6]])

arr[arr > 6] = 20 #filter to update
arr

array([[20,  2,  3],
       [20,  5,  6],
       [20, 20, 20],
       [20, 20, 20]])