#!/usr/bin/env python # coding: utf-8 # # Numpy # $\newcommand{\re}{\mathbb{R}}$ # [Numpy](https://numpy.org/doc/stable/user/index.html) provides many useful types and methods to perform numerical computations including vectors, matrices and linear algebra. # # First import the numpy module. # In[353]: import numpy # You only need to do this once, usually at the beginning of your code. # # To access methods, etc. inside this module, use dot operator. # In[354]: print(numpy.pi) print(numpy.sin(numpy.pi/2)) # It is common practice to import numpy like this. # In[355]: import numpy as np # Note that ```np``` acts as an alias or short-hand for ```numpy```. # In[356]: print(np.pi) print(np.sin(np.pi/2)) # ## 1-d [arrays](https://numpy.org/doc/stable/reference/generated/numpy.array.html) # Create an array of zeros # In[357]: x = np.zeros(5) print(x) # These one dimensional arrays are of type ```ndarray``` # In[358]: type(x) # Create an array of ones # In[359]: x = np.ones(5) print(x) # Create and add two arrays # In[360]: x = np.array([1.0, 2.0, 3.0]) y = np.array([4.0, 5.0, 6.0]) z = x + y print(z) # Get the size of array # In[361]: print(len(x)) print(x.size) # Get the shape of an array # In[362]: print(x.shape) # We see that these are arrays of reals by default. We can specify the type # In[363]: a = np.zeros(5, dtype=int) print(a) # ## [linspace](https://numpy.org/doc/stable/reference/generated/numpy.linspace.html) # This behaves same way as Matlab's [linspace](https://mathworks.com/help/matlab/ref/linspace.html) function. # # Generate 10 uniformly spaced numbers in [1,10] # In[364]: x = np.linspace(1,10,10) print(x) # Note that this includes the end points 1 and 10. The output of linspace is an ```ndarray``` of floats. # In[365]: type(x) # `x = linspace(a,b,n)` is such that `x` is an array of `n` elements # # ``` # x[i] = a + i*h, i=0,1,2,...,n-1, h = (b-a)/(n-1) # ``` # # so that # # ``` # x[0] = a, x[n-1] = x[-1] = b # ``` # # Note that we get last element of array using `x[-1]`; similarly, the last but one is given by `x[-2]`, etc. # ## [arange](https://numpy.org/doc/stable/reference/generated/numpy.arange.html) # In[366]: x = np.arange(1,10) print(x) print(type(x)) # For $m < n$, `arange(m,n)` returns # # $$ # m, m+1, \ldots, n-1 # $$ # # Note the last value $n$ is not included. # # We can specify a step size # In[367]: x = np.arange(1,10,2) print(x) # If the arguments are float, the returned value is also float. # In[368]: x = np.arange(1.0,10.0) print(x) # In[369]: x = np.arange(0,1,0.1) print(x) # ## Beware of pitfalls - 1 # # Create an array of ones. # In[370]: x = np.ones(10) print(x) # Maybe we want set all elements to zero, so we might try this # In[371]: x = 0.0 print(x) # ```x``` has changed from an array to a scalar !!! In Python, the type of a variable is determined by what we assign to it. The correct way to set zeroes is this. # In[372]: x = np.ones(10) print(x) x[:] = 0.0 print(x) # ## Beware of pitfalls - 2 # In[373]: x = np.ones(5) y = x x[:] = 0.0 print('x = ', x) print('y = ', y) # Why did ```y``` change ? This happened because when we do # # ``` # y = x # ``` # # then `y` is just a pointer to `x`, so that changing `x` changes `y` also. If we want ```y``` to be an independent copy of ```x``` then do this # In[374]: x = np.ones(5) y = x.copy() # or y = np.copy(x) x[:] = 0.0 print('x = ', x) print('y = ', y) # ## 2-d [arrays](https://numpy.org/doc/stable/reference/generated/numpy.array.html) # 2-d arrays can be considered as matrices, though Numpy has a separate [matrix](https://numpy.org/doc/stable/reference/generated/numpy.matrix.html) class. # # Create an array of zeros # In[375]: A = np.zeros((5,5)) print(A) # The size must be specified as a tuple or list. # # We can access the elements by two indices `A[i,j]`: here `i` is the row index and `j` is the column index. # # ``` # -----------j--------> # | [[0. 0. 0. 0. 0.] # | [0. 0. 0. 0. 0.] # i [0. 0. 0. 0. 0.] # | [0. 0. 0. 0. 0.] # v [0. 0. 0. 0. 0.]] # ``` # # The top, left element is `A[0,0]`. # # We can modify the elements of an array. # In[376]: A[1,1] = 1.0 print(A) # Create an array of ones # In[377]: A = np.ones((2,3)) print(A) # Create identity matrix # In[378]: A = np.eye(5) print(A) # Create an array by specifying its elements # In[379]: A = np.array([[1.0, 2.0], [3.0, 4.0]]) print(A) # Create a random array and inspect its shape # In[380]: m, n = 2, 3 A = np.random.rand(m,n) print(A) print('A.size =',A.size) print('A.shape =',A.shape) print('A.shape[0] =',A.shape[0],' (number of rows)') print('A.shape[1] =',A.shape[1],' (number of columns)') # To print the elements of an array, we need two for loops, one over rows and another over the columns. # In[381]: for i in range(m): # loop over rows for j in range(n): # loop over columns print(i,j,A[i,j]) # To transpose a 2-d array # In[382]: A = np.array([[1,2],[3,4]]) print("A ="); print(A) B = A.T print("B ="); print(B) # ## Diagonal matrix # # Create # # $$ # A = \begin{bmatrix} # 1 & 0 & 0 & 0 \\ # 0 & 2 & 0 & 0 \\ # 0 & 0 & 3 & 0 \\ # 0 & 0 & 0 & 4 \end{bmatrix} # $$ # In[383]: a = np.array([1,2,3,4]) # diagonal elements A = np.diag(a) print(A) # Create $n \times n$ tri-diagonal matrix # In[384]: a = np.array([1,2,3]) # sub-diagonal : length = n-1 b = np.array([4,5,6,7]) # main diagonal : length = n c = np.array([-1,-2,-3]) # super-diagonal: length = n-1 A = np.diag(a,-1) + np.diag(b,0) + np.diag(c,+1) print(A) # ## empty_like, etc. # # Sometimes we have an existing array and we want to create a new array of the same shape and type, but without initializing its elements. # In[385]: A = np.random.rand(2,3) B = np.empty_like(A) print(A.shape,B.shape) # In[386]: C = np.zeros_like(A) print(C) # In[387]: D = np.ones_like(A) print(D) # ## 1-D array is neither row nor column vector # In[388]: x = np.array([1,2,3]) print(x.shape, x) y = x.T print(y.shape, y) # Create a row vector # In[389]: x = np.array([[1,2,3]]) # row vector print('x.shape =',x.shape) print(x) y = x.T print('y.shape =',y.shape) print(y) # Create a column vector # In[390]: x = np.array([[1], [2], [3]]) # column vector print('x.shape =',x.shape) print(x) y = x.T print('y.shape =',y.shape) print(y) # Functions like `zeros` and `ones` can return row/column vector rather than array. # In[391]: x = np.ones((3,1)) # column vector print('x ='); print(x) y = np.ones((1,3)) # row vector print('y ='); print(y) # Row/column vectors are like row/column matrix. We have to use two indices to access the elements of such row/column vectors. # # Here we access elements of a column vector. # In[392]: print(x[0][0]) # or x[0,0] print(x[1][0]) print(x[2][0]) # `x[0]` gives an array for the first row. # In[393]: print('First row of x =',x[0], type(x[0])) print('Element in first row =',x[0][0], type(x[0][0])) # ## Accessing portions of arrays # Array of 10 elements # # | x[0] | x[1] | x[2] | x[3] | x[4] | x[5] | x[6] | x[7] | x[8] | x[9] | # |:----:|:----:|:----:|:----:|:----:|:----:|:----:|:----:|:----:|:----:| # | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | # |x[-10]| x[-9]| x[-8]| x[-7]| x[-6]| x[-5]| x[-4]| x[-3]| x[-2]|x[-1] | # # In[394]: x = np.linspace(0,9,10) print(x) # Get elements ```x[2],...,x[5]``` # In[395]: print(x[2:6]) # Hence ```x[m:n]``` gives the elements ```x[m],x[m+1],...,x[n-1]```. # # Get elements from ```x[5]``` upto the last element # In[396]: print(x[5:]) # Get the last element # In[397]: print(x[-1]) # Get element ```x[5]``` upto last but one element # In[398]: print(x[5:-1]) # Access every alternate element of array starting from beginning `x[0]` # In[399]: print(x[0::2]) # and starting from `x[1]` # In[400]: print(x[1::2]) # These operations work on multi dimensional arrays also. # In[401]: A = np.random.rand(3,4) print(A) # In[402]: print(A[0,:]) # 0'th row # In[403]: print(A[:,0]) # 0'th column # In[404]: print(A[0:2,0:3]) # print submatrix # In[405]: A[0,:] = 0.0 # zero out zeroth row print(A) # ## Arithmetic operations on arrays # Some arithmetic operations act element-wise # In[406]: x = np.array([1.0, 2.0, 3.0]) y = np.array([4.0, 5.0, 6.0]) print(x*y) # multiply # In[407]: print(x/y) # divide # In[408]: print(y**x) # exponentiation # In[409]: A = np.ones((3,3)) print(A*x) # If ```A``` and ```x``` are arrays, then ```A*x``` does not give matrix-vector product. For that use ```dot``` # In[410]: print(A.dot(x)) # or equivalently # In[411]: print(np.dot(A,x)) # In Python3 versions, we can use `@` to achieve matrix operations # In[412]: print(A@x) # We can of course do matrix-matrix products using ```dot``` or ```@``` # In[413]: A = np.ones((3,3)) B = 2*A print('A =\n',A) print('B =\n',B) print('A*B =\n',A@B) # On vectors, `@` performs dot product, i.e., `x@y = dot(x,y)` # In[414]: x = np.array([1,1,1]) y = np.array([2,3,4]) print(x@y) # ## Some matrix/vector functions # In[415]: x = np.array([-3,-2,-1,0,1,2,3]) print('min = ',np.min(x)) print('max = ',np.max(x)) print('abs min = ',np.abs(x).min()) # np.min(np.abs(x)) print('abs max = ',np.abs(x).max()) # np.max(np.abs(x)) print('sum = ',np.sum(x)) print('dot = ',np.dot(x,x)) print('dot = ',np.sum(x*x)) # Note that `np.sum(x*x)` gives # # $$ # \sum_{i=0}^{n-1} x_i^2 # $$ # # We can compute vector norms using [numpy.linalg.norm](https://numpy.org/doc/stable/reference/generated/numpy.linalg.norm.html) (also see [scipy.linalg.norm](https://docs.scipy.org/doc/scipy/reference/generated/scipy.linalg.norm.html)) # In[416]: from numpy.linalg import norm print(norm(x)) # L2 norm print(norm(x,2)) # L2 norm print(norm(x,1)) # L1 norm print(norm(x,np.inf)) # Linf norm # or import the `linalg` module and use methods inside it. # In[417]: import numpy.linalg as la print(la.norm(x)) # L2 norm print(la.norm(x,2)) # L2 norm print(la.norm(x,1)) # L1 norm print(la.norm(x,np.inf)) # Linf norm # These methods work on 2-d arrays treated as matrices. # In[418]: A = 2*np.random.rand(3,3) - 1 print(A) # In[419]: print('min = ',np.min(A)) print('max = ',np.max(A)) print('abs min = ',np.abs(A).min()) # np.min(np.abs(x)) print('abs max = ',np.abs(A).max()) # np.max(np.abs(x)) print('sum = ',np.sum(A)) print('Frob norm = ',la.norm(A)) # Frobenius norm print('L1 norm = ',la.norm(A,1)) # L1 norm print('L2 norm = ',la.norm(A,2)) # L2 norm print('Linf norm = ',la.norm(A,np.inf)) # Linf norm # ## Example: Matrix-vector product # Let # # $$ # x \in \re^n, \qquad A \in \re^{m \times n}, \qquad y = A x \in \re^m # $$ # # We can compute this element-wise # # $$ # y_i = \sum_{j=0}^{n-1} A_{ij} x_j, \qquad 0 \le i \le m-1 # $$ # In[420]: m, n = 5, 10 x = np.random.rand(n) A = np.random.rand(m,n) y = np.zeros(m) # Important to set to zero assert A.shape[1] == len(x) and len(y) == A.shape[0] for i in range(m): for j in range(n): y[i] += A[i,j]*x[j] # We can verify that our result is correct by computing $\| y - A x\|_\infty$ # In[421]: print(np.linalg.norm(y-A@x, np.inf)) # We can also compute the product column-wise. Let # # $$ # A_{:,j} = \textrm{j'th column of A} \in \re^m # $$ # # Then the matrix-vector product can also be written as # # $$ # y = \sum_{j=0}^{n-1} A_{:,j} x_j # $$ # # **Warning**: This may have inefficient memory access since by default, numpy arrays have column-major ordering, see below. # In[422]: y[:] = 0.0 for j in range(n): y += A[:,j]*x[j] # Now check the result print(np.linalg.norm(y-A@x, np.inf)) # ## Example: Matrix-Matrix product # If $A \in \re^{m\times n}$ and $B \in \re^{n \times p}$ then $C = AB \in \re^{m \times p}$ is given by # # $$ # C_{ij} = \sum_{k=0}^{n-1} A_{ik} B_{kj}, \qquad 0 \le i \le m-1, \quad 0 \le j \le p-1 # $$ # In[423]: m,n,p = 10,8,6 A = np.random.rand(m,n) B = np.random.rand(n,p) C = np.zeros((m,p)) assert A.shape[1] == B.shape[0] for i in range(m): for j in range(p): for k in range(n): C[i,j] += A[i,k]*B[k,j] # Let us verify the result is correct by computing # # $$ # |C-AB|_\infty = \max_{i,j} |C_{ij} - (AB)_{ij}| # $$ # # using `@` operator # In[424]: print(np.abs(C - A@B).max()) # Another view-point is the following # # $$ # C_{ij} = (\textrm{i'th row of A}) \cdot (\textrm{j'th column of B}) # $$ # In[425]: for i in range(m): for j in range(p): C[i,j] = A[i,:] @ B[:,j] # Now check the result print(np.abs(C - A@B).max()) # ## Outer product of two vectors # # Given $a \in \re^m$ and $b \in \re^n$, both considered as column vectors, their outer product # # $$ # A = a b^\top = # \begin{bmatrix} # | \\ # a \\ # | # \end{bmatrix} # \begin{bmatrix} # - b^\top - # \end{bmatrix} # = # \begin{bmatrix} # | & | & & | \\ # a b_0 & a b_1 & \ldots & a b_{n-1} \\ # | & | & & | # \end{bmatrix} \in \re^{m \times n} # $$ # # is an $m \times n$ matrix with elements # # $$ # A_{ij} = a_i b_j, \qquad 0 \le i \le m-1, \quad 0 \le j \le n-1 # $$ # In[426]: a = np.array([1,2,3]) b = np.array([1,2]) A = np.outer(a,b) print('A.shape = ', A.shape) print('A = \n', A) # ## Math functions # # Numpy provides standard functions like `sin`, `cos`, `log`, etc. which can act on arrays in an element-by-element manner. This is not the case for functions in `math` module, which can only take scalar arguments. # In[427]: x = np.linspace(0.0, 2.0*np.pi, 5) y = np.sin(x) print('x =',x) print('y =',y) # In[428]: A = np.random.rand(5,5) # 5x5 matrix Y = np.sin(A) print('A =\n',A) print('Y =\n',Y) # ## Memory ordering in arrays* # By default, the ordering is same as in C/C++, the inner-most index is the fastest running one. For example, if we have an array of size (2,3), they are stored in memory in this order # # ``` # a[0,0], a[0,1], a[0,2], a[1,0], a[1,1], a[1,2] # ``` # # i.e., # # ``` # a[0,0] --> a[0,1] --> a[0,2] # | # |----------<----------| # | # a[1,0] --> a[1,1] --> a[1,2] # ``` # In[429]: a = np.array([[1,2,3], [4,5,6]]) print('Row contiguous =', a[0,:].data.contiguous) print('Col contiguous =', a[:,0].data.contiguous) a.flags # To get fortran style ordering, where the outer-most index is the fastest running one, which corresponds to the following layout in memory # # ``` # a[0,0], a[1,0], a[0,1], a[1,1], a[0,2], a[1,2] # ``` # # i.e., # # ``` # a[0,0] -- a[0,1] -- a[0,2] # | | | | | # v ^ v ^ v # | | | | | # a[1,0] -- a[1,1] -- a[1,2] # ``` # # create like this # In[430]: b = np.array([[1,2,3], [4,5,6]], order='F') print('Row contiguous =', b[0,:].data.contiguous) print('Col contiguous =', b[:,0].data.contiguous) b.flags # ## Tensor product array: meshgrid # In[431]: x = np.linspace(0,3,4) y = np.linspace(0,2,3) X, Y = np.meshgrid(x,y) print('len(x) = ',len(x)) print('len(y) = ',len(y)) print('shape X= ',X.shape) print('shape Y= ',Y.shape) print('x = ', x) print('y = ', y) print('X = '); print(X) print('Y = '); print(Y) # If $x \in \re^m$ and $y \in \re^n$, then the output of `meshgrid(x,y)` is arranged like this # # $$ # X[i,j] = x[j], \qquad # Y[i,j] = y[i], \qquad 0 \le i \le n-1, \quad 0 \le j \le m-1 # $$ # # If we want the following arrangement # # $$ # X[i,j] = x[i], \qquad # Y[i,j] = y[j], \qquad 0 \le i \le m-1, \quad 0 \le j \le n-1 # $$ # # we have to do the following # In[432]: X, Y = np.meshgrid(x,y,indexing='ij') print('len(x) = ',len(x)) print('len(y) = ',len(y)) print('shape X= ',X.shape) print('shape Y= ',Y.shape) # The second form is useful when working with finite difference schemes on Cartesian grids, where we want to use `i` index running along x-axis and `j` index running along y-axis. # ## Reshaping arrays # In[433]: A = np.array([[1,2,3], [4,5,6]]) print(A) # In[434]: B = np.reshape(A,2*3,order='C') print(B) # In[435]: A1 = np.reshape(B,(2,3),order='C') print(A1) # In[436]: C = np.reshape(A,2*3,order='F') print(C) # In[437]: A2 = np.reshape(C,(2,3),order='F') print(A2) # ## Writing and reading files # Write an array to file # In[438]: A = np.random.rand(3,3) print(A) np.savetxt('A.txt',A) # Check the contents of the file in your terminal # ``` # cat A.txt # ``` # We can also print it from within the notebook # In[439]: get_ipython().system('cat A.txt') # Write two 1-D arrays as columns into file # In[440]: x = np.array([1.0,2.0,3.0,4.0]) y = np.array([2.0,4.0,6.0,8.0]) np.savetxt('data.txt',np.column_stack([x,y])) get_ipython().system('cat data.txt') # We can control the number of decimals saved, and use scientific notation # In[441]: np.savetxt('data.txt',np.column_stack([x,y]),fmt='%8.4e') get_ipython().system('cat data.txt') # We can read an existing file like this # In[442]: d = np.loadtxt('data.txt') print('Shape d =', d.shape) x1 = d[:,0] y1 = d[:,1] print('x =',x1) print('y =',y1) # ## Measuring time # # Loops are slow in Python and it is good to avoid them. The following example shows how to time code execution. # # Create some random matrices # In[443]: m = 1000 A = np.random.random((m,m)) B = np.random.random((m,m)) # First we add two matrices with an explicit for loop. # In[444]: get_ipython().run_cell_magic('timeit', '-r10 -n10', 'C = np.empty_like(A)\nfor i in range(m):\n for j in range(m):\n C[i,j] = A[i,j] + B[i,j]\n') # Now we use the + operator. # In[445]: get_ipython().run_cell_magic('timeit', '-r10 -n10', 'C = A + B\n') # The loop version is significantly slower.