import numpy as np # import the numpy package


a = np.array([1, 2, 3])  # Create a rank 1 array (1D array)
a

array([1, 2, 3])


type(a)

numpy.ndarray


b = np.array([[1,2,3],[4,5,6]]) #Create 2D array 
b

array([[1, 2, 3],
       [4, 5, 6]])


np.mean(b)

3.5


a = np.random.random(100000000)


%%time
x = np.sum(a)

CPU times: user 72.4 ms, sys: 0 ns, total: 72.4 ms
Wall time: 73.8 ms


%%time
x = 0 
for element in a:
  x = x + element

CPU times: user 15.9 s, sys: 36.2 ms, total: 15.9 s
Wall time: 16 s


x = np.array([[1,2],[3,4]], dtype=np.float64)
y = np.array([[5,6],[7,8]], dtype=np.float64)

# Elementwise sum; both produce the array
# [[ 6.  8.]
#  [10. 12.]]
print(x + y)
print(np.add(x, y))

[[ 6.  8.]
 [10. 12.]]
[[ 6.  8.]
 [10. 12.]]


# Elementwise difference; both produce the array
# [[-4. -4.]
#  [-4. -4.]]
print(x - y)
print(np.subtract(x, y))

[[-4. -4.]
 [-4. -4.]]
[[-4. -4.]
 [-4. -4.]]


# Elementwise product (not a matrix product); both produce the array
# [[ 5. 12.]
#  [21. 32.]]
print(x * y)
print(np.multiply(x, y))

[[ 5. 12.]
 [21. 32.]]
[[ 5. 12.]
 [21. 32.]]


# Elementwise division; both produce the array
# [[ 0.2         0.33333333]
#  [ 0.42857143  0.5       ]]
print(x / y)
print(np.divide(x, y))

[[0.2        0.33333333]
 [0.42857143 0.5       ]]
[[0.2        0.33333333]
 [0.42857143 0.5       ]]


# Elementwise square root; produces the array
# [[ 1.          1.41421356]
#  [ 1.73205081  2.        ]]
print(np.sqrt(x))

[[1.         1.41421356]
 [1.73205081 2.        ]]


# Elementwise exponential power; produces array 
#[[ 2.71828183  7.3890561 ]
#[20.08553692 54.59815003]]
print(np.exp(x))

[[ 2.71828183  7.3890561 ]
 [20.08553692 54.59815003]]


np.round(np.exp(x)) # Round each element; with no `decimals` argument the result is rounded to whole numbers.

array([[ 3.,  7.],
       [20., 55.]])


np.ceil(np.exp(x)) #Return the ceiling of the input, element-wise.

array([[ 3.,  8.],
       [21., 55.]])


np.floor(np.exp(x)) #Return the floor of the input, element-wise.

array([[ 2.,  7.],
       [20., 54.]])


import numpy as np
x = np.array([[1,2],[3,4]])
y = np.array([[5,6],[7,8]])

v = np.array([9,10])
w = np.array([11, 12])

print(x)

print(y)

print(v)

print(w)

[[1 2]
 [3 4]]
[[5 6]
 [7 8]]
[ 9 10]
[11 12]


# Inner product of vectors; both produce 219
print(v.dot(w))
print(np.dot(v, w))

219
219


print(v @ w)

219


m1 = np.ones((5,3))
m1

array([[1., 1., 1.],
       [1., 1., 1.],
       [1., 1., 1.],
       [1., 1., 1.],
       [1., 1., 1.]])


m2 = np.ones((3,2))
m2

array([[1., 1.],
       [1., 1.],
       [1., 1.]])


m1@m2

array([[3., 3.],
       [3., 3.],
       [3., 3.],
       [3., 3.],
       [3., 3.]])


x = np.array([[1, 2], [3, 4], [5, 6]])

print(x)

[[1 2]
 [3 4]
 [5 6]]


print(np.min(x))  # Show min of all elements; prints "1"

1


print(np.max(x))  # Show max of all elements; prints "6"

6


print(np.mean(x))  # Compute the mean of all elements; prints "3.5"

3.5


print(np.median(x))  # Compute the median of all elements; prints "3.5"

3.5


print(np.quantile(x, 0.75))  # Compute the 3rd quartile of all elements; prints "4.75"

4.75


print(np.std(x))  # Compute the standard deviation of all elements; prints "1.707825127659933"

1.707825127659933


print(np.sum(x))  # Compute sum of all elements; prints "21"

21


print(np.cumsum(x))  # Compute the running (cumulative) sum over the flattened array; prints "[ 1  3  6 10 15 21]"

[ 1  3  6 10 15 21]


a = np.array([0.45959958, 0.1613048 , 0.76000473, 0.07536241, 0.60232491,
       0.00167602, 0.71653501, 0.40927931, 0.78030462, 0.15509362])
b = np.array([7.17485455, 5.50089164, 7.35266241, 5.64972889, 7.62871573,
       5.01298309, 7.57177999, 6.81378627, 7.3785654 , 5.79279215])


np.cov(a,b)

array([[0.08872592, 0.28013513],
       [0.28013513, 0.98124247]])


np.corrcoef(a,b)

array([[1.        , 0.94941078],
       [0.94941078, 1.        ]])


x = np.array([[1, 2], [5, 3], [4, 6]])

print(np.max(x, axis=0))  # Compute max of each column; prints "[5 6]"

[5 6]


print(np.max(x, axis=1))  # Compute max of each row; prints "[2 5 6]"

[2 5 6]


print(np.mean(x, axis=1))  # Compute mean of each row; prints "[1.5 4.  5. ]"

[1.5 4.  5. ]

a

array([0.45959958, 0.1613048 , 0.76000473, 0.07536241, 0.60232491,
       0.00167602, 0.71653501, 0.40927931, 0.78030462, 0.15509362])


np.sort(a) #from smallest to largest

array([0.00167602, 0.07536241, 0.15509362, 0.1613048 , 0.40927931,
       0.45959958, 0.60232491, 0.71653501, 0.76000473, 0.78030462])


np.sort(a)[::-1] #from largest to smallest

array([0.78030462, 0.76000473, 0.71653501, 0.60232491, 0.45959958,
       0.40927931, 0.1613048 , 0.15509362, 0.07536241, 0.00167602])


np.random.shuffle(a)
a

array([0.00167602, 0.60232491, 0.45959958, 0.71653501, 0.15509362,
       0.40927931, 0.78030462, 0.07536241, 0.1613048 , 0.76000473])


ex2 = np.random.random(10)
ex2

array([0.06354225, 0.25978659, 0.71671978, 0.00627995, 0.30814461,
       0.72897845, 0.51545988, 0.57818907, 0.69467508, 0.42554708])


print(ex2.min())
print(np.quantile(ex2,0.25))
print(np.median(ex2))
print(np.quantile(ex2,0.75))
print(np.max(ex2))

0.006279953666841864
0.27187609181029326
0.47050348192359215
0.6655535802201438
0.7289784495557392


x1 = np.random.random(10) #create one dimensional array
x1

array([0.84473521, 0.25480532, 0.04202275, 0.97207065, 0.17375351,
       0.76710637, 0.48383864, 0.51858609, 0.64259706, 0.54944136])


x1[0]

0.8447352143549912


x1[4]

0.17375350556132374


x1[0:2]

array([0.84473521, 0.25480532])


x1[len(x1)-1] # accessing the last entry via its explicit position

0.5494413589911319


x1[-1]

0.5494413589911319


x1[-2]

0.6425970578161072


# Create the following rank 2 array with shape (3, 4)
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
a

array([[ 1,  2,  3,  4],
       [ 5,  6,  7,  8],
       [ 9, 10, 11, 12]])


# Use integer indexing to pull out the first entry (row 0, column 0)
a[0,0]

1


# Use integer indexing to pull out the element in the 2nd row and 3rd column
# (indices are 0-based, hence a[1, 2])
a[1,2]

7


# Three ways to select the second row of a. They differ in the rank of the
# result and in whether the result shares memory with a.
row_r1 = a[1, :]    # Integer index + slice: rank 1 view of the second row of a  
row_r2 = a[1:2, :]  # Slices only: rank 2 view of the second row of a
row_r3 = a[[1], :]  # Integer-list index: rank 2 copy (not a view) of the second row of a
print(row_r1, row_r1.shape)
print(row_r2, row_r2.shape)
print(row_r3, row_r3.shape)

[5 6 7 8] (4,)
[[5 6 7 8]] (1, 4)
[[5 6 7 8]] (1, 4)


# We can make the same distinction when accessing columns of an array:
col_r1 = a[:, 1]
col_r2 = a[:, 1:2]
print(col_r1, col_r1.shape)
print()
print(col_r2, col_r2.shape)

[ 2  6 10] (3,)

[[ 2]
 [ 6]
 [10]] (3, 1)


# Use slicing to pull out the subarray consisting of the first 2 rows
# and columns 1 and 2; b is the following array of shape (2, 2):
# [[2 3]
#  [6 7]]
b = a[:2, 1:3]
print(b)

[[2 3]
 [6 7]]


a = np.array([[1,2], [3, 4], [5, 6]])

a

array([[1, 2],
       [3, 4],
       [5, 6]])


# An example of integer array indexing.
# The row indices [0, 1, 2] are paired with the column indices [0, 1, 0], so
# the returned array has shape (3,) and holds a[0, 0], a[1, 1] and a[2, 0].
print(a[[0, 1, 2], [0, 1, 0]])

# The above example of integer array indexing is equivalent to this:
print(np.array([a[0, 0], a[1, 1], a[2, 0]]))

[1 4 5]
[1 4 5]


a = np.arange(0,10,1)
a

array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9])


a[1]

1


a[0:5]

array([0, 1, 2, 3, 4])


ex_32 = np.array([[12,  5,  2],
       [ 7,  6,  8]])
ex_32

array([[12,  5,  2],
       [ 7,  6,  8]])


ex_32[:,2]

array([2, 8])


ex_32[:,0:2]

array([[12,  5],
       [ 7,  6]])


# A slice is a view into the original array: b shares its data with a, so
# writing through b is visible through a as well.
# The arrays are rebuilt here so the cell does not depend on whatever a and b
# were bound to by earlier cells.
a = np.array([[1,2,3,4], [5,6,7,8], [9,10,11,12]])
b = a[:2, 1:3]  # first two rows, columns 1 and 2 of a
print(a[0, 1])  # prints "2"
b[0, 0] = 77    # b[0, 0] is the same piece of data as a[0, 1]
print(a[0, 1])  # prints "77"

2
77


a = np.array([3,4,5])
a

array([3, 4, 5])


a[1] = 121342141
a

array([        3, 121342141,         5])


ex_32 = np.array([[12,  5,  2],
       [ 7,  6,  8]])
ex_32

array([[12,  5,  2],
       [ 7,  6,  8]])


ex_32[0,0] = 3


ex_32

array([[3, 5, 2],
       [7, 6, 8]])


ex_32[1,:] = np.array([1,6,5])
ex_32

array([[3, 5, 2],
       [1, 6, 5]])


a = np.array([[1,2], [3, 4], [5, 6]])

a

array([[1, 2],
       [3, 4],
       [5, 6]])


bool_idx = (a > 2)  # Find the elements of a that are bigger than 2;
                    # this returns a numpy array of Booleans of the same
                    # shape as a, where each slot of bool_idx tells
                    # whether that element of a is > 2.

print(bool_idx)

[[False False]
 [ True  True]
 [ True  True]]


# We use boolean array indexing to construct a rank 1 array
# consisting of the elements of a corresponding to the True values
# of bool_idx
print(a[bool_idx])

# We can do all of the above in a single concise statement:
print(a[a > 2])

[3 4 5 6]
[3 4 5 6]


bbb = np.random.random(5)

bbb

array([0.93669359, 0.86031809, 0.59110717, 0.06983715, 0.5498046 ])


bbb[bbb>0.4]

array([0.93669359, 0.86031809, 0.59110717, 0.5498046 ])


# Sample of 50 observations used for the outlier exercise.
data = np.array([0.59910553,0.19892384,0.42800147,0.67696757,0.34828451,0.69517928,
0.13703289,0.51119015,0.48787451,0.57731085,0.23286820,0.41338543,
0.65633721,1.35069021,0.12212476,0.47460029,0.26618002,1.20542218,
0.71538627,0.20428730,0.13221638,0.56680370,0.32725263,0.29339787,
0.07488558,0.51300380,0.08008302,0.14898439,1.71885703,0.09566642,
0.85223586,0.45847046,0.23882542,0.41942143,0.54160489,0.48413253,
0.62215659,1.83152943,0.10104083,0.92777223,0.25699445,0.22967180,
0.40207172,0.13048873,0.36742793,0.28115245,1.95182640,1.61350926,
0.57133538,0.20487397])


# 1.5 * IQR rule: a value is flagged as an outlier when it lies more than
# 1.5 interquartile ranges below the first quartile or above the third.
q1, q3 = np.quantile(data, [0.25, 0.75])
iqr = q3 - q1
lower = q1 - 1.5 * iqr
upper = q3 + 1.5 * iqr

# Boolean mask selecting everything outside the [lower, upper] fences.
data[(data < lower) | (data > upper)]

array([1.35069021, 1.20542218, 1.71885703, 1.83152943, 1.9518264 ,
       1.61350926])


a = np.array([4, 3, 5, 7, 6, 8])


indices = [0, 1, 4]
np.take(a, indices)

array([4, 3, 6])


a[[0, 1, 4]]

array([4, 3, 6])


b  = np.array([[2,6,8],[5,12,17]])
b

array([[ 2,  6,  8],
       [ 5, 12, 17]])


np.take(b,[1],axis = 0)

array([[ 5, 12, 17]])


np.take(b,[1],axis = 1)

array([[ 6],
       [12]])

a

array([4, 3, 5, 7, 6, 8])


np.put(a, [0], 189)
a

array([189,   3,   5,   7,   6,   8])


a[0] = 189


x = np.array([[1, 2], [3, 4], [5, 6]])

print(x)
print("transpose\n", x.T)

[[1 2]
 [3 4]
 [5 6]]
transpose
 [[1 3 5]
 [2 4 6]]


v = np.array([[1,2,3]])
print(v )
print("transpose\n", v.T)

[[1 2 3]]
transpose
 [[1]
 [2]
 [3]]


w = np.array([[1],[2],[3]])
print(w)
w.shape

[[1]
 [2]
 [3]]

(3, 1)


y = w.reshape(-1,)
print(y)
y.shape

[1 2 3]

(3,)


z = w.squeeze()
print(z)
z.shape

[1 2 3]

(3,)


y.reshape((-1,1))

array([[1],
       [2],
       [3]])


x=np.array([[1,2],[3,4]])  
y=np.array([[12,30]]) 
print(x)
print(y)

[[1 2]
 [3 4]]
[[12 30]]


z=np.concatenate((x,y))  
z

array([[ 1,  2],
       [ 3,  4],
       [12, 30]])


x=np.array([[1,2],[3,4]])  
y=np.array([[12,30]])  
z=np.concatenate((x,y), axis=0)  
z

array([[ 1,  2],
       [ 3,  4],
       [12, 30]])


x=np.array([[1,2],[3,4]])  
y=np.array([[12],[30]])  
x
y

array([[12],
       [30]])


z=np.concatenate((x,y), axis=1)  
z

array([[ 1,  2, 12],
       [ 3,  4, 30]])


x=np.array([[1,2],[3,4]])  
y=np.array([[12,30]])  
z=np.concatenate((x,y.T), axis=1)  #take the transpose to create a column array
z

array([[ 1,  2, 12],
       [ 3,  4, 30]])


np.random.randint(1,5,2) # (low, high, size): 2 random integers with low included and high excluded, i.e. from 1 to 4

array([3, 1])


np.random.randint(3,15,4) # (low, high, size): 4 random integers with low included and high excluded, i.e. from 3 to 14

array([13, 14, 13, 14])


np.random.seed(456)
np.random.random(5)

array([0.24875591, 0.16306678, 0.78364326, 0.80852339, 0.62562843])


np.random.random(5)

array([0.60411363, 0.8857019 , 0.75911747, 0.18110506, 0.15016932])


np.random.seed(456)
np.random.random(5)

array([0.24875591, 0.16306678, 0.78364326, 0.80852339, 0.62562843])

Stat 112 - Recitation 7

Introduction to Numpy

Basic Operators

Exercise 1

Mathematical and Statistical Functions

Exercise 2

Array Indexing and Slicing

Exercise 3.1

Exercise 3.2

Exercise 4

Exercise 5

Manipulating Array

Exercise 6

Quiz 4