from IPython.core.display import HTML

def _set_css_style(css_file_path):
    """
    Read the custom CSS file and load it into Jupyter.

    Parameters
    ----------
    css_file_path
        Path to the CSS file to read.

    Returns
    -------
    HTML
        The file's text wrapped in a ``<style>`` element.

    Raises
    ------
    OSError
        If the file cannot be opened or read.
    """
    # Use a context manager so the file handle is closed as soon as the text
    # has been read, instead of being left for the garbage collector.
    with open(css_file_path, "r") as css_file:
        styles = css_file.read()
    return HTML('<style>%s</style>' % styles)

# Build the <style> wrapper for the slide stylesheet.
# NOTE(review): the return value is not assigned or displayed here; presumably
# it is meant to be rendered as the output of a notebook cell - confirm.
_set_css_style('rise.css')

import numpy as np
# The same 2x2 data held two ways: a nested Python list and a numpy array.
L = [[0,1],[2,3]]
A = np.array(L)

print("L:",L)
print("A:\n",A)

print(type(L),type(A))

# id() returns an object's identity; in CPython that is its memory address,
# so differences between ids are distances in memory.
print(id(L))

# Distance between the two inner list objects (the rows of L).
print(id(L[1])-id(L[0])) # rows are far away

# Distance between the two int objects stored in the first row.
print(id(L[0][1])-id(L[0][0])) # columns not so much

# Basic array attributes, shown on a 1-D array of four integers.
# NOTE(review): the bare expressions below print nothing by themselves;
# presumably each one is meant to be displayed as a notebook cell result.
A = np.array([1,2,3,4])
A.dtype # type of what is stored in the array - NOT python types!

A.ndim # number of dimensions (called axes in numpy)

A.shape # size of the dimensions as a tuple

A.reshape((4,1)).shape # a column vector

# Rebind A to the 4x1 column so the two indexing forms below can be compared.
A = np.array([1,2,3,4]).reshape(4,1)

A[0] # a single index on a 2-D array selects a whole row (here a length-1 array)

A[0,0] # one index per axis selects a single element

# can initialize an array with a list, or list of lists (or list of lists of lists, etc)
# the single float literal (6.0) makes numpy store every element as floating point
M = np.array([[1,2,3], [4,5,6.0]])
print(M.dtype, M.shape)

# if you know the size, but not the data, you can initialize to zeros:
Z = np.zeros((10,10))
# or ones
O = np.ones((5,10))
# or identity
I = np.identity(3) # this makes a 3x3 square identity matrix

print(Z.dtype) # note, default type is floating point

# the second argument of np.zeros selects the element type
Z = np.zeros((10,10),np.int64) # can change type
print(Z.dtype)

# Arithmetic operators act elementwise on arrays of matching shape.
x = np.array([1, 2, 3])
y = np.array([3, 2, 1])
x + y

# Shapes (3,) and (4,) cannot be broadcast together, so this addition raises
# ValueError. The error is caught and reported so that the demonstration is
# still visible without aborting every statement that follows when the file
# is executed top to bottom as a script.
z = np.array([1, 1, 1, 1])
try:
    x + z
except ValueError as err:
    print("ValueError:", err)

# A scalar operand is applied to every element.
x = np.array([1, 2, 3])
3 * x

# Multiplication is elementwise, not a dot product.
x * x

# Exponentiation and division are elementwise as well.
y = np.array([2, 2, 2])
x**y

x/y

# A 2x3 array used for the indexing examples below.
M = np.array([[0,1,2],[3,4,5]])
M

print(M[1,1])  # indexing: row 1, column 1 (both zero-based)
print(M[0,-1]) # last item of first row

print(M[0,1:]) # can have slices - all but first column of first row

# Both expressions select the whole second row.
print(M[1], M[1,:]) # missing indices are treated as complete slices

# M is a plain nested list here, not a numpy array.
M = [[0,1,2],[3,4,5]]

# Lists accept only integers or slices as indices, so the tuple index (1, 1)
# raises TypeError. The error is caught and reported so the demonstration is
# still visible without aborting every statement that follows when the file
# is executed top to bottom as a script. (The list spelling is M[1][1].)
try:
    M[1, 1]
except TypeError as err:
    print("TypeError:", err)

A = np.array([0,1,4,9,16,25])

# Indexing with a list of integers picks out exactly those positions.
print(A[[2,5]]) # choose just indices 2 and 5

# A comparison is evaluated elementwise and yields a boolean array (a mask).
b = A > 4
print(b)

# Indexing with the mask keeps only the elements where it is True.
print(A[b])

# Assigning through the mask overwrites just the selected elements of A.
print("b =",b)
A[b] = 0

print(A)

# The same mask-assignment pattern on an array of strings: every element
# that is not 'a' is replaced by 'z'.
S = np.array(['a','b','c','b','a'])
S[S != 'a'] = 'z'

S

A = np.array([[0,1,2],[3,4,5],[6,7,8]])

B = A   # A and B reference the *same* object
A is B

# B is just another name for A, so the write is visible through A.
B[0,0] = 1000
A

# A basic slice returns a view that shares A's data instead of copying it.
row = A[1,:]
row

row[2] = 5000 # writes through the view, so A[1,2] changes too
A

newMat = A.copy() # this will actually copy the data
newMat[0,0] = 0 # only the copy is modified
A

newMat

# Boolean (advanced) indexing returns a new array, not a view.
A = np.array([[0,1,2],[3,4,5],[6,7,8]])
B = A[A > 4]
B

B[:] = -1 # fills the copy only
B

A # unchanged by the write to B

# Used as an assignment target, the same mask does modify A in place.
A[A > 4] = -1
A

def z(M):
    """Set every element of ``M`` to 0 in place; nothing is returned."""
    everything = slice(None)  # the same selection a bare ``:`` subscript makes
    M[everything] = 0
# z() assigns through M[:], so the array passed in is modified in place.
A = np.array([1,2,3])
z(A)
A

# numpy functions also accept plain Python lists.
A = [1,2,3,4]
np.mean(A)

np.sum(A)

np.sin(A) # applied elementwise

# A 3x4 array holding 0..11, used to show the axis argument.
b = np.arange(12).reshape(3,4)
b

np.sum(b) # no axis given: sum over every element

np.sum(b, axis=0) # sum along axis 0 (down the rows): one total per column

np.sum(b, axis=1) # sum along axis 1 (across the columns): one total per row

# Three attempts at loading the same CSV file.
# 1) Defaults: fields are split on whitespace and parsed as floats.
np.genfromtxt('../files/Spellman.csv')

# 2) Comma-delimited, still parsed as floats; fields that are not numbers
#    come back as nan.
np.genfromtxt('../files/Spellman.csv', delimiter=',')

# 3) Comma-delimited with every field kept as a string, so text fields survive.
strdata = np.genfromtxt('../files/Spellman.csv', dtype=str, delimiter=',')
strdata

# Split the string table into its parts.
# NOTE(review): presumably the first row holds time points and the first
# column holds gene names - confirm against the data file.
# first row without its first cell, converted to int
header = strdata[0,1:].astype(int)
# first column without its first cell, left as strings
genes = strdata[1:,0]
# everything else, converted to float
values = strdata[1:,1:].astype(float)

len(strdata), len(strdata[0]) # (number of rows, number of columns)

genes.shape

# Min-max scaling: the global minimum maps to 0 and the global maximum to 1.
(values-values.min())/(values.max()-values.min())

# Standardize with the global mean and standard deviation, then take the
# standard deviation of the result (expected to be 1 up to rounding).
np.std((values-values.mean())/values.std())

# Read the raw text of the CSV file as a list of lines. The with-block closes
# the file handle as soon as the lines are in memory instead of leaving it
# open for the rest of the session.
with open('../files/Spellman.csv') as f:
    lines = f.readlines()
# Show the first two lines of the file.
print(lines[0])
print(lines[1])

import numpy as np
import matplotlib.pyplot as plt
# Parse the first two raw lines by hand: drop the newline, split on commas,
# skip the first field and convert the remaining fields to floats.
times = np.array(lines[0].replace('\n', '').split(',')[1:], float)
exps = np.array(lines[1].replace('\n', '').split(',')[1:], float)
plt.plot(times, exps);

import matplotlib.pyplot as plt
#bins = [-3,-2,-1,0,1,2,3]
#bins = np.linspace(-3,3,100)
# Histogram of the first value column, with 100 automatically placed bins.
plt.hist(values[:,0],bins=100);

# Same for the last value column.
plt.hist(values[:,-1],bins=100);

# Overlay the first and last columns, semi-transparent, in one figure.
# NOTE(review): the first histogram uses the explicit edges in `bins`
# (100 edges from -3 to 3) while the second uses bins=100 over its own data
# range, so the two are binned differently - confirm whether bins=bins was
# intended for both.
bins = np.linspace(-3,3,100)
plt.hist(values[:,0],bins=bins, alpha=0.5,label="ts-40")
plt.hist(values[:,-1],bins=100,alpha=0.5,label="ts-260")
plt.legend(loc="best");
plt.xlabel("Expression", size=14)
plt.ylabel("Number of Instances", size=14)

# Distribution of the per-row mean (average over the columns of each row).
plt.hist(values.mean(axis=1),bins=100);

# Per-column mean (average over all rows) plotted against the header values.
plt.plot(header,values.mean(axis=0))
plt.xlabel("Time",size=14)
plt.ylabel("Avg. Expression",size=14);

# Split the rows by the sign of their first-column value and plot each
# group's per-column mean. Rows whose first value is exactly 0 (or nan) fall
# into neither group.
plt.plot(header,(values[values[:,0]>0]).mean(axis=0),label="positive")
plt.plot(header,(values[values[:,0]<0]).mean(axis=0),label="negative");
plt.xlabel("Time",size=14)
plt.ylabel("Avg. Expression",size=14)
plt.legend()

`numpy`: arrays and functions

Arrays

Array memory layout

Array memory

Why does this matter?

Creating `numpy` arrays

Definitions of dimensions

Initializing `numpy` arrays

`numpy` arrays behave like vectors

More math with arrays

Indexing and slicing

What is `M[1,1]`?

Advanced slicing: integers

Advanced slicing: boolean

Slicing assignment

What is the new value of `S`?

Array views vs. copies

Views

Sliced views

Explicit copy

Advanced slices copy

What is the value of `A` after this function call?

Functions on arrays

Axes

Loading data

Loading data

Data normalization

Activity: Expression data

For next time

numpy: arrays and functions

Arrays

Array memory layout

Array memory

Why does this matter?

Creating numpy arrays

Definitions of dimensions

Initializing numpy arrays

numpy arrays behave like vectors

More math with arrays

Indexing and slicing

What is M[1,1]?

Advanced slicing: integers

Advanced slicing: boolean

Slicing assignment

What is the new value of S?

Array views vs. copies

Views

Sliced views

Explicit copy

Advanced slices copy

What is the value of A after this function call?

Functions on arrays

Axes

Loading data

Loading data

Data normalization

Activity: Expression data

For next time

`numpy`: arrays and functions

Creating `numpy` arrays

Initializing `numpy` arrays

`numpy` arrays behave like vectors

What is `M[1,1]`?

What is the new value of `S`?

What is the value of `A` after this function call?