In [97]:
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline

The problem¶

We observe some bacterial mutation times. We would like to use this data to infer whether these bacteria all share a single mutational time constant $\lambda$ ($H_1$), or if there are two types of bacteria, each with their own distinct mutational time constants $\lambda_1$ and $\lambda_2$ ($H_2$).

Fortunately, there's a nice framework for model comparison that we went through in lecture this week that will let us tackle this problem by computing the following ratio:

$$\frac{P(H_1 \mid D)}{P(H_2 \mid D)} $$

If this ratio is close to 1, then both hypotheses are about equally plausible. If it is much larger than 1, $H_1$ is more likely to underlie the data than $H_2$, and so on.

Before we get there, let's take a look at the class data and get a feel for what the problem will look like. On the homework you will use a personalized dataset of mutation times.

In [98]:
class_data = np.array([1.2, 2.1, 3.4, 4.1, 7, 11])

plt.figure()
plt.hist(class_data)
plt.xlim(0, 20)
plt.xlabel('time (min)')
plt.ylabel('mutations')
plt.show()

In this problem we assume that the probability of observing a mutation at time $t$ follows an exponential decay, parameterized by a mutational time constant $\lambda$, i.e.

$$P(\mathrm{observing~mutation~at~}t \mid \lambda) \propto e^{-t/\lambda}$$

Let's just plot this for different $\lambda$'s to get a sense.

If we overlaid the data, what would you guess $\lambda$ is, roughly?

In [99]:
ts = np.linspace(0, 25, 100)
lams = [0.05, 2, 20, 80]
fig, ax1 = plt.subplots()
for lam in lams:
  ax1.plot(ts, np.exp(-ts/lam), label=r'$\lambda = $'+f'{lam}')

ax2 = ax1.twinx()
ax2.hist(class_data, density=True, color='k', label='class data')
ax1.legend(loc='upper left', bbox_to_anchor=(1.03, 1), borderaxespad=0)
ax1.set_xlabel('$t$')
plt.title(r'$\exp(-t/\lambda)$')
ax1.set_ylim(0, 1)
ax2.set_yticks([])
plt.show()
In [100]:
def Z(lamda, a=0, b=15):
    # integral of exp(-t/lamda) from t=a to t=b, divided by lamda
    # (the factor of lamda is applied in likelihood() below)
    return np.exp(-a/lamda) - np.exp(-b/lamda)

def likelihood(datum, lamda):
    # normalized exponential density: exp(-datum/lamda) / [lamda * Z(lamda)]
    return np.exp(-datum/lamda) / Z(lamda) / lamda
In [101]:
lamda = np.linspace(0.01, 15, 100)  # grid of lambda values
In [105]:
# per-datum likelihood curves as a function of lambda, each normalized over the lambda grid
for t in [1.2, 2.1, 3.4, 11]:
    L = likelihood(t, lamda)
    plt.plot(lamda, L / L.sum())

plt.ylabel(r'$P(t_{i} \mid \lambda)$');
plt.xlabel(r'$\lambda$');
In [106]:
# product of the per-datum curves, renormalized over the grid: proportional to P(D | lambda)
joint = np.ones_like(lamda)
for t in [1.2, 2.1, 3.4, 11]:
    L = likelihood(t, lamda)
    joint *= L / L.sum()

plt.plot(lamda, joint / joint.sum())
plt.ylabel(r'$P(D \mid \lambda)$');
plt.xlabel(r'$\lambda$');
In [96]:
# per-datum curves (gray) overlaid with their renormalized product (magenta)
joint = np.ones_like(lamda)
for t in [1.2, 2.1, 3.4, 11]:
    L = likelihood(t, lamda)
    plt.plot(lamda, L / L.sum(), color='gray')
    joint *= L / L.sum()

plt.plot(lamda, joint / joint.sum(), color='magenta')
plt.ylabel(r'$P(\cdot \mid \lambda)$');
plt.xlabel(r'$\lambda$');
In [82]:
ts = np.linspace(0, 25, 100)
lams = [5]
fig, ax1 = plt.subplots()
for lam in lams:
  ax1.plot(ts, np.exp(-ts/lam), label=r'$\lambda = $'+f'{lam}')

ax2 = ax1.twinx()
ax2.hist(class_data, density=True, color='k', label='class data')
ax1.legend(loc='upper left', bbox_to_anchor=(1.03, 1), borderaxespad=0)
ax1.set_xlabel('$t$')
plt.title(r'$\exp(-t/\lambda)$')
ax1.set_ylim(0, 1)
ax2.set_yticks([])
plt.show()

Week 3 homework!¶

Back to the problem. We will be comparing the evidence for $H_1$ to the evidence for $H_2$:

$$\frac{P(H_1 \mid D)}{P(H_2 \mid D)} = \frac{P(D \mid H_1)P(H_1)}{P(D \mid H_2)P(H_2)} $$

If we assume a uniform prior over hypotheses, $P(H_1) = P(H_2)$, then

$$\begin{aligned} \frac{P(H_1 \mid D)}{P(H_2 \mid D)} &= \frac{P(D \mid H_1)}{P(D \mid H_2)} \\ &= \frac{\int_\lambda P(D \mid \lambda, H_1) P(\lambda \mid H_1) d\lambda}{ \int_{\lambda_1} \int_{\lambda_2} P(D \mid \lambda_1, \lambda_2, H_2) P(\lambda_1, \lambda_2 \mid H_2) d\lambda_1 d\lambda_2 } \end{aligned}$$

In this second step, we are marginalizing the numerator over the possible values of $\lambda$, and the denominator over the possible values of $\lambda_1$ and $\lambda_2$.

Now let's go through the numerator, which represents the evidence for $H_1$, and the denominator, the evidence for $H_2$, separately.

$H_1$: One mutation time constant $\lambda$¶

For a single bacterium, the probability of waiting a time $t$ before mutating follows an exponential decay:

$$P(t \mid \lambda, H_1) \propto e^{-t/\lambda}, \quad \text{i.e.} \quad P(t \mid \lambda, H_1) = c\, e^{-t/\lambda} $$

To get a proper probability density (and not just a proportionality) that integrates to 1 over all times (we consider a fixed interval from $t_-$ to $t_+$), let's figure out what that normalization constant $c$ must be.

$$\int_{t_-}^{t_+} P(t \mid \lambda, H_1)\, dt = 1 \implies \int_{t_-}^{t_+} c\, e^{-t/\lambda}\, dt = 1 \implies c = \frac{1}{\int_{t_-}^{t_+} e^{-t/\lambda}\, dt}$$

So, for a single bacterium:

$$\begin{aligned} P(t \mid \lambda, H_1) &= \frac{e^{-t/\lambda}}{\int_{t_-}^{t_+} e^{-t/\lambda} dt} \\ &= \frac{e^{-t/\lambda}}{Z(\lambda)} \end{aligned}$$

We'll call that denominator $Z(\lambda)$, as seen in class. It is a function of $\lambda$:

$$\begin{aligned} Z(\lambda) &= \int_{t_-}^{t_+} e^{-t/\lambda} dt \\ &= -\lambda \big(e^{-t_+/\lambda} - e^{-t_-/\lambda} \big) \\ &= \lambda \big(e^{-t_-/\lambda} - e^{-t_+/\lambda} \big) \end{aligned}$$
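As a quick numerical sanity check (my addition, using $t_- = 0$ and $t_+ = 15$ as in the code cell above), the closed form for $Z(\lambda)$ agrees with a direct Riemann-sum integration:

In [ ]:
# check the closed form for Z(lambda) against numerical integration (example values)
lam0, t_lo, t_hi = 3.0, 0.0, 15.0
Z_closed = lam0 * (np.exp(-t_lo/lam0) - np.exp(-t_hi/lam0))
t_grid = np.linspace(t_lo, t_hi, 100001)
dt = t_grid[1] - t_grid[0]
Z_numeric = np.sum(np.exp(-t_grid/lam0)) * dt
Z_closed, Z_numeric   # both ~2.98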

The data we have consists of multiple observed mutation times. We thus need the joint probability over our individual data points: $$\begin{aligned} P(D\mid \lambda, H_1) &= \prod_{i=1}^N P(t_i \mid \lambda, H_1) \\ &= \prod_{i=1}^N \frac{e^{-t_i/\lambda}}{Z(\lambda)} \\ &= \frac{e^{-\sum_i t_i/\lambda}}{[Z(\lambda)]^N} \\ \end{aligned}$$

We're almost there for the numerator! Now we need to specify $P(\lambda \mid H_1)$.

We ask you to assume a uniform prior for $\lambda$ within an interval (specified in the homework), $\lambda^-$ to $\lambda^+$:

$$ P(\lambda\mid H_1) = \left\{ \begin{array}{ll} \frac{1}{\lambda^{+}-\lambda^{-}} = \frac{1}{\sigma} & \lambda^{-}\leq\lambda\leq\lambda^{+}\\ 0 & \mbox{otherwise} \end{array} \right. $$

So, $$ \begin{aligned} P(D\mid H_1) &= \int_{\lambda} P(D\mid \lambda, H_1) P(\lambda\mid H_1)\, d\lambda\\ &= \int_{\lambda^-}^{\lambda^+} \frac{e^{-\sum_i t_i/\lambda}}{Z^N(\lambda)} \frac{1}{\lambda^{+}-\lambda^{-}}\, d\lambda\\ &= \frac{1}{\sigma}\int_{\lambda^-}^{\lambda^+} \frac{e^{-\sum_i t_i/\lambda}}{Z^N(\lambda)}\, d\lambda. \end{aligned} $$
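To make the structure of this integral concrete, here is a schematic grid sketch (my addition; the interval endpoints and the grid are placeholder values, and for the homework you will want the log-space version discussed below):

In [ ]:
# schematic grid approximation of P(D | H_1) -- illustration only; endpoints are placeholders
t_minus, t_plus = 0.0, 15.0          # assumed observation window
lam_minus, lam_plus = 0.01, 15.0     # assumed prior range for lambda

lam_grid = np.linspace(lam_minus, lam_plus, 1000)
dlam = lam_grid[1] - lam_grid[0]

def Z_h1(lam):
    # Z(lambda) = lambda * (exp(-t_minus/lambda) - exp(-t_plus/lambda))
    return lam * (np.exp(-t_minus/lam) - np.exp(-t_plus/lam))

# P(D | lambda, H_1) on the grid, then average over the uniform prior
like_H1 = np.exp(-class_data.sum()/lam_grid) / Z_h1(lam_grid)**len(class_data)
evidence_H1 = np.sum(like_H1) * dlam / (lam_plus - lam_minus)
evidence_H1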

$H_2$: Two mutation time constants $\lambda_1$, $\lambda_2$¶

Now we specify our second hypothesis: that there are two populations of bacteria, each with its own mutational time constant, either $\lambda_1$ or $\lambda_2$. The fraction of bacteria with time constant $\lambda_1$ is $\eta$.

So, we have a mixture of terms:

$$ P(t\mid \lambda_1,\lambda_2, H_2) = \eta \frac{e^{-t/\lambda_1}}{Z(\lambda_1)} + (1-\eta) \frac{e^{-t/\lambda_2}}{Z(\lambda_2)} $$

Let's see what this hypothesis describes with code:

In [ ]:
lam1 = 0.05
lam2 = 80
eta = 0.5

plt.figure()
plt.plot(ts, eta*np.exp(-ts/lam1) + (1-eta)*np.exp(-ts/lam2),
         label=r'$\eta, \lambda_1, \lambda_2 = $'+f'{eta}, {lam1}, {lam2}')
plt.title(r'$\eta ~\exp(-t/\lambda_1) + (1-\eta) \exp(-t/\lambda_2)$')
plt.legend(loc='upper left', bbox_to_anchor=(1.04, 1), borderaxespad=0)
plt.xlabel('$t$')
plt.ylim(0, 1)
plt.show()

Q: What happens if $\lambda_1$ and $\lambda_2$ are very close to each other? What is the utility of $H_2$ in this case over $H_1$?

Now let's compute the evidence,

$$ P(D \mid H_2) = \int_{\lambda_1} \int_{\lambda_2} P(D \mid \lambda_1, \lambda_2, H_2) P(\lambda_1, \lambda_2 \mid H_2) d\lambda_1 d\lambda_2 $$

Let's first write out the likelihood term:

$$ \begin{aligned} P(D \mid \lambda_1, \lambda_2, H_2) &= \prod_{i=1}^N P(t_i\mid \lambda_1,\lambda_2, H_2) \\ &= \prod_{i=1}^N \bigg[ \eta \frac{e^{-t_i/\lambda_1}}{Z(\lambda_1)} + (1-\eta) \frac{e^{-t_i/\lambda_2}}{Z(\lambda_2)} \bigg] \end{aligned} $$

And for the priors on $\lambda_1$ and $\lambda_2$, we will use uniform distributions on the intervals $[\lambda_1^-, \lambda_1^+)$ and $[\lambda_2^-, \lambda_2^+)$, respectively.

$$\begin{aligned} P(D\mid H_2) &= \int_{\lambda_1}\int_{\lambda_2} P(D\mid \lambda_1,\lambda_2, H_2) P(\lambda_1,\lambda_2\mid H_2)\, d\lambda_1 d\lambda_2\\ &= \int_{\lambda_1^-}^{\lambda_1^+}\int_{\lambda_2^-}^{\lambda_2^+} \prod_i \left[\eta \frac{e^{-t_i/\lambda_1}}{Z(\lambda_1)} + (1-\eta) \frac{e^{-t_i/\lambda_2}}{Z(\lambda_2)} \right] \frac{1}{\lambda_1^{+}-\lambda_1^{-}}\frac{1}{\lambda_2^{+}-\lambda_2^{-}}\, d\lambda_1 d\lambda_2\\ &= \frac{1}{\sigma_{1}\sigma_{2}}\int_{\lambda_1^-}^{\lambda_1^+}\int_{\lambda_2^-}^{\lambda_2^+} \prod_i \left[\eta \frac{e^{-t_i/\lambda_1}}{Z(\lambda_1)} + (1-\eta) \frac{e^{- t_i/\lambda_2}}{Z(\lambda_2)} \right] d\lambda_1 d\lambda_2 \end{aligned}$$
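Similarly, here is a schematic grid version of this double integral (my addition; $\eta$, the grids, and the interval endpoints are placeholder values, and the Z_h1 helper from the $H_1$ sketch above is reused). Again, for the homework you will want to do this in log space:

In [ ]:
# schematic grid approximation of P(D | H_2) -- illustration only; parameter values are placeholders
eta = 0.5                                  # assumed fraction of bacteria with time constant lambda_1
lam1_grid = np.linspace(0.01, 15.0, 200)
lam2_grid = np.linspace(0.01, 15.0, 200)
dlam1 = lam1_grid[1] - lam1_grid[0]
dlam2 = lam2_grid[1] - lam2_grid[0]

# broadcast to a 2D grid: axis 0 indexes lambda_1, axis 1 indexes lambda_2
L1 = lam1_grid[:, np.newaxis]
L2 = lam2_grid[np.newaxis, :]

like_H2 = np.ones((len(lam1_grid), len(lam2_grid)))
for t in class_data:
    like_H2 *= eta * np.exp(-t/L1) / Z_h1(L1) + (1 - eta) * np.exp(-t/L2) / Z_h1(L2)

# uniform priors contribute 1 / (width_1 * width_2)
width1 = lam1_grid[-1] - lam1_grid[0]
width2 = lam2_grid[-1] - lam2_grid[0]
evidence_H2 = np.sum(like_H2) * dlam1 * dlam2 / (width1 * width2)
evidence_H2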

There we have it! We have all we need to compute

$$\frac{P(H_1 \mid D)}{P(H_2 \mid D)} $$

Probabilities can be very small numbers¶

Calculating the probability of some data given a model usually requires multiplying many probability terms together:

$$ P(D\mid M) = \prod_{i=1}^N P(d_i\mid M). $$

This quantity easily underflows, which means that you are trying to calculate something smaller than the smallest positive number your computer can represent.

If you had a data set $D$ in which each individual datum had a probability on the order of $0.001$ (which is not such a small quantity), then the probability of all the data is

$$ P(D) = \left(10^{-3}\right)^{N} = 10^{-3N}. $$
In [108]:
## try it yourself!

10**(-323), 10**(-324)
Out[108]:
(1e-323, 0.0)
In [109]:
def flog(x):
    return np.log(x)
In [122]:
10**(-323)*10**(-322)
Out[122]:
0.0
In [115]:
x = np.linspace(1.05,100,1000)
plt.plot(x,flog(x))
Out[115]:
[<matplotlib.lines.Line2D at 0x7f46767cd0c0>]

The smallest double-precision floating point number¶

$$ \mbox{smallest number} \sim 10^{-323} $$

which means that after $N\sim 100$ data points,

$$ P(N=100) = 10^{-300} $$

the probability has become so small that soon you would not be able to distinguish a data set with $N=100$ measurements from another with $N=200$ points. In other words, when we try to calculate said probability we end up with 0 instead of what we know it to actually be: a really, really small number.

How do we get around this?

Working in log space¶

Working with the log of the probability is very useful for avoiding underflow problems: it expands the dynamic range, effectively giving you access to those small numbers that you couldn't represent before. Also, because the logarithm is a monotonically increasing function, maximizing the probability and maximizing the logarithm of the probability are the same task.

But working in log space can be helpful in many ways. Let's go back to our example:

$$ \log P(D\mid M) = \log \prod_{i=1}^N P(d_i\mid M) = \sum_{i=1}^N \log P(d_i\mid M). $$

If you are having trouble seeing why this is the case, remember that it is a property of logarithms that $\log(a_1 a_2) = \log(a_1) + \log(a_2)$. Convince yourself that this extends to $N$ elements, $\log(a_1 a_2 \cdots a_N) = \log(a_1) + \log(a_2) + \cdots + \log(a_N)$; once you are sold, it is trivial to see that $\log(a_1 a_2 \cdots a_N) = \sum_{i=1}^N \log(a_i)$.

If we go back to the previous example:

$$ \log P(N=100) = -300 * \log(10) = -690.776 $$

but

$$ \log P(N=200) = -600 \log(10) = -1381.551 $$

thus, the two cases are easily distinguishable in log space.

$$ \log P(N=200) - \log P(N=100) = -690.776 $$

or

$$ P(N=200) = e^{-690.776}\, P(N=100) $$
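A quick check in code (my addition): the direct product of 200 probabilities of $10^{-3}$ underflows to zero, while the sum of their logs is perfectly well behaved and matches $\log P(N=200)$ above:

In [ ]:
# direct product vs. sum of logs for 200 data points with probability 1e-3 each
probs = np.full(200, 1e-3)
np.prod(probs), np.sum(np.log(probs))   # (0.0, about -1381.55)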
In [ ]:
np.log(np.exp(1000)+np.exp(999))
/usr/local/lib/python3.7/dist-packages/ipykernel_launcher.py:1: RuntimeWarning: overflow encountered in exp
  """Entry point for launching an IPython kernel.
Out[ ]:
inf

Sometimes you describe your system with a mixture of probability distributions, for instance a mixture of Gaussian distributions or, as in our homework this week, a mixture of exponential distributions.

Since we are now working in log space, you end up having to do the following calculation: $\log(e^a + e^b)$.

If $a$ and $b$ are large and negative (as is the case when they represent log probabilities), then that calculation cannot be done directly. For instance, a naive calculation of $\log(e^{-1000} + e^{-999})$ will give you $-\infty$. And if we tried with large positive numbers, for instance $\log(e^{1000} + e^{999})$, we would get $+\infty$.

The way to do this calculation robustly is as follows, assume $a > b$, then

$$ \log(e^a + e^b) = \log \left(e^a ( 1 + e^{b-a})\right) = a + \log\left( 1 + e^{b-a}\right) $$

since $b-a < 0$, the exponential $e^{b-a} < 1$ never becomes a large number, and the calculation is robust.

Then you will calculate

$$ \log(e^{-1000} + e^{-999}) = -999 + \log(1+e^{-1}) = -999 + 0.31 = -998.69, $$

and

$$ \log(e^{1000} + e^{999}) = 1000 + \log(1+e^{-1}) = 1000 + 0.31 = 1000.31. $$

The log-sum-exp trick can be generalized to an arbitrary number $n$ of terms:

$$ \log(e^{a_1} + \ldots + e^{a_n}) = a_{\max} + \log\left(\sum_{i=1}^n e^{a_i - a_{\max}}\right), $$

where $a_{\max}$ is the maximum value of the set $\{a_1,\ldots, a_n\}$. (The term with $a_i = a_{\max}$ contributes $e^0 = 1$ to the sum, which is where the $1$ in the two-term formula above comes from.)

In [ ]:
from scipy.special import logsumexp
?logsumexp
In [ ]:
import numpy as np
np.logaddexp?
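Here is a minimal sketch (my addition) of the trick applied to the earlier examples, compared against scipy.special.logsumexp and np.logaddexp:

In [ ]:
from scipy.special import logsumexp

a = np.array([-1000.0, -999.0])
a_max = a.max()

naive  = np.log(np.sum(np.exp(a)))                  # exponentials underflow: gives -inf
manual = a_max + np.log(np.sum(np.exp(a - a_max)))  # log-sum-exp trick
naive, manual, logsumexp(a), np.logaddexp(a[0], a[1])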

How to integrate?¶

We want to find the area under the curves!

In [1]:
import numpy as np
import matplotlib.pyplot as plt
In [7]:
xs = np.linspace(0,1,int(1e7)) # define bins
dx = xs[1]-xs[0] # width of a bin
In [8]:
dx  # the width of a single bin
Out[8]:
1.00000010000001e-07
In [9]:
def g(x): # a function to integrate
    return x
In [10]:
plt.step(xs,g(xs))
Out[10]:
[<matplotlib.lines.Line2D at 0x7f603b371090>]
In [11]:
%%time
bin_vals = []
for x in xs: # For every value in our list of bins get the area of the particular bin by multiplying the height at that point by the width of the bin.
    bin_vals.append(x*dx)

print(np.sum(bin_vals)) # sum up all the areas.
0.5000000500000026
CPU times: user 2.07 s, sys: 492 ms, total: 2.56 s
Wall time: 2.56 s
In [12]:
%%time
np.sum(g(xs)*dx) # vectorized with numpy broadcasting: apply the operation to every entry of the array, then sum
CPU times: user 42 ms, sys: 28.4 ms, total: 70.4 ms
Wall time: 66.2 ms
Out[12]:
0.5000000500000026
In [13]:
def g(x): #Another function to integrate.
    return x**2
In [14]:
plt.step(xs,g(xs))
Out[14]:
[<matplotlib.lines.Line2D at 0x7f60168ee050>]
In [15]:
%%time
bin_vals = []
for x in xs:  # For every value in our list of bins get the area of the particular bin by multiplying the height at that point by the width of the bin.
    bin_vals.append(x**2 * dx)

np.sum(bin_vals) # sum up all the areas.
CPU times: user 2.68 s, sys: 183 ms, total: 2.86 s
Wall time: 2.87 s
Out[15]:
0.3333333833333404
In [16]:
%%time
np.sum(xs**2*dx) # vectorized with numpy broadcasting: apply the operation to every entry of the array, then sum
CPU times: user 51.9 ms, sys: 9.9 ms, total: 61.8 ms
Wall time: 63 ms
Out[16]:
0.3333333833333404

But what about higher dimensional integrals?¶

$$\int \int (x^2-y^2) dxdy$$

We don't want the area under the curve, we want the volume under the surface!

In [34]:
xs = np.linspace(10,11,10) # define bins
ys = np.linspace(0,1,10) # define bins
dx = xs[1]- xs[0] # width of a bin
dy = ys[1]- ys[0] # width of a bin
In [37]:
xs.shape
Out[37]:
(10,)
In [40]:
xs[:,np.newaxis]
Out[40]:
array([[10.        ],
       [10.11111111],
       [10.22222222],
       [10.33333333],
       [10.44444444],
       [10.55555556],
       [10.66666667],
       [10.77777778],
       [10.88888889],
       [11.        ]])
In [41]:
xs**2 - ys**2
Out[41]:
array([100.        , 102.22222222, 104.44444444, 106.66666667,
       108.88888889, 111.11111111, 113.33333333, 115.55555556,
       117.77777778, 120.        ])
In [39]:
xs[:,np.newaxis]**2 - ys**2
Out[39]:
array([[100.        ,  99.98765432,  99.95061728,  99.88888889,
         99.80246914,  99.69135802,  99.55555556,  99.39506173,
         99.20987654,  99.        ],
       [102.2345679 , 102.22222222, 102.18518519, 102.12345679,
        102.03703704, 101.92592593, 101.79012346, 101.62962963,
        101.44444444, 101.2345679 ],
       [104.49382716, 104.48148148, 104.44444444, 104.38271605,
        104.2962963 , 104.18518519, 104.04938272, 103.88888889,
        103.7037037 , 103.49382716],
       [106.77777778, 106.7654321 , 106.72839506, 106.66666667,
        106.58024691, 106.4691358 , 106.33333333, 106.17283951,
        105.98765432, 105.77777778],
       [109.08641975, 109.07407407, 109.03703704, 108.97530864,
        108.88888889, 108.77777778, 108.64197531, 108.48148148,
        108.2962963 , 108.08641975],
       [111.41975309, 111.40740741, 111.37037037, 111.30864198,
        111.22222222, 111.11111111, 110.97530864, 110.81481481,
        110.62962963, 110.41975309],
       [113.77777778, 113.7654321 , 113.72839506, 113.66666667,
        113.58024691, 113.4691358 , 113.33333333, 113.17283951,
        112.98765432, 112.77777778],
       [116.16049383, 116.14814815, 116.11111111, 116.04938272,
        115.96296296, 115.85185185, 115.71604938, 115.55555556,
        115.37037037, 115.16049383],
       [118.56790123, 118.55555556, 118.51851852, 118.45679012,
        118.37037037, 118.25925926, 118.12345679, 117.96296296,
        117.77777778, 117.56790123],
       [121.        , 120.98765432, 120.95061728, 120.88888889,
        120.80246914, 120.69135802, 120.55555556, 120.39506173,
        120.20987654, 120.        ]])
In [33]:
%%time
int_value = 0
bin_vals_x = []
for x in xs: # For every value in our list of bins in one axis
    bin_vals_y = []
    for y in ys: # For every value in our list of bins in  the other axis
        bin_vals_y.append((x**2-y**2)*dx*dy) # store the volume of this bin
        int_value += (x**2-y**2)*dx*dy # accumulate the running sum at every step
    bin_vals_x.append(bin_vals_y)
bin_vals_x = np.array(bin_vals_x) #create surface array
print(int_value) #value of the integral
135.802469135802
CPU times: user 0 ns, sys: 879 µs, total: 879 µs
Wall time: 933 µs
In [22]:
plt.imshow(bin_vals_x)
plt.colorbar()
Out[22]:
<matplotlib.colorbar.Colorbar at 0x7f6014822860>
In [23]:
%%time
surf = xs[:,np.newaxis]**2 - ys**2 # build the integrand on the 2D grid with numpy broadcasting; np.sum(surf)*dx*dy then gives the integral
CPU times: user 34 µs, sys: 20 µs, total: 54 µs
Wall time: 56.7 µs
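Summing that surface (my addition) reproduces the value obtained with the double loop above:

In [ ]:
np.sum(surf) * dx * dy   # same value as the double loop, ~135.8 on this coarse grid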

Try it yourself:

  • What does the slicing [:, np.newaxis] do to the numpy array being sliced?
  • How does the operation propagate?
In [ ]:
(ys**2)[:,np.newaxis] - xs**2
Out[ ]:
array([[ 0.        , -0.01234568, -0.04938272, -0.11111111, -0.19753086,
        -0.30864198, -0.44444444, -0.60493827, -0.79012346, -1.        ],
       [ 0.01234568,  0.        , -0.03703704, -0.09876543, -0.18518519,
        -0.2962963 , -0.43209877, -0.59259259, -0.77777778, -0.98765432],
       [ 0.04938272,  0.03703704,  0.        , -0.0617284 , -0.14814815,
        -0.25925926, -0.39506173, -0.55555556, -0.74074074, -0.95061728],
       [ 0.11111111,  0.09876543,  0.0617284 ,  0.        , -0.08641975,
        -0.19753086, -0.33333333, -0.49382716, -0.67901235, -0.88888889],
       [ 0.19753086,  0.18518519,  0.14814815,  0.08641975,  0.        ,
        -0.11111111, -0.24691358, -0.40740741, -0.59259259, -0.80246914],
       [ 0.30864198,  0.2962963 ,  0.25925926,  0.19753086,  0.11111111,
         0.        , -0.13580247, -0.2962963 , -0.48148148, -0.69135802],
       [ 0.44444444,  0.43209877,  0.39506173,  0.33333333,  0.24691358,
         0.13580247,  0.        , -0.16049383, -0.34567901, -0.55555556],
       [ 0.60493827,  0.59259259,  0.55555556,  0.49382716,  0.40740741,
         0.2962963 ,  0.16049383,  0.        , -0.18518519, -0.39506173],
       [ 0.79012346,  0.77777778,  0.74074074,  0.67901235,  0.59259259,
         0.48148148,  0.34567901,  0.18518519,  0.        , -0.20987654],
       [ 1.        ,  0.98765432,  0.95061728,  0.88888889,  0.80246914,
         0.69135802,  0.55555556,  0.39506173,  0.20987654,  0.        ]])
In [ ]:
plt.imshow(surf)
Out[ ]:
<matplotlib.image.AxesImage at 0x7f8de0afdf10>

Don't know where to start with the homework? Or getting confused by the log computations?¶

Try starting here

In [ ]:
def Z(lam, tmin, tmax):
    return lam * (np.exp(-tmin/lam) - np.exp(-tmax/lam))

## TODO FOR YOU, FOR HOMEWORK
## YOU'LL REALLY WANT TO USE LOGS TO COMPUTE THINGS
def logZ(lam, tmin, tmax):
    return 

# check if similar:
np.isclose(Z(3, 0.05, 80), np.exp(logZ(3, 0.05, 80)))