import os

import numpy as np
import skimage.io
import colorcet

import bi1x

# This is the single molecule kinetics module
from bi1x import smk

import iqplot

import bokeh.plotting
import bokeh.io

# Address of the running notebook; handed to bokeh.io.show for interactive plots
notebook_url = 'localhost:8888'

# Send Bokeh output to the notebook
bokeh.io.output_notebook()


# Time between consecutive frames
dt = 0.5  # minutes

# Folder holding the 2016 images
img_dir = "practice_2016"

# Sorted directory listing, so the frames come out in the right order
flist = sorted(os.listdir(img_dir))

# Read every file whose name ends in ".tif" into a list of images
ic = [
    skimage.io.imread(os.path.join(img_dir, name))
    for name in flist
    if name.endswith(".tif")
]


def gray_mapper():
    """Return a fresh linear color mapper built from colorcet's gray palette."""
    return bokeh.models.LinearColorMapper(colorcet.gray)


# Show the first image in full
bokeh.io.show(bi1x.viz.imshow(ic[0], color_mapper=gray_mapper()))


# Index expression selecting the first 200 rows and first 200 columns
inds = np.s_[:200, :200]

# Show only that sub-image of the first frame
bokeh.io.show(bi1x.viz.imshow(ic[0][inds], color_mapper=gray_mapper()))


# Radius passed to smk when building and checking ROIs
roi_radius = 5


# Sub-images of frames 0 and 63, laid out side by side
bokeh.io.show(
    bokeh.layouts.row(
        *[
            bi1x.viz.imshow(ic[k][inds], color_mapper=gray_mapper(), frame_height=200)
            for k in (0, 63)
        ]
    )
)


# Indices of the good frames, plus the coefficient of variation of each frame
gf, covs = smk.good_frames(ic, 0.95, return_covs=True)


# Coefficient of variation against frame number
p = bokeh.plotting.figure(
    x_axis_label='frame number',
    y_axis_label='coefficient of variation',
    frame_height=200,
    frame_width=500,
)

# All frames as a line, with the good frames overlaid in orange
p.line(x=np.arange(len(covs)), y=covs)
p.circle(x=gf, y=covs[gf], color='orange')

bokeh.io.show(p)


# Keep only the good frames; time points are measured from the first good frame
ic = [ic[frame] for frame in gf]
t = dt * (np.array(gf, dtype=float) - gf[0])


# Drift-correct the retained frames; max_shift is reused as the peak-finding border
ic_dc, max_shift = smk.drift_correct(ic)


# Preprocess every drift-corrected frame
ic_filt = [
    smk.preprocess(frame, sigma=1, selem_width=5, neg_im=False)
    for frame in ic_dc
]


# First frame before and after processing, side by side
bokeh.io.show(
    bokeh.layouts.row(
        *[
            bi1x.viz.imshow(stack[0][inds], color_mapper=gray_mapper(), frame_height=200)
            for stack in (ic, ic_filt)
        ]
    )
)


# Peaks in every filtered frame, with max_shift passed as the border
peaks = smk.get_all_peaks(ic_filt, border=max_shift)


# ROIs are defined from the peaks of the first frame only
first_frame_peaks = peaks[0]
rois = smk.peak_rois(first_frame_peaks, roi_radius)


# Report how many ROIs remain after each filtering step
print(len(rois))

rois = smk.filter_rois_peaks(first_frame_peaks, rois)
print(len(rois))

rois = smk.filter_rois_intensity(ic_filt[0], rois, thresh_std=(0.5, 1))
print(len(rois))

# Output:
# 2790
# 2590
# 1850


# Positional variance for each ROI across the frames
bead_variances = smk.positional_variance(peaks, rois)


# Settings common to both variance plots
variance_plot_kwargs = dict(
    x_axis_label="variance (sq. pixels)",
    frame_height=150,
    frame_width=300,
)

# ECDF on top, histogram below, sharing the ECDF's x-range
p_ecdf = iqplot.ecdf(bead_variances, **variance_plot_kwargs)
p_hist = iqplot.histogram(
    bead_variances,
    rug=False,
    x_range=p_ecdf.x_range,
    **variance_plot_kwargs,
)

bokeh.io.show(bokeh.layouts.column(p_ecdf, p_hist))


# ROIs whose positional variance is below this value are discarded
var_cutoff = 1.8

rois = [
    region
    for region, variance in zip(rois, bead_variances)
    if variance >= var_cutoff
]

# Number of beads that remain under consideration
n_beads_2016 = len(rois)

print(n_beads_2016)

# Output: 604


# Count the peaks falling in each retained ROI
n_peaks = smk.n_peaks_in_rois(peaks, rois)


# Spike plot of all the peak counts, flattened
bokeh.io.show(iqplot.spike(n_peaks.ravel()))


# Loss times and the corresponding lost beads
t_lost_2016, beads_lost_2016 = smk.all_bead_loss(t, n_peaks, n_frames=5, frac=0.75)


# ECDF of loss times; beads with no loss time are padded in as NaN entries
p = iqplot.ecdf(
    np.concatenate(
        (t_lost_2016, np.full(n_beads_2016 - len(t_lost_2016), np.nan))
    ),
    q="time of bead loss (min)",
    y_range=[-0.025, 1.025],
)
bokeh.io.show(p)


# Write the bead loss times, two decimal places each
np.savetxt('t_lost_2016.csv', t_lost_2016, fmt='%.2f')

# Write the number of uncut beads (beads without a loss time) as a one-entry array
n_uncut_2016 = n_beads_2016 - len(t_lost_2016)
np.savetxt('number_of_uncut_2016.csv', np.array([n_uncut_2016]))

# Write the time points
np.savetxt('time_points_2016.csv', t)


# Peek at the first four entries of the lost-bead array
beads_lost_2016[:4]

# Output: array([1, 2, 3, 5])


# Build the bead checker from the filtered frames, ROIs and peaks, then show it,
# passing the notebook URL for interactive plotting
checker = smk.bead_checker(ic_filt, rois, roi_radius, peaks)
bokeh.io.show(checker, notebook_url=notebook_url)


# Folder holding the 2023 images
img_dir = "practice_2023"

# Sorted directory listing, so the frames come out in the right order
flist = sorted(os.listdir(img_dir))

# Read every file whose name ends in ".tif" into a list of images
ic = [
    skimage.io.imread(os.path.join(img_dir, name))
    for name in flist
    if name.endswith(".tif")
]

# Look at the upper left corner of the first image
bokeh.io.show(bi1x.viz.imshow(ic[0][inds], color_mapper=gray_mapper()))


# Indices of the good frames, plus the coefficient of variation of each frame
gf, covs = smk.good_frames(ic, 0.95, return_covs=True)

# Coefficient of variation against frame number
p = bokeh.plotting.figure(
    x_axis_label='frame number',
    y_axis_label='coefficient of variation',
    frame_height=200,
    frame_width=500,
)

# All frames as a line, with the good frames overlaid in orange
p.line(x=np.arange(len(covs)), y=covs)
p.circle(x=gf, y=covs[gf], color='orange')

bokeh.io.show(p)


# Upper left corner of the first and last frames, side by side
bokeh.io.show(
    bokeh.layouts.row(
        *[
            bi1x.viz.imshow(ic[k][inds], color_mapper=gray_mapper(), frame_height=200)
            for k in (0, -1)
        ]
    )
)


# Keep only the good frames found for this data set and rebuild the time
# points from them, exactly as was done for the 2016 data. Without this step
# `gf` is computed but never applied, and `t` still holds the 2016 time
# points when the bead loss times are computed further down.
# NOTE(review): assumes the 2023 images share the interframe time `dt`
# defined for the 2016 data -- confirm.
ic = [ic[i] for i in gf]
t = (np.array(gf, dtype=float) - gf[0]) * dt

# Drift correct; max_shift is reused as the border when finding peaks
ic_dc, max_shift = smk.drift_correct(ic)

# Filter, taking into account out-of-focus beads
ic_filt = [smk.preprocess(im, sigma=1, selem_width=5, neg_im=True) for im in ic_dc]

# Take a look at filtered image next to the first retained frame
p1 = bi1x.viz.imshow(ic[0][inds], color_mapper=gray_mapper(), frame_height=200)
p2 = bi1x.viz.imshow(ic_filt[0][inds], color_mapper=gray_mapper(), frame_height=200)

# Share the ranges so the two images pan and zoom together
p1.x_range = p2.x_range
p1.y_range = p2.y_range

bokeh.io.show(bokeh.layouts.row(p1, p2))


# Peaks in every filtered frame, with max_shift passed as the border
peaks = smk.get_all_peaks(ic_filt, border=max_shift)

# ROIs are defined from the peaks of the first frame only
first_frame_peaks = peaks[0]
rois = smk.peak_rois(first_frame_peaks, roi_radius)

# Apply the peak-based and then the intensity-based ROI filters
rois = smk.filter_rois_peaks(first_frame_peaks, rois)
rois = smk.filter_rois_intensity(ic_filt[0], rois, thresh_std=(0.5, 1))

# Positional variance per ROI, used to identify stuck beads
bead_variances = smk.positional_variance(peaks, rois)

# Settings common to both variance plots
variance_plot_kwargs = dict(
    x_axis_label="variance (sq. pixels)",
    frame_height=150,
    frame_width=300,
)

# ECDF on top, histogram below, sharing the ECDF's x-range
p_ecdf = iqplot.ecdf(bead_variances, **variance_plot_kwargs)
p_hist = iqplot.histogram(
    bead_variances,
    rug=False,
    x_range=p_ecdf.x_range,
    **variance_plot_kwargs,
)

bokeh.io.show(bokeh.layouts.column(p_ecdf, p_hist))


# ROIs whose positional variance is below this value are discarded
var_cutoff = 3.0

# Retain only the ROIs at or above the cutoff
rois = [
    region
    for region, variance in zip(rois, bead_variances)
    if variance >= var_cutoff
]

# Number of beads that remain under consideration
n_beads_2023 = len(rois)

# Count the peaks falling in each retained ROI
n_peaks = smk.n_peaks_in_rois(peaks, rois)

# Check: do most ROIs have zero or one peaks?
bokeh.io.show(iqplot.spike(n_peaks.ravel()))


# Loss times and the corresponding lost beads for the 2023 data
t_lost_2023, beads_lost_2023 = smk.all_bead_loss(t, n_peaks, n_frames=5, frac=0.75)

# ECDFs of loss times for both years on one plot; beads with no loss time
# are padded in as NaN entries
p = iqplot.ecdf(
    np.concatenate(
        (t_lost_2016, np.full(n_beads_2016 - len(t_lost_2016), np.nan))
    ),
    q="time of bead loss (min)",
    legend_label="2016",
)

# Overlay the 2023 ECDF in orange on the same figure
p = iqplot.ecdf(
    np.concatenate(
        (t_lost_2023, np.full(n_beads_2023 - len(t_lost_2023), np.nan))
    ),
    p=p,
    legend_label="2023",
    marker_kwargs=dict(color="orange"),
    fill_kwargs=dict(fill_color="orange"),
)
bokeh.io.show(p)

# Bi 1x: Image processing III

# The data sets

# The strategy

# Our pipeline

# 1. Loading images

# 2. Checking focus

# 3. Drift correction

# 4. Filtering

# 5. Find peaks

# 6. Determine ROIs from first frame

# 7. Filter ROIs

# 8. Filter stuck beads

# 9. Find the number of peaks in each ROI

# 10. Compute bead loss times

# Visualizing the results

# Saving the results for analysis

# Using Bokeh to visualize beads

# Analyzing the 2023 data