import matplotlib as mpl
import matplotlib.pyplot as plt

# Optionally, tweak styles: default figure size and a grayscale colormap
# for images, applied in a single rcParams update.
mpl.rcParams.update({
    'figure.figsize': (10, 5),
    'image.cmap': 'gray',
})

import numpy as np
import pandas as pd
from pandas import DataFrame, Series  # for convenience

import pims
import trackpy as tp

from glob import glob  # Used only for instructive purposes

@pims.pipeline
def gray(image):
    """Return only the green channel of ``image``.

    The channel is taken as index 1 along the third axis. The function is
    wrapped with ``pims.pipeline``; elsewhere in this file it is called on
    the whole sequence returned by ``pims.open`` rather than on one image.
    """
    green_channel = image[:, :, 1]
    return green_channel

# Open every PNG matching the glob pattern as one sequence and pass it through gray().
frames = gray(pims.open('../sample_data/bulk_water/*.png'))

# Bare expression: in a notebook this displays the repr of the sequence.
frames

(ImageSequence,) processed through proc_func. Original repr:
    <Frames>
    Source: /Users/nxk913/projects/trackpy/trackpy-examples/sample_data/bulk_water/*.png
    Length: 300 frames
    Frame Shape: (424, 640, 4)
    Pixel Datatype: uint8

print(frames[0])  # the first frame, printed as an array of pixel values

[[125 125 125 ... 120 120 121]
 [125 125 125 ... 120 121 121]
 [125 125 124 ... 121 123 124]
 ...
 [125 126 125 ... 108  98  97]
 [125 125 125 ... 116 109 106]
 [125 125 125 ... 124 119 117]]

# Bare expression: display the first frame itself.
frames[0]

# Draw the first frame with matplotlib. The trailing semicolon suppresses the
# echoed return value when run in a notebook.
plt.imshow(frames[0]);

# Each frame carries its own index within the sequence.
frames[123].frame_no

123

# Per-frame metadata; it is an empty dict for these PNG frames.
frames[123].metadata  # Scientific formats can pass experiment meta data here.

{}

# Locate features in the first frame. The second positional argument (11) is
# the feature diameter passed to tp.locate; invert=True is passed as well
# (presumably because the features are darker than the background -- confirm
# against the images).
f = tp.locate(frames[0], 11, invert=True)

f.head()  # shows the first few rows of data

# Overlay the located features on the frame they came from.
tp.annotate(f, frames[0]);

# Histogram of the 'mass' column of the located features, in 20 bins.
fig, ax = plt.subplots()
ax.hist(f['mass'], bins=20)

# Optionally, label the axes.
ax.set(xlabel='mass', ylabel='count')

[Text(0.5, 0, 'mass'), Text(0, 0.5, 'count')]

# Repeat the search on the first frame, now also passing minmass=20.
f = tp.locate(frames[0], 11, invert=True, minmass=20)

# Overlay the features from this stricter search on the frame.
tp.annotate(f, frames[0]);

# Subpixel-bias check for the features found with 11 as the second argument.
tp.subpx_bias(f);

# Same check on a fresh search that passes 7 instead of 11, for comparison.
tp.subpx_bias(tp.locate(frames[0], 7, invert=True, minmass=20));

# Run the same search over frames[:300] in one call; f is rebound to the
# combined result for all of those frames.
f = tp.batch(frames[:300], 11, minmass=20, invert=True);

Frame 299: 624 features

# tp.quiet()  # Turn off progress reports for best performance
# Link the per-frame features into trajectories. The positional 5 is the
# search range (how far a feature may move between frames), and memory=3 is
# the number of frames a feature may go missing and still be linked.
t = tp.link(f, 5, memory=3)

Frame 299: 624 trajectories present.

# Peek at the first rows of the linked table.
t.head()

# Filter the linked table with tp.filter_stubs, using a threshold of 25.
t1 = tp.filter_stubs(t, 25)
# Report the number of distinct particle labels before and after filtering.
print(f"Before: {t['particle'].nunique()}")
print(f"After: {t1['particle'].nunique()}")

Before: 13715
After: 1505

# Start a new figure; the plotted table holds the per-particle mean of every column.
plt.figure()
tp.mass_size(t1.groupby('particle').mean()); # convenience function -- just plots size vs. mass

# Keep only the rows that satisfy all three thresholds at once:
# mass above 50, size below 2.6 and eccentricity below 0.3.
t2 = t1.loc[
    (t1['mass'] > 50)
    & (t1['size'] < 2.6)
    & (t1['ecc'] < 0.3)
]

# Overlay the filtered features belonging to frame 0 on the first image.
plt.figure()
tp.annotate(t2[t2['frame'] == 0], frames[0]);

# Plot the filtered trajectories on a separate figure.
plt.figure()
tp.plot_traj(t2);

# Compute the drift from the filtered trajectories.
d = tp.compute_drift(t2)

# Plot the computed drift.
d.plot()
plt.show()

# Subtract the drift from a copy of t2 rather than from t2 itself.
tm = tp.subtract_drift(t2.copy(), d)

# Plot the trajectories after drift subtraction.
ax = tp.plot_traj(tm)
plt.show()

# Per-particle mean squared displacement.
# microns per pixel = 100/285., frames per second = 24
im = tp.imsd(tm, mpp=100/285., fps=24)

# One faint black line per column of `im`, on log-log axes.
fig, ax = plt.subplots()
ax.set_xlabel('lag time $t$')
ax.set_ylabel(r'$\langle \Delta r^2 \rangle$ [$\mu$m$^2$]')
ax.plot(im.index, im, 'k-', alpha=0.1)
ax.set_xscale('log')
ax.set_yscale('log')

# Ensemble mean squared displacement.
# microns per pixel = 100/285., frames per second = 24
em = tp.emsd(tm, mpp=100/285., fps=24)

# Markers on log-log axes; labels and the y-range are set in one call.
fig, ax = plt.subplots()
ax.plot(em.index, em, 'o')
ax.set_xscale('log')
ax.set_yscale('log')
ax.set(xlabel='lag time $t$',
       ylabel=r'$\langle \Delta r^2 \rangle$ [$\mu$m$^2$]',
       ylim=(1e-2, 10));

# Create a new figure and label its axes before the fit is run; the fit call
# below also plots (presumably onto this figure -- confirm).
plt.figure()
plt.ylabel(r'$\langle \Delta r^2 \rangle$ [$\mu$m$^2$]')
plt.xlabel('lag time $t$');
tp.utils.fit_powerlaw(em)  # performs linear best fit in log space, plots

# A short slice of the movie, used as the input for the timing runs.
frames_short = frames[:30]  # 10% of the original

# Time feature-finding on the short slice without passing `processes`.
%timeit tp.batch(frames_short, 11, invert=True, minmass=20);  # Uses all available CPUs

Frame 29: 599 features
3.6 s ± 172 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)

# Same timing on the short slice, but with processes=1 for comparison.
%timeit tp.batch(frames_short, 11, invert=True, minmass=20, processes=1);  # Not parallel

Frame 29: 599 features
670 ms ± 8.1 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)

# Just repeat the movie 10 times. We won't use the trajectories.
# glob() returns a list of paths, so `* 10` repeats that list ten times
# before it is handed to pims.ImageSequence.
frames_long = gray(pims.ImageSequence(glob('../sample_data/bulk_water/*.png') * 10))

# Single timed run (%time rather than %timeit) on the long sequence.
%time tp.batch(frames_long, 11, invert=True, minmass=20);  # Uses all available CPUs

Frame 2999: 636 features
CPU times: user 33.4 s, sys: 4.44 s, total: 37.8 s
Wall time: 25.3 s

# Same single timed run on the long sequence, but with processes=1.
%time tp.batch(frames_long, 11, invert=True, minmass=20, processes=1);  # Not parallel

Frame 2999: 636 features
CPU times: user 1min 4s, sys: 2.02 s, total: 1min 6s
Wall time: 1min 7s

# Time 20 frames in a single process with engine='numba'.
%timeit tp.batch(frames[:20], 11, invert=True, minmass=20, engine='numba', processes=1)

Frame 19: 576 features
453 ms ± 8.95 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)

# Same 20 frames in a single process with engine='python', for comparison.
%timeit tp.batch(frames[:20], 11, invert=True, minmass=20, engine='python', processes=1)

Frame 19: 576 features
1.02 s ± 12.9 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)

# Open 'data.h5' as a store and pass it to tp.batch as `output`, so the
# results go to the store and no return value is kept here.
# NOTE(review): minmass is 200 here but 20 in every other call in this file --
# confirm the difference is intentional.
with tp.PandasHDFStore('data.h5') as s:
    tp.batch(frames, 11, invert=True, minmass=200, output=s)

Frame 299: 328 features

# Re-open the store, link its contents frame by frame, and write each linked
# frame back into the same store.
with tp.PandasHDFStore('data.h5') as s:
    # As before, we use a search range of 5 (the maximum displacement between
    # frames) and a memory of 3 frames.
    for linked in tp.link_df_iter(s, 5, memory=3):
        s.put(linked)

Frame 299: 328 trajectories present.

# Read every frame held in the store and stack them into one DataFrame.
with tp.PandasHDFStore('data.h5') as s:
    trajectories = pd.concat(frame_table for frame_table in s)

# Number of distinct values in the 'frame' column.
trajectories['frame'].unique().size

300

	y	x	mass	size	ecc	signal	raw_mass	ep
0	4.750000	103.668564	192.862485	2.106615	0.066390	10.808405	10714.0	0.073666
1	5.249231	585.779487	164.659302	2.962674	0.078936	4.222033	10702.0	0.075116
2	5.785986	294.792544	244.624615	2.244542	0.219217	15.874846	10686.0	0.077141
3	5.869369	338.173423	187.458282	2.046201	0.185333	13.088304	10554.0	0.099201
4	6.746377	310.584169	151.486558	3.103294	0.053342	4.475355	10403.0	0.147430

selection	syntax example
all the frames	`frames[:]` or simply `frames`.
the first 10 frames	`frames[:10]`
the last 10 frames	`frames[-10:]`
a range of frames	`frames[100:200]`
every 10th frame	`frames[::10]`
a list of specific frames	`frames[[100, 107, 113]]`

	y	x	mass	size	ecc	signal	raw_mass	ep	particle
0	4.750000	103.668564	192.862485	2.106615	0.066390	10.808405	10714.0	0.073666	0
365	284.118980	25.313881	149.037779	2.321961	0.031799	7.008575	10770.0	0.067577	1
364	282.753601	534.788476	222.754482	1.908443	0.103416	15.874846	10415.0	0.141946	2
363	280.010398	275.185353	186.782757	2.508665	0.183181	7.261897	10438.0	0.132499	3
362	279.134153	252.780324	151.064355	2.938060	0.253812	4.306474	10359.0	0.171764	4

walkthrough#

Walkthrough¶

Scientific IPython Setup¶

Step 1: Read the Data¶

Obtaining the sample data¶

Opening images or video¶

Step 2: Locate Features¶

Refine parameters to eliminate spurious features¶

Check for subpixel accuracy¶

Locate features in all frames¶

Step 3: Link features into particle trajectories¶

Filter spurious trajectories¶

Remove overall drift¶

Step 4: Analyze trajectories¶

Mean Squared Displacement of Individual Probes¶

Ensemble Mean Squared Displacement¶

Preview of Some Advanced Features¶

Parallelization¶

Optional High Performance Component: Numba¶

Streaming¶