5. Tracking Data Analysis¶

Organism tracking is performed through the MCAM GUI resulting in .CSV output files containing tracking data. This page explores concepts relating to loading data from the CSVs, plotting data, and filtering data.

Output Files¶

Output files are saved in a folder with the same name as the input file and this folder is created in the parent directory of the input file.

Raw Tracking Data - tracking_data.csv - CSV file containing 8 key-points per fish, with x and y coordinates and a confidence value for each key-point. Note: This file is likely too large to be opened in Excel or other spreadsheet software due to the large number of columns in the data array. This file can be opened and manipulated using Python.

Plotted Tracks - plotted_tracks.png - Visualization of movement over time from blue (earliest, cold) to red (most recent, hot).
Distance Traveled Data - distance_traveled_metrics.csv - Distance traveled and speed calculated for each frame.
Aggregate Metrics - distance_traveled_key_metrics.csv - Summary (aggregate) distance traveled and speed metrics.
Video Composite - composite_tracked_video.mp4 - MP4 video containing key-point and skeleton labeled fish for all wells of a well plate.

Units¶

Unless otherwise specified, exported values use the following units:

Distance or length: meters
Time: seconds
Velocity or speed: meters/second
Orientation/Angle: degrees

Zebrafish Examples¶

Zebrafish Tracking Workflow¶

"""
# %% Sample zebrafish tracking workflow script
# By Ramona Optics Inc. Copyright 2023-2024

This script provides an example to walk through the steps of the tracking workflow.

"""

from pathlib import Path

from tqdm import tqdm

from owl import mcam_data
from owl.analysis.models import fetch_model, zebrafish_models_recommended
from owl.analysis.tracking import infer_dataset
from owl.analysis.tracking_data_analysis import (
    compute_fish_length,
    export_csv,
    generate_tracking_dataset,
    make_dataframe,
)
from owl.visualize.tracking import plot_tracks_from_dataset

# %% location of the exported MCAM dataset; every output is written beneath it
exported_path = '/MCAM_data/EXPORTED_FOLDER_YOU_WANT_TO_TRACK'
tracking_filepath = Path(exported_path)

# %% open the exported video dataset
video_dataset = mcam_data.load(exported_path)

# %% work out the plate format (24, 48 or 96 wells) from its rows and columns
plate_rows = int(video_dataset.wellplate_config_rows)
plate_columns = int(video_dataset.wellplate_config_columns)
well_plate = plate_rows * plate_columns

# %% make sure <exported_path>/results exists before anything is written to it
results_folder = tracking_filepath / 'results'
results_folder.mkdir(parents=True, exist_ok=True)

# %% look up the recommended pre-trained model for this plate format and
# fetch a local path to it
recommended_model_name = zebrafish_models_recommended[f"{well_plate}_well_plate"]
model_path = fetch_model(recommended_model_name)

# %% run the tracking model over the video; tqdm is handed in as the
# progress-bar implementation
tracking_dataset = infer_dataset(video_dataset, model_path, tqdm=tqdm)

# %% derive fish length from the raw tracking data and keep it in the dataset
tracking_dataset['fish_length_information'] = compute_fish_length(tracking_dataset)

# %% draw the tracks on representative images, color gradient represents speed
plot_options = {
    'apply_circle_mask': True,
    'apply_square_mask': False,
    'speed': True,
}
plot_tracks_from_dataset(
    tracking_dataset,
    output_filename=results_folder / 'plotted_tracks.png',
    **plot_options,
)

# %% store the tracking data on its own for future analysis
# the images are already saved, so they are dropped rather than written twice
tracking_dataset = tracking_dataset.drop_vars('images')
tracking_dataset.to_netcdf(tracking_filepath / 'tracking_metadata.nc')

# %% prepare the dataset for export to csv format, including unit conversions
tracking_dataset = generate_tracking_dataset(tracking_dataset)

# %% arrange the raw tracking data as a dataframe indexed by time
raw_column_levels = (
    'image_x',
    'image_y',
    'tracking_keypoint',
    'tracking_location',
)
tracking_output_df, header = make_dataframe(
    tracking_dataset,
    information_name='tracking_information',
    row_index='time',
    column_indices=raw_column_levels,
)

# %% write the raw tracking data to the results folder
export_csv(tracking_output_df,
           results_folder / 'tracking_data.csv',
           header=header,
           index=True)

Tracking Dataset - Data Filtering¶

"""
# %% Sample zebrafish tracking workflow script
# By Ramona Optics Inc. Copyright 2023-2024

This script provides an example to filter tracking data using
anomaly detection and denoising.

"""

from pathlib import Path

from owl.analysis.tracking_data_analysis import (
    compile_derived_metrics,
    compute_fish_length,
    export_csv,
    filter_anomalies,
    generate_tracking_dataset,
    get_anomaly_mask_well_radius,
    load_tracking_dataset,
    make_dataframe,
)
from owl.visualize.tracking import plot_tracks_from_dataset

# %% location of the exported MCAM dataset; every output is written beneath it
exported_path = '/MCAM_data/EXPORTED_FOLDER_YOU_WANT_TO_TRACK'
tracking_filepath = Path(exported_path)

# %% make sure <exported_path>/results exists before anything is written to it
results_folder = tracking_filepath / 'results'
results_folder.mkdir(parents=True, exist_ok=True)

# %% reopen the dataset produced by an earlier tracking run
tracking_dataset = load_tracking_dataset(exported_path)

# %% anomaly detection needs the fish length, so compute it first
tracking_dataset['fish_length_information'] = compute_fish_length(tracking_dataset)

# %% work out the plate format (24, 48 or 96 wells) from its rows and columns
plate_rows = int(tracking_dataset.wellplate_config_rows)
plate_columns = int(tracking_dataset.wellplate_config_columns)
well_plate = plate_rows * plate_columns

# %% detect anomalous data, remove it and interpolate to replace missing data
anomaly_mask_well_radius = get_anomaly_mask_well_radius(
    well_plate,
    apply_circle_mask=True,
)
filtered_tracking, filtering_information = filter_anomalies(
    tracking_dataset,
    well_radius=anomaly_mask_well_radius,
)
# the [...] assignment overwrites the values of the existing variable in place
# instead of replacing the variable itself
tracking_dataset['tracking_information'][...] = filtered_tracking
tracking_dataset['filtering_information'] = filtering_information

# %% draw the tracks on representative images, color gradient represents speed
plot_options = {
    'apply_circle_mask': True,
    'apply_square_mask': False,
    'speed': True,
}
plot_tracks_from_dataset(
    tracking_dataset,
    output_filename=results_folder / 'plotted_tracks.png',
    **plot_options,
)

# %% convert the dataset from pixel coordinates to SI units
tracking_dataset = generate_tracking_dataset(tracking_dataset)

# %% compute distance traveled and speed metrics with denoising switched on
tracking_dataset, denoising_information = compile_derived_metrics(
    tracking_dataset, denoise=True,
)
tracking_dataset['denoising_information'] = denoising_information

# %% arrange the movement metrics as a dataframe indexed by time
metric_column_levels = ('image_x', 'image_y', 'tracking_metrics')
metrics_output_df, header = make_dataframe(
    tracking_dataset,
    information_name='movement_metrics',
    row_index='time',
    column_indices=metric_column_levels,
)

# %% write the distance traveled data to the results folder
export_csv(
    metrics_output_df,
    results_folder / 'distance_traveled_metrics.csv',
    header=header,
    index=True,
)

Tracking Dataset - Time Binning¶

"""
# %% Sample zebrafish tracking workflow script
# By Ramona Optics Inc. Copyright 2023-2024

This script is an example to bin tracking data by one second intervals.

"""

from pathlib import Path

from owl.analysis.tracking_data_analysis import (
    compile_derived_metrics,
    export_csv,
    generate_tracking_dataset,
    load_tracking_dataset,
    make_dataframe,
)

# %% location of the exported MCAM dataset; every output is written beneath it
exported_path = '/MCAM_data/EXPORTED_FOLDER_YOU_WANT_TO_TRACK'

# %% width of one time bin, given in seconds
time_bin = 1

# %% reopen the dataset produced by an earlier tracking run
tracking_dataset = load_tracking_dataset(exported_path)

# %% make sure <exported_path>/results exists before anything is written to it
tracking_filepath = Path(exported_path)
results_folder = tracking_filepath / 'results'
results_folder.mkdir(parents=True, exist_ok=True)

# %% prepare the dataset for export, including unit conversions
tracking_dataset = generate_tracking_dataset(tracking_dataset)

# %% calculate distance traveled and speed. this must run after
# 'generate_tracking_dataset' so that the inputs are already in SI units
# NOTE(review): the data filtering example in this guide unpacks
# compile_derived_metrics(..., denoise=True) into two values; confirm that a
# single dataset is returned when denoise is left at its default
tracking_dataset = compile_derived_metrics(tracking_dataset)

# %% arrange the movement metrics as a dataframe binned by 'time_bin'
metric_column_levels = ('image_x', 'image_y', 'tracking_metrics')
metrics_output_df, header = make_dataframe(
    tracking_dataset,
    information_name='movement_metrics',
    row_index='time',
    column_indices=metric_column_levels,
    time_bin=time_bin,
)

# %% write the distance traveled data to the results folder
export_csv(
    metrics_output_df,
    results_folder / 'distance_traveled_metrics.csv',
    header=header,
    index=True,
)

Tracking Dataset - Data Manipulation¶

# %%
# mcam_data provides the loader for tracking metadata files
from owl import mcam_data

# %%
# path to the tracking metadata file to explore
# a sample dataset is available for download here:
# https://drive.google.com/file/d/1sN3gFrqNbS2rNeBnw5CUlA46cOvfSYRn/view?usp=share_link
tracking_metadata_filepath = '/path/to/tracking_metadata.nc'
tracking_dataset = mcam_data.load(tracking_metadata_filepath)

# %%
# the tracking pipeline is based on the x, y coordinates of each keypoint
# as a first example, look up the zebrafish "center" keypoint
# in the fourth frame of the video tracked for well 'B4'
# frame indexing begins at frame 0, so the fourth frame has index 3
frame_number = 3
well_letter = 'B'
well_number = 4
keypoint = 'center'

# the x and y lookups share everything except the coordinate being requested
center_selector = {
    'frame_number': frame_number,
    'image_x': well_letter,
    'image_y': well_number,
    'tracking_keypoint': keypoint,
}
tracking_information = tracking_dataset.tracking_information
center_x = tracking_information.sel(
    {**center_selector, 'tracking_location': 'x'}
).data
center_y = tracking_information.sel(
    {**center_selector, 'tracking_location': 'y'}
).data
# within the tracking dataset, locations are in units of pixels
# the stored values are floating point, so cast them to integers before
# using them as x, y positions in the 2D image matrix
print(f'Center Key Point Location: ({int(center_x)}, {int(center_y)})')

# %%
# inspect the shape of the tracking data
# this 5-dimensional data array is laid out as:
# (N_frames, camera_sensor_y, camera_sensor_x, tracking_keypoints, (y, x, confidence))
shape = tracking_dataset.tracking_information.shape
print(f'Tracking dataset shape: {shape}')
# each dimension can be examined by its index in the shape tuple
print(f'There are {shape[0]} frames in this dataset.')
print(f'There are {shape[1]} well plate numbers and thus columns in this dataset.')
print(f'There are {shape[2]} well plate letters and thus rows in this dataset.')
print(f'Therefore it is a {shape[1] * shape[2]}-well plate.')
print(f'There are {shape[3]} tracked keypoints in this dataset.')
print(f'There are {shape[4]} tracking locations in this dataset.')

# %%
# assuming the skeleton has been computed and compiled into the tracking dataset
# the length of a single tail segment can be read for well 'B4', fourth frame
# the first entry of the list below is the segment that joins the
# 'center' and 'between_center_and_mid' key points
tail_segment_names = [
    'center_between_center_and_mid',
    'between_center_and_mid_mid_tail',
    'mid_tail_between_mid_and_caudal',
    'between_mid_and_caudal_caudal_fin',
]
skeleton_information = tracking_dataset.skeleton_information
# frame and well are the same for every lookup in this section
frame_and_well = {
    'frame_number': frame_number,
    'image_x': well_letter,
    'image_y': well_number,
}
center_between_center_and_mid_length = skeleton_information.sel({
    **frame_and_well,
    'skeleton_segments': tail_segment_names[0],
    'skeleton_parameters': 'length',
}).data
print(f'Length: {center_between_center_and_mid_length} pixels.')

# %%
# converting pixels to meters needs the width of one pixel
# the dataset stores this value in units of meters
pixel_width = tracking_dataset['pixel_width'].data
print(f'Pixel width: {pixel_width} meters.')

# %%
# tail segment length expressed in meters
tail_segment_length_in_meters = center_between_center_and_mid_length * pixel_width
print(f'Length in meters: {tail_segment_length_in_meters}')

# %%
# at this scale millimeters are easier to read than meters
tail_segment_length_in_mm = tail_segment_length_in_meters * 1E3
print(f'Length in millimeters: {tail_segment_length_in_mm}')

# %%
# list every skeleton segment by name
skeleton_segments = skeleton_information.skeleton_segments.data
print(f'Skeleton segments: {skeleton_segments}')
# the 'tail_segment_names' list above can be rebuilt by slicing this list
# from index 4 onwards, which leaves the tail segments
tail_segment_names = skeleton_segments[4:]
print(f'Tail skeleton segments: {tail_segment_names}')
# list every parameter stored for each skeleton segment
skeleton_parameters = skeleton_information.skeleton_parameters.data
print(f'Skeleton parameters: {skeleton_parameters}')

# %%
# read the length of every tail segment for the fourth frame and add them up
# to obtain the tail length of the zebrafish
tail_segment_lengths = skeleton_information.sel({
    **frame_and_well,
    'skeleton_segments': tail_segment_names,
    'skeleton_parameters': 'length',
}).data
tail_length = tail_segment_lengths.sum()
print(f'Tail length: {tail_length} pixels.')

# %%
# get this tail length for the first ten frames and take the average as
# the computed tail length
# convert from pixels to millimeters and round this value to 2 decimal places
number_of_frames_to_average = 10
# .sel() slices by label and includes BOTH endpoints, so the stop value must be
# the label of the last wanted frame: slice(0, 9) selects frames 0 through 9,
# whereas slice(0, 10) would silently average over eleven frames
tail_segment_lengths = tracking_dataset.skeleton_information.sel({
    'frame_number': slice(0, number_of_frames_to_average - 1),
    'image_x': well_letter,
    'image_y': well_number,
    'skeleton_segments': tail_segment_names,
    'skeleton_parameters': 'length',
}).data
# assumes the remaining axes are (frame, segment) -- TODO confirm
# summing over axis 1 then yields one tail length per frame
tail_lengths = tail_segment_lengths.sum(axis=1)
average_tail_length_pixels = tail_lengths.mean()
# pixel_width is in meters per pixel, the factor 1E3 converts meters to millimeters
average_tail_length_millimeters = average_tail_length_pixels * pixel_width * 1E3
average_tail_length_millimeters = round(average_tail_length_millimeters, 2)
print(f'Average tail length computed across '
      f'{number_of_frames_to_average} frames: '
      f'{average_tail_length_millimeters} millimeters.')

# %%
# Note: besides keypoint tracking data and skeleton information,
# other computed values are read from the xarray dataset in the same way
# example:

# tail angles for the four tail keypoints for well 'B4' in the fourth frame
# angles are in units of degrees
# positive (+) reflects tail deflection to the left of the body axis
# negative (-) reflects tail deflection to the right of the body axis
tail_angle_selector = {
    'frame_number': frame_number,
    'image_x': well_letter,
    'image_y': well_number,
    'tail_parameters': 'angle',
}
tail_angles = tracking_dataset.tail_information.sel(tail_angle_selector).data
print(f'Tail angles: {tail_angles} degrees.')

Zebrafish Stimulus Analysis Plotting¶

"""
%% Sample zebrafish analysis for stimulus visualization
By Ramona Optics Inc. Copyright 2022-2024

This script provides an example that imports previously tracked
locomotion data, averages together the distance traveled for
each fish, and plots this metric with consideration for where
stimuli occurred during the experiment. If no stimuli information
is present, the average distance traveled will simply be plotted.

An additional consideration outlined here is two levels of filtering
excluding fish or frames from the analysis that were missed by the
tracking algorithm. In this example, if more than 5% of the total
frames were missed during tracking, the fish will be excluded.

"""
from pathlib import Path

import numpy as np
import pandas as pd
from matplotlib import pyplot as plt

from owl import mcam_data

# %% definitions:
# folder that holds the previously output tracking data
tracking_filepath = Path('path/tracking_data')
results_directory = tracking_filepath / 'results'
# distance traveled metrics output .csv
distance_speed_filename = results_directory / 'distance_traveled_metrics.csv'
# raw tracking data .csv, needed for the tracking confidence information
tracking_data_filename = results_directory / 'tracking_data.csv'
# where the plot is saved,
# the filename needs a '.png' or other image-type suffix
plot_output_path = results_directory / 'distance_traveled_plot.png'

# %% script below
# the previously extracted dataset metadata lives inside the tracking filepath
metadata = mcam_data.load(tracking_filepath / 'metadata.nc')

# both exports are read with '#' comment lines skipped and the first column
# as the row index; they differ only in the number of column header rows
shared_csv_options = {'comment': '#', 'index_col': 0}
# previously exported distance traveled data (three column header rows)
distance_speed_df = pd.read_csv(
    distance_speed_filename,
    header=[0, 1, 2],
    **shared_csv_options,
)
# previously exported raw tracking data (four column header rows)
tracking_data_df = pd.read_csv(
    tracking_data_filename,
    header=[0, 1, 2, 3],
    **shared_csv_options,
)

# rows and columns present in the dataset
# column numbers are converted to strings so they are not treated as integers
rows = metadata.image_x.data
columns = metadata.image_y.data.astype('str')

# %% pick up stimuli information from the metadata when it is present
# flash stimuli take precedence over vibration stimuli
dataset_dimensions = metadata.dims
if 'stimuli_flash_index' in dataset_dimensions:
    stimuli_index = metadata.stimuli_flash_index.data
    stimuli_times = metadata.stimuli_flash_start_time.data
    stimuli_durations = metadata.stimuli_flash_duration.data
    stimuli_intensities = metadata.stimuli_flash_lux.data
    stimuli_colors = metadata.stimuli_flash_color.data
    print('flash stimulus data loaded!')
elif 'stimuli_vibrate_index' in dataset_dimensions:
    stimuli_index = metadata.stimuli_vibrate_index.data
    stimuli_times = metadata.stimuli_vibrate_start_time.data
    stimuli_durations = metadata.stimuli_vibrate_duration.data
    stimuli_frequencies = metadata.stimuli_vibrate_frequency.data
    print('vibration stimulus data loaded!')
else:
    print('stimulus information does not exist in this dataset!')

# %% exclude fish whose tracking confidence is low, since the tracking
# algorithm most likely missed them
confidence_threshold = 0.1
tracked_keypoint = 'center'
total_frames = len(tracking_data_df)
# one (row, column, keypoint, 'likelihood') column key per well
confidence_column_keys = list(pd.MultiIndex.from_product(
    [rows, columns, [tracked_keypoint], ['likelihood']]
))
confident_wells = []
for column_key in confidence_column_keys:
    likelihood = tracking_data_df[column_key]
    confident_frames = len(likelihood[likelihood >= confidence_threshold])
    confident_fraction = confident_frames / total_frames
    # a well is kept when at least 95% of its frames are confident
    if confident_fraction >= 0.95:
        confident_wells.append(column_key)
        continue
    percent_confident = round(confident_fraction * 100, 2)
    print(f"Well {column_key[0] + column_key[1]} has been excluded "
          f"with {percent_confident}% confident frames")

# %% average the distance traveled over every fish with confident tracking
# the first two entries of each well key are the well's row and column
distance_traveled_column_keys = [
    (well_key[0], well_key[1], 'distance_traveled')
    for well_key in confident_wells
]

distance_traveled_per_well = distance_speed_df[distance_traveled_column_keys]
average_distance_traveled = distance_traveled_per_well.mean(axis=1)

time = np.array(distance_speed_df.index)

# %% plot the results
fig, ax = plt.subplots()
# plot distance traveled converting from meters to millimeters
ax.plot(time, average_distance_traveled * 1E3,
        color='black', label='distance traveled')
# the plotted quantity is a distance, so its unit is mm (not the speed unit mm/s)
ax.set_ylabel("Average Distance Traveled (mm)")
ax.set_xlabel("Time (s)")
ax.set_title("Average Distance Traveled")
ax.legend()
ax.grid()

# the stimulus arrays are only defined when one of these dimensions exists
has_stimuli = ('stimuli_flash_index' in metadata.dims
               or 'stimuli_vibrate_index' in metadata.dims)
if has_stimuli:
    # shade the time span covered by each stimulus, from its start time to
    # its start time plus its duration
    for stimulus_start, stimulus_duration in zip(stimuli_times, stimuli_durations):
        ax.axvspan(stimulus_start, stimulus_start + stimulus_duration,
                   alpha=0.2, color='#0e6c67')

# save the plot
fig.savefig(plot_output_path, dpi=300)

Zebrafish Movement Analysis Plotting¶

# %% Sample zebrafish analysis for episode detection
# By Ramona Optics Inc. Copyright 2022-2024
import numpy as np
import pandas as pd
from matplotlib import pyplot as plt

# You can enter the full name of the file you want to track here.
tracking_data_filename = 'tracking_data.csv'
distance_speed_filename = 'distance_traveled_metrics.csv'

# diameter of a single well in meters (it is scaled by 1E3 when plotted in mm)
wellplate_diameter = 6.85E-3
wellplate_radius = wellplate_diameter / 2

# both exports are read with '#' comment lines skipped and the first column
# as the row index; they differ only in the number of column header rows
shared_csv_options = {'comment': '#', 'index_col': 0}
tracking_data_df = pd.read_csv(
    tracking_data_filename,
    header=[0, 1, 2, 3],
    **shared_csv_options,
)
distance_speed_df = pd.read_csv(
    distance_speed_filename,
    header=[0, 1, 2],
    **shared_csv_options,
)

# %% Extract the time, it matches between the two csv files
time = np.asarray(tracking_data_df.index)

# %% Select the information we want to extract
well_name = "B6"
keypoint = "center"

# a well name is one letter followed by the well number, e.g. "B6" -> "B", "6"
well_letter, well_number = well_name[0], well_name[1:]

# %% keep only the columns of the selected well and key-point
well_data = tracking_data_df[well_letter, well_number, keypoint]
yx = well_data[["y", "x"]]

# %% plot the raw track of the selected key-point inside the well outline
fig, ax = plt.subplots()

# Units of x and y are in meters. for a 96 well plate, we can plot them in mm
ax.plot(yx["x"] * 1E3, yx["y"] * 1E3, '.-', label="RAW")
# outline of the well, centered on the origin, drawn unfilled
ax.add_patch(
    plt.Circle((0, 0), radius=wellplate_radius * 1E3,
               edgecolor='Black', facecolor=None, fill=False))
ax.axis('equal')
ax.set_xlabel("x (mm)")
ax.set_ylabel("y (mm)")
# spelling of "unprocessed" corrected in the displayed title
ax.set_title(f"Center position well {well_name} -- Raw (unprocessed) tracking data")
# leave a margin of up to 1 mm around the well radius
ax.set_ylim([-(int(wellplate_radius * 1E3) + 1), int(wellplate_radius * 1E3) + 1])


# %% Discard the points that the tracking missed
# a frame counts as missed when its likelihood falls below the threshold
likelihood_threshold = 0.1
likelihood = well_data["likelihood"]
likelihood_below_threshold = likelihood < likelihood_threshold

# work on a copy so the raw yx data stays available for the comparison plots
yx_filtered = yx.to_numpy().copy()
# blank out both coordinates of every missed frame
yx_filtered[likelihood_below_threshold, ...] = np.nan


def interpolate_nan_points(points_vector):
    """Fill the NaN entries of a 1-D float array by linear interpolation.

    Each NaN is replaced by the value interpolated linearly, over sample
    position, between the nearest valid neighbours. NaNs before the first or
    after the last valid sample take the value of that nearest valid sample,
    which is how ``np.interp`` treats points outside its sample range.

    Parameters
    ----------
    points_vector : numpy.ndarray
        1-D floating point array. It is modified IN PLACE.

    Returns
    -------
    numpy.ndarray
        The same array object that was passed in, with NaNs filled. An array
        without any valid sample (all NaN, or empty) is returned unchanged
        because there is nothing to interpolate from.
    """
    # adapted from
    # https://stackoverflow.com/questions/6518811/interpolate-nan-values-in-a-numpy-array
    nans = np.isnan(points_vector)
    valid = ~nans
    # np.interp raises on an empty set of sample points, and there is nothing
    # to do when no value is missing
    if not valid.any() or not nans.any():
        return points_vector

    points_vector[nans] = np.interp(
        np.flatnonzero(nans),    # positions that need a value
        np.flatnonzero(valid),   # positions that have one
        points_vector[valid],
    )
    return points_vector


# fill the blanked-out frames, one coordinate column at a time
# (column 0 holds y and column 1 holds x, matching the ["y", "x"] selection)
for coordinate_column in (0, 1):
    yx_filtered[:, coordinate_column] = interpolate_nan_points(
        yx_filtered[:, coordinate_column])

# quantities shared by the two figures below, all in millimeters
well_radius_mm = wellplate_radius * 1E3
axis_limit_mm = int(wellplate_radius * 1E3) + 1
filtered_x_mm = yx_filtered[:, 1] * 1E3
filtered_y_mm = yx_filtered[:, 0] * 1E3

# filtered track on its own
fig, ax = plt.subplots()

ax.plot(filtered_x_mm, filtered_y_mm, '-',
        color='#ff7f0e', label="Filtered")
ax.add_patch(
    plt.Circle((0, 0), radius=well_radius_mm,
               edgecolor='Black', facecolor=None, fill=False))
ax.axis('equal')
ax.set_xlabel("x (mm)")
ax.set_ylabel("y (mm)")
ax.set_title(f"Center position well {well_name} -- Filtered tracking data")
ax.set_ylim([-axis_limit_mm, axis_limit_mm])
# %% Plot tracks
# raw and filtered tracks overlaid for comparison
fig, ax = plt.subplots()

# Units of x and y are in meters. for a 96 well plate, we can plot them in mm
ax.plot(yx["x"] * 1E3, yx["y"] * 1E3, '.-', label="RAW")
ax.plot(filtered_x_mm, filtered_y_mm, '-',
        label="Filtered")
ax.add_patch(
    plt.Circle((0, 0), radius=well_radius_mm,
               edgecolor='Black', facecolor=None, fill=False))
ax.axis('equal')
ax.set_xlabel("x (mm)")
ax.set_ylabel("y (mm)")
ax.set_title(f"Center position well {well_name} -- Raw and Filtered data")
ax.set_ylim([-axis_limit_mm, axis_limit_mm])
ax.legend()
# %% Extract peak speed
# speed is stored in m/s; it is reported in mm/s
speed = distance_speed_df[well_letter, well_number, "speed"]
max_speed = speed.max()
max_speed_mm_per_s = max_speed * 1E3
print(f"Maximum speed for well {well_name} = {max_speed_mm_per_s:.2f} mm/s")

# %% Plot the speed over time.

fig, ax = plt.subplots()
ax.plot(time, speed * 1E3)
ax.set_ylabel("Speed (mm/s)")
ax.set_xlabel("Time (s)")
ax.set_title(f"Speed for zebrafish in well {well_name}")
ax.grid()
# %% Threshold the speed

# the threshold is given in m/s, the unit the speed is analyzed in
speed_threshold = 30E-3
index_above_threshold = speed > speed_threshold

# the threshold is drawn as a horizontal line from the first to the last time
time_span = [time[0], time[-1]]
threshold_line_mm_per_s = [speed_threshold * 1E3, speed_threshold * 1E3]

fig, ax = plt.subplots()
ax.plot(time, speed * 1E3, label="Zebrafish Speed (mm/s)")
ax.plot(time_span, threshold_line_mm_per_s,
        '--r', label=f"Threshold: {speed_threshold * 1E3:.1f} mm/s")
# mark every sample whose speed exceeds the threshold
ax.plot(time[index_above_threshold], speed[index_above_threshold] * 1E3,
        '.', label="Speed Above Threshold")
ax.set_ylabel("Speed (mm/s)")
ax.set_xlabel("Time (s)")
ax.set_title(f"Speed for zebrafish in well {well_name}")
ax.legend()
ax.grid()

# %% cleanup the data
# Require at least 5 consecutive time points above the threshold,
# approximately 31.25 ms at 160 fps (5 / 160 s), to be considered a peak.
# You can reduce this to 3 instead of 5 for 120 fps
# Should be an odd number
minimum_consecutive_points = 5

# work on a copy so the raw mask stays available for plotting and comparison
index_above_threshold_clean = index_above_threshold.copy()
# Erode by two points on either side
# Remove two rising edges and two falling edges
# range(1, minimum_consecutive_points, 2) runs (minimum_consecutive_points - 1) / 2
# passes, i.e. 2 passes for 5 points; each pass trims one sample from the start
# and one from the end of every run, so runs shorter than
# minimum_consecutive_points disappear entirely

for i in range(1, minimum_consecutive_points, 2):
    # with prepend=False the diff is True where a sample differs from the one
    # before it: the first sample of each run and the first sample after it
    edges = np.diff(index_above_threshold_clean, prepend=False)
    # clearing those positions removes the first sample of every run
    index_above_threshold_clean[edges] = False
    # with append=False the diff is True where a sample differs from the one
    # after it: the last sample of each run and the last sample before it
    edges = np.diff(index_above_threshold_clean, append=False)
    # clearing those positions removes the last sample of every run
    index_above_threshold_clean[edges] = False


# Dilate by the same number of passes so that the runs which survived the
# erosion grow back by one sample on each side per pass
for i in range(1, minimum_consecutive_points, 2):
    edges = np.diff(index_above_threshold_clean, append=False)
    # setting those positions extends every run by one sample to the left
    index_above_threshold_clean[edges] = True
    edges = np.diff(index_above_threshold_clean, prepend=False)
    # setting those positions extends every run by one sample to the right
    index_above_threshold_clean[edges] = True

# compare the raw and the cleaned threshold crossings on one figure
fig, ax = plt.subplots()

# full speed trace
ax.plot(time, speed * 1E3, label="Zebrafish Speed (mm/s)")

# threshold drawn as a horizontal line from the first to the last time
time_span = [time[0], time[-1]]
threshold_line_mm_per_s = [speed_threshold * 1E3, speed_threshold * 1E3]
ax.plot(time_span, threshold_line_mm_per_s, '--r',
        label=f"Threshold: {speed_threshold * 1E3:.1f} mm/s")

# every sample above the threshold, before cleanup
ax.plot(time[index_above_threshold], speed[index_above_threshold] * 1E3, '.',
        label="Speed Above Threshold (raw)")

# samples kept by the cleanup; .where() leaves NaN everywhere else, so the
# line is only drawn across the surviving runs
cleaned_speed_mm_per_s = speed.where(index_above_threshold_clean) * 1E3
ax.plot(time, cleaned_speed_mm_per_s, '-o',
        label="Speed Above Threshold (filtered)",
        markerfacecolor=(0, 0, 0, 0), markeredgecolor='m',
        color="m")

ax.set_ylabel("Speed (mm/s)")
ax.set_xlabel("Time (s)")
ax.set_title(f"Speed for zebrafish in well {well_name}")
ax.legend()
ax.grid()
# %% Count the number of events:
# An event is one unbroken run of True values in the cleaned mask.
# The mask is padded with a 0 on both sides before differencing so that every
# run yields exactly one rising (+1) and one falling (-1) transition, even
# when the run is still in progress at the first or last recorded sample.
# Without the padding on the right, a run that reaches the end of the
# recording has a start but no end, and the start and end arrays no longer
# line up.
event_times = index_above_threshold_clean.index.to_numpy()
clean_mask = index_above_threshold_clean.to_numpy().astype(np.int8)
transitions = np.diff(clean_mask, prepend=0, append=0)

# a rising transition sits on the first sample of a run
start_positions = np.flatnonzero(transitions == 1)
# a falling transition sits on the first sample after a run; when the run
# reaches the end of the recording that sample does not exist, so the last
# recorded time point is used instead
end_positions = np.minimum(
    np.flatnonzero(transitions == -1),
    len(event_times) - 1,
)

time_event_start = event_times[start_positions]
time_event_end = event_times[end_positions]
number_of_events = len(time_event_end)
event_duration = time_event_end - time_event_start
print(f"There were {number_of_events} events")
if number_of_events > 0:
    average_duration = event_duration.mean()
    print(f"The average duration of the events was {average_duration * 1E3:.0f} milliseconds.")
else:
    # the mean of zero durations is undefined; report that explicitly
    average_duration = float('nan')
    print("No events were detected, so no average duration can be reported.")

Zebrafish Thigmotaxis Assay Analysis¶

"""
%% Sample Thigmotaxis Assay Analysis
By Ramona Optics Inc. Copyright 2022-2024

This example script gives one method for using MCAM™ tracking data to analyze
a Thigmotaxis assay using a 24-well plate

According to one publication (Schnorr S., et al., 2011), the authors
validate a Thigmotaxis assay using a 24 well plate (16.2mm diameter wells)
with both light/dark conditions and stimulant/depressant chemical
experimental conditions. The authors comment (Materials and Methods
Section 2.3, pg. 368) that well plate selection is determined by assuring
the “swimming arena must be sufficiently large to allow distinction
between inner and outer zones” and to do this both inner and outer
zones must be “at least equivalent or larger than the body length of
the larvae (approx 4mm for larvae aged 5dpf)”. It is also noted that
a 6 well or 12 well format could work for this assay however using a
24-well plate the area of inner and outer zones are equal “thus ruling
out biases in the analysis of zone preference related to differences in
zone size.” Finally they comment that both 96- and 48-well plate formats
are likely too small to fit these requirements.

Reference: Measuring thigmotaxis in larval zebrafish Schnorr et al. 2011
10.1016/j.bbr.2011.12.016
https://www.sciencedirect.com/science/article/abs/pii/S0166432811008758?via%3Dihub

This assay has been formulated with the 24-well plate in mind. This script,
specifically, determines the radius of the inner zone of a single well for
each well of the well plate and checks if x, y locations of each fish are
within or outside of this zone.

Notes:
    For this analysis we have chosen not to interpolate to fill gaps of non-
    confident values. Only confident values are considered.

Assay Output (.csv):
Fraction confident frames
Fraction of time spent in the outer zone for each well
"""

import numpy as np
import pandas as pd

# %% definitions:
# previously output raw tracking data
tracking_data_filename = 'path/tracking_data.csv'
# where the results are written,
# the filename needs a '.csv' suffix
output_filepath = 'path/thigmotaxis_data.csv'

# width of the outer zone, an input parameter given in millimeters
outer_zone_width_in_mm = 4
# diameter of a single well, also in millimeters; adjust it to match the
# well plate in use
well_diameter_in_mm = 16.2
well_radius_in_mm = well_diameter_in_mm / 2
# whatever remains of the radius inside the outer zone is the inner zone
inner_zone_radius_in_mm = well_radius_in_mm - outer_zone_width_in_mm
inner_zone_radius_in_m = inner_zone_radius_in_mm / 1E3

# confidence threshold used to discard badly tracked keypoints
# anecdotally 0.1 yields a very similar result to 0.95 while retaining
# significantly more frames, we recommend using 0.1
confidence_threshold = 0.1
# keypoint whose position is analyzed, generally 'center'
tracked_keypoint = 'center'

# %% load the previously exported raw tracking data
# '#' comment lines are skipped, the four header rows become the column
# levels and the first column becomes the row index
tracking_data_df = pd.read_csv(
    tracking_data_filename,
    comment='#',
    header=[0, 1, 2, 3],
    index_col=0,
)
N_frames = len(tracking_data_df)

# collect the well letters and numbers that occur in the column keys
# (level 0 is the letter and level 1 the number of each key)
column_keys_array = np.array(list(tracking_data_df.keys()))
well_letters = np.unique(column_keys_array[:, 0])
# sort the numbers by their integer value so that e.g. '10' comes after '9'
well_numbers = sorted(np.unique(column_keys_array[:, 1]), key=int)
# every letter/number combination, letters varying slowest
wellnames = [
    (well_letter, well_number)
    for well_letter in well_letters
    for well_number in well_numbers
]

# output array: one row per reported quantity, one column per well
output_data = np.zeros((2, len(wellnames)))

# %% work through the wells one by one, measuring time spent in the outer zone
for i, (well_letter, well_number) in enumerate(wellnames):
    well_prefix = (well_letter, well_number, tracked_keypoint)
    x_key = well_prefix + ('x',)
    y_key = well_prefix + ('y',)
    likelihood_key = well_prefix + ('likelihood',)

    # keep only the frames whose likelihood reaches the confidence threshold
    is_confident = tracking_data_df[likelihood_key] >= confidence_threshold
    confident_frames = tracking_data_df[is_confident]
    N_confident_frames = len(confident_frames)
    fraction_confident = N_confident_frames / N_frames

    # distance of the keypoint from the origin in every confident frame
    x_squared = confident_frames[x_key] ** 2
    y_squared = confident_frames[y_key] ** 2
    distance_from_origin = np.sqrt(x_squared + y_squared)

    # frames in which the fish is beyond the inner zone radius
    is_in_outer_zone = distance_from_origin > inner_zone_radius_in_m
    outer_zone_frames = len(confident_frames[is_in_outer_zone])
    # the fraction is taken over ALL frames, so frames below the confidence
    # threshold count as time not spent in the outer zone
    fraction_in_outer_zone = outer_zone_frames / N_frames

    # row 0 holds the confident fraction, row 1 the outer zone fraction
    output_data[0, i] = fraction_confident
    output_data[1, i] = fraction_in_outer_zone


# %% wrap the results in a dataframe: one row per quantity, one column per well
index = ['fraction_confident_frames', 'fraction_in_outer_zone']
column_keys = pd.MultiIndex.from_tuples(wellnames)
thigmotaxis_data_df = pd.DataFrame(output_data, index=index, columns=column_keys)

# %% write the results to disk
thigmotaxis_data_df.to_csv(output_filepath, index=True)

Extracting Stimulus Metadata¶

"""
# %% Extract stimulus metadata from an MCAM dataset
# By Ramona Optics Inc. Copyright 2023-2024

Modify the metadata and output paths.

This script assumes that stimulus information is present in the input metadata file.

"""

from pathlib import Path

from owl import mcam_data
from owl.analysis.tracking_data_analysis import export_csv, make_stimulus_metadata_dataframe

# metadata file to read and the folder the csv is written to
metadata_path = '/path/to/metadata.nc'
output_path = Path('/path/to/output_folder')

metadata = mcam_data.load(metadata_path)

# arrange the stimulus metadata as a dataframe indexed by time
stimulus_metadata_df, header = make_stimulus_metadata_dataframe(
    metadata, row_index='time',
)

# write the dataframe next to the other outputs
output_filepath = output_path / 'stimulus_metadata.csv'
export_csv(stimulus_metadata_df, output_filepath, header=header, index=True)

print(f"Stimulus metadata saved to {output_filepath}")

For more information, please see the section titled “MCAM Data Analysis” in the MCAM User Manual.