# Source code for keypoint_moseq.util

import os
import glob
import tabulate
import warnings
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import jax, jax.numpy as jnp
from textwrap import fill
from scipy.ndimage import median_filter, convolve1d, gaussian_filter1d
from sklearn.decomposition import PCA
from sklearn.neighbors import NearestNeighbors
from scipy.spatial.distance import pdist, squareform
from jax_moseq.models.keypoint_slds import inverse_rigid_transform
from jax_moseq.utils import get_frequencies, batch
from vidio.read import OpenCVReader
from typing import Optional

# Short alias for `jnp.newaxis` (adds a length-1 axis when used in an index expression).
na = jnp.newaxis



[docs]
def np_io(fn):
    """Wrap a function of jax arrays so that it accepts and returns numpy arrays.

    Parameters
    ----------
    fn: callable
        Function operating on jax arrays.

    Returns
    -------
    wrapped: callable
        Function with the same call signature as `fn`. Its positional and
        keyword arguments are passed through ``jax.device_put`` before `fn`
        is called, and the output of `fn` is passed through
        ``jax.device_get`` before being returned.
    """

    def wrapped(*args, **kwargs):
        device_args = jax.device_put(args)
        device_kwargs = jax.device_put(kwargs)
        return jax.device_get(fn(*device_args, **device_kwargs))

    return wrapped




[docs]
def print_dims_to_explain_variance(pca, f):
    """Print the number of principal components required to explain a given
    fraction of variance.

    If all components together explain less than `f`, the total explained
    variance is printed instead.

    Parameters
    ----------
    pca: sklearn.decomposition._pca.PCA, A fit PCA model
    f: float, Target variance fraction
    """
    cs = np.cumsum(pca.explained_variance_ratio_)
    if cs[-1] < f:
        print(f"All components together only explain {cs[-1]*100}% of variance.")
    else:
        # `>=` (not `>`) so that a cumulative sum that hits `f` exactly counts
        # as reaching the target; in this branch at least the last entry
        # satisfies the condition, so argmax returns the first such index.
        n_components = int(np.argmax(cs >= f)) + 1
        print(f">={f*100}% of variance explained by {n_components} components.")




[docs]
def list_files_with_exts(filepath_pattern, ext_list, recursive=True):
    """List all the files matching a pattern and with an extension in a list
    of extensions.

    Parameters
    ----------
    filepath_pattern : str, path-like, or list/tuple thereof
        A filepath pattern or a list thereof. Filepath patterns can be a
        single file, a directory, or a path with wildcards (e.g.,
        '/path/to/dir/prefix*').

    ext_list : str or list of str
        A file extension or list of file extensions to search for.
        Extensions are matched case-insensitively, with or without a leading
        ".".

    recursive : bool, default=True
        Whether to search for files recursively.

    Returns
    -------
    list
        A list of file paths. When `filepath_pattern` is a list or tuple the
        result is de-duplicated and sorted.
    """
    if isinstance(filepath_pattern, (list, tuple)):
        matches = []
        for fp in filepath_pattern:
            matches += list_files_with_exts(fp, ext_list, recursive=recursive)
        return sorted(set(matches))

    # `glob` only understands str patterns, so unwrap path-like objects
    filepath_pattern = os.fspath(filepath_pattern)

    # a bare string would otherwise be iterated character by character
    if isinstance(ext_list, str):
        ext_list = [ext_list]

    # make sure extensions all start with "." and are lowercase
    allowed_exts = {"." + ext.strip(".").lower() for ext in ext_list}

    if os.path.isdir(filepath_pattern):
        filepath_pattern = os.path.join(filepath_pattern, "*")

    # find all matches (recursively)
    matches = glob.glob(filepath_pattern)
    if recursive:
        for match in list(matches):
            matches += glob.glob(os.path.join(match, "**"), recursive=True)

    # filter matches by extension
    return [match for match in matches if os.path.splitext(match)[1].lower() in allowed_exts]




[docs]
def find_matching_videos(
    keys,
    video_dir,
    as_dict=False,
    recursive=True,
    recording_name_suffix="",
    video_extension=None,
):
    """
    Find video files for a set of recording names. The filename of each video
    is assumed to be a prefix within the recording name, i.e. the recording
    name has the form `{video_name}{more_text}`. If more than one video matches
    a recording name, the longest match will be used. For example given the
    following video directory::

        video_dir
        ├─ videoname1.avi
        └─ videoname2.avi

    the videos would be matched to recording names as follows::

        >>> keys = ['videoname1blahblah','videoname2yadayada']
        >>> find_matching_videos(keys, video_dir, as_dict=True)

        {'videoname1blahblah': 'video_dir/videoname1.avi',
         'videoname2yadayada': 'video_dir/videoname2.avi'}

    A suffix can also be specified, in which case the recording name is assumed
    to have the form `{video_name}{suffix}{more_text}`.

    Parameters
    ----------
    keys: iterable
        Recording names (as strings)

    video_dir: str
        Path to the video directory.

    video_extension: str, default=None
        Extension of the video files. If None, videos are assumed to have
        one of the following extensions: "mp4", "avi", "mov"

    recursive: bool, default=True
        If True, search recursively for videos in subdirectories of
        `video_dir`.

    as_dict: bool, default=False
        Determines whether to return a dict mapping recording names to video
        paths, or a list of paths in the same order as `keys`.

    recording_name_suffix: str, default=""
        Suffix to append to the video name when searching for a match. `None`
        is treated the same as an empty string.

    Returns
    -------
    video_paths: list or dict (depending on `as_dict`)

    Raises
    ------
    AssertionError
        If no video matches one of the recording names.
    """
    if video_extension is None:
        extensions = [".mp4", ".avi", ".mov"]
    elif video_extension.startswith("."):
        extensions = [video_extension]
    else:
        extensions = ["." + video_extension]

    suffix = "" if recording_name_suffix is None else recording_name_suffix

    # `keys` is iterated twice when `as_dict=True`; materialize it so that
    # one-shot iterables (e.g. generators) are not exhausted by the first pass
    keys = list(keys)

    videos = list_files_with_exts(video_dir, extensions, recursive=recursive)
    videos_to_paths = {os.path.splitext(os.path.basename(f))[0]: f for f in videos}

    video_paths = []
    for key in keys:
        key_name = os.path.basename(key)
        matches = [v for v in videos_to_paths if key_name.startswith(v + suffix)]
        assert len(matches) > 0, fill(f"No matching videos found for {key}")

        # all matches are prefixes of the same string, so lengths are unique
        longest_match = max(matches, key=len)
        video_paths.append(videos_to_paths[longest_match])

    if as_dict:
        return dict(zip(keys, video_paths))
    return video_paths




[docs]
def pad_along_axis(arr, pad_widths, axis=0, value=0):
    """Pad an array with a constant value along one axis only.

    Parameters
    ----------
    arr: ndarray, Array to be padded
    pad_widths: tuple (int,int), Amount of padding on either end
    axis: int, Axis along which to add padding
    value: float, Value of padded array elements

    Returns
    -------
    padded_arr: ndarray
    """
    # no padding on any axis except the requested one
    per_axis_widths = [(0, 0) for _ in arr.shape]
    per_axis_widths[axis] = pad_widths
    return np.pad(arr, per_axis_widths, constant_values=value)




[docs]
def filter_angle(angles, size=9, axis=0, method="median"):
    """Filter a time-series of angles by transforming to a (cos,sin)
    representation, filtering in R^2, and then transforming back into angle
    space.

    Parameters
    ----------
    angles: ndarray
        Array of angles (in radians)

    size: int, default=9
        Size of the filtering kernel. For `method='gaussian'` this value is
        passed to ``gaussian_filter1d`` as the standard deviation.

    axis: int, default=0
        Axis along which to filter. Negative values count from the last axis.

    method: str, default='median'
        Method for filtering. Options are 'median' and 'gaussian'

    Returns
    -------
    filtered_angles: ndarray

    Raises
    ------
    ValueError
        If `method` is not one of the supported options, or if `axis` is out
        of bounds for `angles` when `method='median'`.
    """
    if method == "median":
        ndim = np.ndim(angles)
        if not -ndim <= axis < ndim:
            raise ValueError(f"axis {axis} is out of bounds for array of dimension {ndim}")
        # normalize so that negative axes select the intended dimension
        target_axis = axis % ndim
        kernel = tuple(size if dim == target_axis else 1 for dim in range(ndim))

        def smooth(x):
            return median_filter(x, size=kernel)

    elif method == "gaussian":

        def smooth(x):
            return gaussian_filter1d(x, size, axis=axis)

    else:
        raise ValueError(f"Invalid method: {method!r}. Options are 'median' and 'gaussian'")

    # filtering sin and cos separately avoids artifacts at the +/-pi wrap-around
    return np.arctan2(smooth(np.sin(angles)), smooth(np.cos(angles)))




[docs]
def get_centroids_headings(
    coordinates,
    anterior_idxs,
    posterior_idxs,
    bodyparts=None,
    use_bodyparts=None,
    **kwargs,
):
    """Compute centroids and headings from keypoint coordinates.

    NaN keypoints are imputed by linear interpolation before anything is
    computed. The centroid is the median across keypoints and the heading is
    derived from the first two coordinate dimensions of the mean anterior and
    mean posterior keypoint locations.

    Parameters
    ----------
    coordinates: dict
        Dictionary mapping recording names to keypoint coordinates as
        ndarrays of shape (n_frames, n_bodyparts, [2 or 3]).

    anterior_idxs: array-like of int
        Indices of anterior bodyparts (after reindexing by `use_bodyparts`
        when the latter is specified).

    posterior_idxs: array-like of int
        Indices of posterior bodyparts (after reindexing by `use_bodyparts`
        when the latter is specified).

    bodyparts: list of str, default=None
        List of bodypart names in `coordinates`. Used to reindex coordinates
        when `use_bodyparts` is specified.

    use_bodyparts: list of str, default=None
        Ordered list of bodyparts used to reindex `coordinates`.

    Returns
    -------
    centroids: dict
        Dictionary mapping recording names to centroid coordinates as ndarrays
        of shape (n_frames, [2 or 3]).

    headings: dict
        Dictionary mapping recording names to heading angles (in radians) as 1d
        arrays of shape (n_frames,). Values lie in [0, 2*pi].
    """
    needs_reindexing = not (bodyparts is None or use_bodyparts is None)
    if needs_reindexing:
        coordinates = reindex_by_bodyparts(coordinates, bodyparts, use_bodyparts)

    centroids = {}
    headings = {}
    for name, raw in coordinates.items():
        missing = np.isnan(raw).any(-1)
        xyz = interpolate_keypoints(raw, missing)
        centroids[name] = np.median(xyz, axis=1)

        # This vector points from the mean anterior location to the mean
        # posterior location; adding pi to its angle below flips it, so the
        # heading points from posterior to anterior.
        mean_posterior = xyz[:, posterior_idxs].mean(1)
        mean_anterior = xyz[:, anterior_idxs].mean(1)
        backward_vec = (mean_posterior - mean_anterior)[:, :2]
        headings[name] = np.arctan2(backward_vec[:, 1], backward_vec[:, 0]) + np.pi

    return centroids, headings




[docs]
def filter_centroids_headings(centroids, headings, filter_size=9):
    """Median-filter centroids and headings along the time axis.

    Centroids are filtered with a kernel of shape ``(filter_size, 1)``;
    headings are filtered with :py:func:`keypoint_moseq.util.filter_angle`
    using its default method.

    Parameters
    ----------
    centroids: dict
        Centroids stored as a dictionary mapping recording names to ndarrays,
        of shape (n_frames, [2 or 3]).

    headings: dict
        Dictionary mapping recording names to heading angles (in radians) as 1d
        arrays of shape (n_frames,).

    filter_size: int, default=9
        Kernel size for median filtering

    Returns
    -------
    filtered_centroids: dict
    filtered_headings: dict
    """
    # size-1 second dimension: each coordinate column is filtered independently
    kernel_shape = (filter_size, 1)

    filtered_centroids = {}
    for name, positions in centroids.items():
        filtered_centroids[name] = median_filter(positions, kernel_shape)

    filtered_headings = {}
    for name, angles in headings.items():
        filtered_headings[name] = filter_angle(angles, size=filter_size)

    return filtered_centroids, filtered_headings




[docs]
def get_syllable_instances(
    stateseqs,
    min_duration=3,
    pre=30,
    post=60,
    min_frequency=0,
    min_instances=0,
):
    """Map each syllable to a list of instances when it occurred.

    Only instances that meet the criteria specified by `pre`, `post`, and
    `min_duration` are included, and only syllables that meet the criteria
    specified by `min_frequency` and `min_instances` are returned.

    Parameters
    ----------
    stateseqs: dict {str : 1d array}
        Dictionary mapping names to syllable sequences

    min_duration: int, default=3
        Minimum duration (in frames) for inclusion of a syllable instance

    pre: int, default=30
        Syllable instances that start before this index in the state
        sequence are excluded

    post: int, default=60
        Syllable instances that start within the last `post` frames of the
        state sequence are excluded

    min_frequency: float, default=0
        Minimum allowed frequency (across all state sequences, as computed by
        ``get_frequencies``) for inclusion of a syllable

    min_instances: int, default=0
        Minimum number of retained instances (across all state sequences) for
        inclusion of a syllable

    Returns
    -------
    syllable_instances: dict
        Dictionary mapping each syllable to a list of instances. Each instance
        is a tuple (name,start,end) representing subsequence
        `stateseqs[name][start:end]`.
    """
    num_syllables = int(max(map(max, stateseqs.values())) + 1)
    instances_by_syllable = [[] for _ in range(num_syllables)]

    for name, seq in stateseqs.items():
        # indices at which the syllable label changes
        change_points = np.nonzero(seq[1:] != seq[:-1])[0] + 1
        starts = np.insert(change_points, 0, 0)
        ends = np.append(change_points, len(seq))

        long_enough = ends - starts >= min_duration
        after_pre = starts >= pre
        before_post = starts < len(seq) - post
        keep = long_enough & after_pre & before_post

        kept_starts = starts[keep]
        for start, end, syllable in zip(kept_starts, ends[keep], seq[kept_starts]):
            instances_by_syllable[syllable].append((name, start, end))

    frequent_enough = get_frequencies(stateseqs) >= min_frequency
    instance_counts = np.array([len(instances) for instances in instances_by_syllable])
    numerous_enough = instance_counts >= min_instances
    use_syllables = np.all([frequent_enough, numerous_enough], axis=0).nonzero()[0]
    return {syllable: instances_by_syllable[syllable] for syllable in use_syllables}




[docs]
def get_edges(use_bodyparts, skeleton):
    """Represent the skeleton as a list of index-pairs.

    Parameters
    ----------
    use_bodyparts: list
        Bodypart names

    skeleton: list
        Pairs of bodypart names as tuples (bodypart1,bodypart2), or pairs of
        integer indexes (Python or numpy integers), in which case `skeleton`
        is returned unchanged.

    Returns
    -------
    edges: list
        Pairs of indexes representing the entries of `skeleton`. Pairs that
        name a bodypart not present in `use_bodyparts` are dropped.

    Raises
    ------
    AssertionError
        If the skeleton is given as bodypart names and `use_bodyparts` is
        None.
    """
    if len(skeleton) == 0:
        return []

    # numpy integers (e.g. from an index array) are not instances of `int`,
    # so both kinds must be checked to recognize an index-based skeleton
    if isinstance(skeleton[0][0], (int, np.integer)):
        return skeleton

    assert use_bodyparts is not None, fill(
        "If skeleton edges are specified using bodypart names, "
        "`use_bodyparts` must be specified"
    )

    edges = []
    for bp1, bp2 in skeleton:
        if bp1 in use_bodyparts and bp2 in use_bodyparts:
            edges.append([use_bodyparts.index(bp1), use_bodyparts.index(bp2)])
    return edges




[docs]
def reindex_by_bodyparts(data, bodyparts, use_bodyparts, axis=1):
    """Select and reorder keypoints according to an ordered list of bodyparts.

    Parameters
    ----------
    data: dict or ndarray
        A single array of keypoint coordinates or a dict mapping from names to
        arrays of keypoint coordinates

    bodyparts: list
        Label for each keypoint represented in `data`

    use_bodyparts: list
        Ordered subset of keypoint labels

    axis: int, default=1
        The axis in `data` that represents keypoints. It is required that
        `data.shape[axis]==len(bodyparts)`.

    Returns
    -------
    reindexed_data: ndarray or dict
        Keypoint coordinates in the same form as `data` with reindexing
        applied.
    """
    # position of each requested bodypart within the original ordering
    keypoint_order = np.array([bodyparts.index(name) for name in use_bodyparts])

    if not isinstance(data, np.ndarray):
        reindexed = {}
        for key, values in data.items():
            reindexed[key] = np.take(values, keypoint_order, axis)
        return reindexed

    return np.take(data, keypoint_order, axis)




[docs]
def get_instance_trajectories(
    syllable_instances,
    coordinates,
    pre=0,
    post=None,
    centroids=None,
    headings=None,
    filter_size=9,
):
    """Extract keypoint trajectories for a collection of syllable instances.

    If both centroids and headings are provided, they are first filtered and
    each trajectory is then transformed into the ego-centric reference frame
    from the moment of syllable onset. When `post` is not None, trajectories
    all terminate a fixed number of frames after syllable onset.

    Parameters
    ----------
    syllable_instances: list
        List of syllable instances, where each instance is a tuple of the form
        (name,start,end)

    coordinates: dict
        Dictionary mapping names to coordinates, formatted as ndarrays with
        shape (num_frames, num_keypoints, d)

    pre: int, default=0
        Number of frames to include before syllable onset

    post: int, default=None
        Determines the length of the trajectory. When `post=None`, the
        trajectory terminates at the end of the syllable instance. Otherwise
        the trajectory terminates a fixed number of frames after syllable
        onset (where the number is determined by `post`).

    centroids: dict, default=None
        Dictionary with the same keys as `coordinates` mapping each name to an
        ndarray with shape (num_frames, d)

    headings: dict, default=None
        Dictionary with the same keys as `coordinates` mapping each name to a
        1d array of heading angles in radians

    filter_size: int, default=9
        Size of median filter applied to `centroids` and `headings`

    Returns
    -------
    trajectories: list or ndarray
        List or array of trajectories (a list is used when `post=None`,
        otherwise an array). Each trajectory is an array of shape
        (n_frames, n_bodyparts, [2 or 3]).
    """
    egocentric = centroids is not None and headings is not None
    if egocentric:
        centroids, headings = filter_centroids_headings(
            centroids, headings, filter_size=filter_size
        )

    if post is not None:
        # fixed-length windows around each onset, stacked into one array
        windows = [
            coordinates[name][start - pre : start + post]
            for name, start, _ in syllable_instances
        ]
        trajectories = np.array(windows)
        if egocentric:
            onset_centroids = np.array(
                [centroids[name][start] for name, start, _ in syllable_instances]
            )[:, None]
            onset_headings = np.array(
                [headings[name][start] for name, start, _ in syllable_instances]
            )[:, None]
            trajectories = np_io(inverse_rigid_transform)(
                trajectories, onset_centroids, onset_headings
            )
        return trajectories

    # variable-length trajectories: one array per instance, ending with the syllable
    trajectories = []
    for name, start, end in syllable_instances:
        trajectories.append(coordinates[name][start - pre : end])

    if egocentric:
        to_egocentric = np_io(inverse_rigid_transform)
        trajectories = [
            to_egocentric(traj, centroids[name][start], headings[name][start])
            for traj, (name, start, _) in zip(trajectories, syllable_instances)
        ]
    return trajectories




[docs]
def sample_instances(
    syllable_instances,
    num_samples,
    mode="random",
    pca_samples=50000,
    pca_dim=4,
    n_neighbors=50,
    coordinates=None,
    pre=5,
    post=15,
    centroids=None,
    headings=None,
    filter_size=9,
):
    """Sample a fixed number of instances for each syllable.

    Parameters
    ----------
    syllable_instances: dict
        Mapping from each syllable to a list of instances, where each instance
        is a tuple of the form (name,start,end). Every syllable must have at
        least `num_samples` instances.

    num_samples: int
        Number of samples to return for each syllable

    mode: str, {'random', 'density'}, default='random'
        Sampling method to use. Options are:

        - 'random': Instances are chosen randomly (without replacement)
        - 'density': For each syllable, a syllable-specific density function is
          computed in trajectory space and compared to the overall density
          across all syllables. An exemplar instance that maximizes this ratio
          is chosen for each syllable, and its nearest neighbors are randomly
          sampled.

    pca_samples: int, default=50000
        Number of trajectories to sample when fitting a PCA model for density
        estimation (used when `mode='density'`)

    pca_dim: int, default=4
        Number of principal components to use for density estimation (used when
        `mode='density'`)

    n_neighbors: int, default=50
        Number of neighbors to use for density estimation and for sampling the
        neighbors of the exemplar syllable instance (used when
        `mode='density'`). Must be at least `num_samples`. For syllables with
        fewer than `n_neighbors` instances, all of their instances are used as
        neighbors.

    coordinates, pre, post, centroids, headings, filter_size
        Passed to :py:func:`keypoint_moseq.util.get_instance_trajectories`.
        `coordinates`, `centroids` and `headings` are required when
        `mode='density'`. The `coordinates` dict is not modified.

    Returns
    -------
    sampled_instances: dict
        Dictionary in the same format as `syllable_instances` mapping each
        syllable to a list of sampled instances.
    """
    assert mode in ["random", "density"]
    assert all([len(v) >= num_samples for v in syllable_instances.values()])

    if mode == "random":
        sampled_instances = {
            syllable: [
                instances[i] for i in np.random.choice(len(instances), num_samples, replace=False)
            ]
            for syllable, instances in syllable_instances.items()
        }
        return sampled_instances

    elif mode == "density":
        # only density sampling draws from a neighborhood, so this constraint
        # is not imposed on random sampling
        assert n_neighbors >= num_samples
        assert not (coordinates is None or headings is None or centroids is None), fill(
            "`coordinates`, `headings` and `centroids` are required when " '`mode == "density"`'
        )

        # build a new dict so that the caller's `coordinates` is not
        # overwritten with the interpolated arrays
        coordinates = {
            key: interpolate_keypoints(coords, np.isnan(coords).any(-1))
            for key, coords in coordinates.items()
        }

        trajectories = {
            syllable: get_instance_trajectories(
                instances,
                coordinates,
                pre=pre,
                post=post,
                centroids=centroids,
                headings=headings,
                filter_size=filter_size,
            )
            for syllable, instances in syllable_instances.items()
        }
        X = np.vstack(list(trajectories.values()))

        if X.shape[0] > pca_samples:
            X = X[np.random.choice(X.shape[0], pca_samples, replace=False)]

        X_flat = X.reshape(X.shape[0], -1)
        pca = PCA(n_components=pca_dim).fit(X_flat)
        # a neighbor query cannot ask for more neighbors than fitted points
        all_nbrs = NearestNeighbors(n_neighbors=min(n_neighbors, X_flat.shape[0])).fit(
            pca.transform(X_flat)
        )

        sampled_instances = {}

        for syllable, X_syllable in trajectories.items():
            Xpca = pca.transform(X_syllable.reshape(X_syllable.shape[0], -1))
            # clamp to the number of instances of this syllable (which is at
            # least `num_samples`, so enough neighbors remain to sample from)
            k_local = min(n_neighbors, Xpca.shape[0])
            nbrs = NearestNeighbors(n_neighbors=k_local).fit(Xpca)
            distances, indices = nbrs.kneighbors(Xpca)
            local_density = 1 / distances.mean(1)

            distances, _ = all_nbrs.kneighbors(Xpca)
            global_density = 1 / distances.mean(1)
            exemplar = np.argmax(local_density / global_density)
            samples = np.random.choice(indices[exemplar], num_samples, replace=False)
            sampled_instances[syllable] = [syllable_instances[syllable][i] for i in samples]

        return sampled_instances

    else:
        # only reachable when assertions are disabled (python -O)
        raise ValueError("Invalid mode: {}".format(mode))




[docs]
def interpolate_along_axis(x, xp, fp, axis=0):
    """Linearly interpolate an array along one of its axes.

    Each 1d slice of `fp` along `axis` is interpolated independently with
    ``np.interp``.

    Parameters
    ----------
    x: 1D array
        The x-coordinates of the interpolated values
    xp: 1D array
        The x-coordinates of the data points
    fp: ndarray
        The y-coordinates of the data points. fp.shape[axis] must
        be equal to the length of xp.
    axis: int, default=0
        The axis of `fp` along which to interpolate.

    Returns
    -------
    x_interp: ndarray
        The interpolated values, with the same shape as fp except along the
        interpolation axis, which has length ``len(x)``.
    """
    assert len(xp.shape) == len(x.shape) == 1
    assert fp.shape[axis] == len(xp)
    assert len(xp) > 0, "xp must be non-empty; cannot interpolate without datapoints"

    # bring the interpolation axis to the front and flatten everything else
    # so that each column is one independent 1d signal
    fp_front = np.moveaxis(fp, axis, 0)
    trailing_shape = fp_front.shape[1:]
    columns = fp_front.reshape(fp_front.shape[0], -1)

    n_out = len(x)
    n_columns = columns.shape[1]
    interpolated = np.zeros((n_out, n_columns))
    for j, column in enumerate(columns.T):
        interpolated[:, j] = np.interp(x, xp, column)

    # restore the original layout
    interpolated = interpolated.reshape(n_out, *trailing_shape)
    return np.moveaxis(interpolated, 0, axis)




[docs]
def interpolate_keypoints(coordinates, outliers):
    """Impute the coordinates of outliers by linear interpolation over time.

    Each keypoint is handled separately, using its non-outlier frames as the
    data points for interpolation. A keypoint with no non-outlier frames is
    left as zeros in the output.

    Parameters
    ----------
    coordinates : ndarray of shape (num_frames, num_keypoints, dim)
        Keypoint observations.
    outliers : ndarray of shape (num_frames, num_keypoints)
        Binary indicator whose true entries are outlier points.

    Returns
    -------
    interpolated_coordinates : ndarray with same shape as `coordinates`
        Keypoint observations with outliers imputed.
    """
    num_frames, num_keypoints = coordinates.shape[:2]
    all_frames = np.arange(num_frames)

    imputed = np.zeros_like(coordinates)
    for k in range(num_keypoints):
        valid_frames = np.nonzero(~outliers[:, k])[0]
        if len(valid_frames) == 0:
            # nothing to interpolate from
            continue
        imputed[:, k, :] = interpolate_along_axis(
            all_frames, valid_frames, coordinates[valid_frames, k, :]
        )
    return imputed




[docs]
def filtered_derivative(Y_flat, ksize, axis=0):
    """Compute the filtered derivative of a signal along a given axis.

    The result is the difference between two box-filtered copies of the
    signal that use the same kernel with opposite offsets (``origin``
    arguments to ``convolve1d``).

    When `ksize=3`, for example, the filtered derivative is

    .. math::

        \\dot{y_t} = \\frac{1}{3}( x_{t+3}+x_{t+2}+x_{t+1}-x_{t-1}-x_{t-2}-x_{t-3})

    NOTE(review): the kernel built below has ``ksize + 1`` equal weights of
    ``1 / (ksize + 1)``, whereas the formula above shows a factor of
    ``1 / ksize`` -- confirm which normalization is intended.

    Parameters
    ----------
    Y_flat: ndarray
        The signal to differentiate

    ksize: int
        The size of the filter. Must be odd.

    axis: int, default=0
        The axis along which to differentiate

    Returns
    -------
    dY: ndarray
        The filtered derivative of the signal
    """
    n_taps = ksize + 1
    box_kernel = np.full(n_taps, 1.0 / n_taps)

    # the two origins place the same box kernel at opposite offsets
    origin_pre = (-n_taps) // 2
    origin_post = ksize // 2

    smoothed_pre = convolve1d(Y_flat, box_kernel, axis=axis, origin=origin_pre)
    smoothed_post = convolve1d(Y_flat, box_kernel, axis=axis, origin=origin_post)
    return smoothed_post - smoothed_pre




[docs]
def permute_cyclic(arr, mask=None, axis=0):
    """Cyclically permute an array along a given axis.

    Each 1d slice along `axis` is rolled by its own random shift drawn with
    ``np.random.randint``. Only elements where the mask is positive are
    rolled (among themselves); elements where the mask is not positive are
    set to zero in the output.

    Parameters
    ----------
    arr: ndarray
        The array to permute

    mask: ndarray, optional
        A mask with the same shape as `arr` whose positive entries indicate
        which elements to permute. If None, all elements are permuted.

    axis: int, default=0
        The axis along which to permute

    Returns
    -------
    arr_permuted: ndarray
        The permuted array
    """
    if mask is None:
        mask = np.ones_like(arr)

    arr = np.moveaxis(arr, axis, 0)
    mask = np.moveaxis(mask, axis, 0)

    shape = arr.shape
    arr = arr.reshape(arr.shape[0], -1)
    mask = mask.reshape(mask.shape[0], -1)

    arr_permuted = np.zeros_like(arr)
    for i in range(arr.shape[1]):
        selected = mask[:, i] > 0
        n_selected = int(np.count_nonzero(selected))
        if n_selected == 0:
            # nothing to permute in this slice; `randint(0, 0)` would raise
            continue
        shift = np.random.randint(0, n_selected)
        arr_permuted[selected, i] = np.roll(arr[selected, i], shift)

    arr_permuted = arr_permuted.reshape(shape)
    arr_permuted = np.moveaxis(arr_permuted, 0, axis)
    return arr_permuted



def _print_colored_table(row_labels, col_labels, values):
    """Show a table of NaN proportions, colored when IPython is available.

    Parameters
    ----------
    row_labels: list
        Index labels for the rows of the table.

    col_labels: list
        Column labels of the table.

    values: array-like
        Table entries, passed to ``pd.DataFrame`` together with the labels.

    Returns
    -------
    colored_df: pandas Styler or None
        The styled table when ``IPython.display`` can be imported (in which
        case it is also displayed). Otherwise the table is printed as plain
        text and None is returned.
    """
    try:
        from IPython.display import display
    except ImportError:
        display = None

    title = "Proportion of NaNs"
    df = pd.DataFrame(values, index=row_labels, columns=col_labels)

    if display is None:
        # import the function explicitly: the `tabulate` module object itself
        # is not callable
        from tabulate import tabulate as render_table

        print(title)
        print(render_table(df, headers="keys", tablefmt="simple_grid", showindex=True))
        return None

    def colorize(val):
        color = plt.get_cmap("Reds")(val * 0.8)
        return f"background-color: rgba({int(color[0]*255)}, {int(color[1]*255)}, {int(color[2]*255)}, {color[3]})"

    styler = df.style
    # `Styler.applymap` is deprecated in favor of `Styler.map` in recent
    # pandas; use whichever one this pandas version provides
    apply_elementwise = getattr(styler, "map", None) or styler.applymap
    colored_df = apply_elementwise(colorize).set_caption(title)
    display(colored_df)
    return colored_df



[docs]
def check_nan_proportions(coordinates, bodyparts, warning_threshold=0.5, breakdown=False, **kwargs):
    """Check if any bodyparts have a high proportion of NaNs.

    A keypoint counts as NaN in a frame if any of its coordinates is NaN.

    Parameters
    ----------
    coordinates: dict
        Dictionary mapping filenames to keypoint coordinates as ndarrays of
        shape (n_frames, n_bodyparts, 2)

    bodyparts: list of str
        Name of each bodypart. The order of the names should match the order of
        the bodyparts in `coordinates`.

    warning_threshold: float, default=0.5
        If the proportion of NaNs for a bodypart (pooled over all arrays in
        `coordinates`) is greater than `warning_threshold`, then warnings are
        issued. Only used when `breakdown=False`.

    breakdown: bool, default=False
        Whether to print a table detailing the proportion of NaNs for each
        bodypart in each array of `coordinates` (instead of checking the
        pooled proportions against `warning_threshold`).
    """
    if breakdown:
        recording_names = sorted(coordinates.keys())
        per_recording_props = []
        for name in recording_names:
            per_recording_props.append(np.isnan(coordinates[name]).any(-1).mean(0))
        _print_colored_table(recording_names, bodyparts, per_recording_props)
        return

    pooled = np.concatenate(list(coordinates.values()))
    nan_props = np.isnan(pooled).any(-1).mean(0)
    over_threshold = nan_props > warning_threshold
    if not np.any(over_threshold):
        return

    flagged_bodyparts = [bp for bp, flagged in zip(bodyparts, over_threshold) if flagged]
    missing_template = (
        "\nCoordinates for the following bodyparts are missing (set to NaN) in at least "
        "{}% of frames:\n - {}\n\n"
    )
    warnings.warn(missing_template.format(warning_threshold * 100, "\n - ".join(flagged_bodyparts)))
    warnings.warn(
        "This may cause problems during modeling. See "
        "https://keypoint-moseq.readthedocs.io/en/latest/FAQs.html#high-proportion-of-nans"
        " for additional information."
    )



def _get_percent_padding(sequence_lengths, seg_length):
    """
    Calculate the percentage of padding required when batching sequences of the specified
    lengths (see :py:func:`keypoint_moseq.util.batch`)

    Parameters
    ----------
    sequence_lengths : numpy.ndarray
        Array of sequence lengths
    seg_length : int
        Segment length to use for batching

    Returns
    -------
    percent_padding: float
        Percentage of total padding required relative to total sequence length.
        Formula: (total_padding / total_sequence_length) * 100

    Examples
    --------
    >>> sequence_lengths = np.array([8, 15, 4])
    >>> seg_length = 10
    >>> percent_padding = _get_percent_padding(sequence_lengths, seg_length)
    # Returns padding percentage considering:
    # - Padding needed for 8-element sequence (2 elements)
    # - Padding needed for 15-element sequence (5 elements)
    # - Padding needed for 4-element sequence (6 elements)
    # Result will be (2+5+6) / (8+15+4) * 100 = 48.15%
    """
    padding = (-sequence_lengths % seg_length).sum()
    return padding / sequence_lengths.sum() * 100


def _find_optimal_segment_length(
    sequence_lengths,
    max_seg_length=10_000,
    max_percent_padding=50,
    min_fragment_length=4,
):
    """Find a segment length to use for batching.

    Parameters
    ----------
    sequence_lengths : array-like
        Lengths of sequences to be batched. Must be non-empty, and all lengths
        must be greater than `min_fragment_length`.
    max_seg_length : int, default=10_000
        Maximum allowed segment length.
    max_percent_padding : float, default=50
        Maximum allowed padding as a percentage of summed sequence lengths.
    min_fragment_length : int, default=4
        Minimum allowed sequence length after batching (excluding padding).

    Returns
    -------
    segment_length: int
        Segment length that (approximately) satisfies all constraints. Because
        of the second phase described below, the result can exceed
        `max_seg_length`.

    Raises
    ------
    AssertionError
        If `sequence_lengths` is empty or contains a length that is not
        greater than `min_fragment_length`.

    Notes
    -----
    The algorithm has two main phases:
    1. Find a segment length that satisfies the padding constraint by trying
       progressively shorter candidate lengths (the unique sequence lengths,
       capped at `max_seg_length`). If none qualifies, a warning is issued and
       `max_seg_length` is used.
    2. Increment segment length until every nonzero remainder left after
       splitting a sequence into segments is >= min_fragment_length
    """
    sequence_lengths = np.array(sequence_lengths)
    assert sequence_lengths.size > 0, "At least one sequence length is required"
    assert np.all(
        sequence_lengths > min_fragment_length
    ), f"All sequences must have at least {min_fragment_length + 1} elements"

    # `np.unique` returns sorted values; reverse to try the longest first
    candidate_seg_lengths = np.unique(np.minimum(sequence_lengths, max_seg_length))[::-1]

    for seg_length in candidate_seg_lengths:
        if _get_percent_padding(sequence_lengths, seg_length) <= max_percent_padding:
            break
    else:
        # no candidate satisfied the padding constraint
        warnings.warn(
            f"No segment length found that satisfies the padding constraint. "
            f"Using maximum value of {max_seg_length}. "
            f"This may cause modeling to run more slowly than necessary. "
            f"To fix, try decreasing 'max_seg_length'."
        )
        seg_length = max_seg_length

    while True:
        remainders = sequence_lengths % seg_length
        nonzero_remainders = remainders[remainders != 0]

        if np.all(nonzero_remainders >= min_fragment_length):
            break

        # at least one remainder is too short here, so the minimum exists
        seg_length += nonzero_remainders.min()

    # return a plain int regardless of which branch chose the value
    return int(seg_length)



[docs]
def format_data(
    coordinates,
    confidences=None,
    keys=None,
    bodyparts=None,
    use_bodyparts=None,
    conf_pseudocount=1e-3,
    added_noise_level=0.1,
    seg_length=None,
    max_seg_length=10_000,
    max_percent_padding=50,
    min_fragment_length=4,
    **kwargs,
):
    """Format keypoint coordinates and confidences for inference.

    Data are transformed as follows:
        1. Coordinates and confidences are each merged into a single array
           using :py:func:`keypoint_moseq.util.batch`. Each row of the merged
           arrays is a segment from one recording.
        2. The keypoints axis is reindexed according to the order of elements
           in `use_bodyparts` with respect to their initial order in
           `bodyparts`.
        3. Uniform noise proportional to `added_noise_level` is added to the
           keypoint coordinates to prevent degenerate solutions during fitting.
        4. Keypoint confidences are augmented by `conf_pseudocount`.
        5. Wherever NaNs occur in the coordinates, they are replaced by values
           imputed using linear interpolation, and the corresponding
           confidences are set to `conf_pseudocount`.

    The `coordinates` and `confidences` dictionaries passed by the caller are
    not modified; imputed values are written to internal shallow copies.

    Parameters
    ----------
    coordinates: dict
        Keypoint coordinates for a collection of recordings. Values must be
        numpy arrays of shape (T,K,D) where K is the number of keypoints and
        D={2 or 3}.

    confidences: dict, default=None
        Nonnegative confidence values for the keypoints in `coordinates` as
        numpy arrays of shape (T,K). If None, every keypoint is given a
        confidence of 1 (before `conf_pseudocount` is added).

    keys: list of str, default=None
        (See :py:func:`keypoint_moseq.util.batch`). If None, the sorted keys
        of `coordinates` are used.

    bodyparts: list, default=None
        Label for each keypoint represented in `coordinates`. Required to
        reindex coordinates and confidences according to `use_bodyparts`.

    use_bodyparts: list, default=None
        Ordered subset of keypoint labels to be used for modeling. If
        `use_bodyparts=None`, then all keypoints are used.

    conf_pseudocount: float, default=1e-3
        Pseudocount used to augment keypoint confidences.

    added_noise_level: float, default=0.1
        Half-width of the uniform noise added to every coordinate, i.e. noise
        is drawn from `[-added_noise_level, added_noise_level)`. The noise is
        generated from a fixed seed, so repeated calls give the same result.
        No noise is added when the value is not positive.

    seg_length: int, default=None
        Force a specific segment length for batching instead of determining one algorithmically.
        If provided, 'max_seg_length', and 'max_percent_padding' are ignored.
        'min_fragment_length' is still enforced to prevent downstream runtime errors.

    max_seg_length: int, default=10,000
        Maximum allowed segment length for batching (see :py:func:`keypoint_moseq.util.batch`).
        Ignored if `seg_length` is provided.

    max_percent_padding: float, default=50
        Maximum allowed padding as a percentage of the total sequence length when data are batched
        (see :py:func:`keypoint_moseq.util.batch`). Ignored if `seg_length` is provided.

    min_fragment_length: int, default=4
        Minimum allowed sequence length after batching (see :py:func:`keypoint_moseq.util.batch`).

    **kwargs
        Additional keyword arguments (ignored).

    Returns
    -------
    data: dict with the following items

        Y: jax array with shape (n_segs, seg_length, K, D)
            Keypoint coordinates from all recordings broken into fixed-length
            segments.

        conf: jax array with shape (n_segs, seg_length, K)
            Confidences from all recordings broken into fixed-length segments,
            augmented by `conf_pseudocount`.

        mask: jax array with shape (n_segs, seg_length)
            Binary array where 0 indicates areas of padding
            (see :py:func:`keypoint_moseq.util.batch`).

    metadata: tuple (keys, bounds)
        Metadata for the rows of `Y`, `conf` and `mask`, as a tuple with a
        array of recording names and an array of (start,end) times. See
        :py:func:`jax_moseq.utils.batch` for details.
    """
    if keys is None:
        keys = sorted(coordinates.keys())
    else:
        bad_keys = set(keys) - set(coordinates.keys())
        assert len(bad_keys) == 0, fill(f"Keys {bad_keys} not found in coordinates")

    assert len(keys) > 0, "No recordings found"

    num_keypoints = [coordinates[key].shape[-2] for key in keys]
    assert len(set(num_keypoints)) == 1, fill(
        f"All recordings must have the same number of keypoints, but "
        f"found {set(num_keypoints)} keypoints across recordings."
    )

    if bodyparts is not None:
        assert len(bodyparts) == num_keypoints[0], fill(
            f"The number of keypoints in `coordinates` ({num_keypoints[0]}) "
            f"does not match the number of labels in `bodyparts` "
            f"({len(bodyparts)})"
        )

    if any("/" in key for key in keys):
        warnings.warn(
            fill(
                'WARNING: Recording names should not contain "/", this will cause '
                "problems with saving/loading hdf5 files."
            )
        )

    if confidences is None:
        confidences = {key: np.ones_like(coordinates[key][..., 0]) for key in keys}

    if bodyparts is not None and use_bodyparts is not None:
        coordinates = reindex_by_bodyparts(coordinates, bodyparts, use_bodyparts)
        confidences = reindex_by_bodyparts(confidences, bodyparts, use_bodyparts)

    # Shallow-copy before writing imputed values so that the dictionaries
    # owned by the caller are never modified, regardless of whether the
    # reindexing step above happened to create new ones.
    coordinates = dict(coordinates)
    confidences = dict(confidences)

    for key in keys:
        # A keypoint is treated as missing if any of its coordinates is NaN.
        outliers = np.isnan(coordinates[key]).any(-1)
        coordinates[key] = interpolate_keypoints(coordinates[key], outliers)
        # Imputed keypoints get zero confidence (raised to `conf_pseudocount` below).
        confidences[key] = np.where(outliers, 0, np.nan_to_num(confidences[key]))

    if not seg_length:
        seg_length = _find_optimal_segment_length(
            [coordinates[key].shape[0] for key in keys],
            max_seg_length=max_seg_length,
            max_percent_padding=max_percent_padding,
            min_fragment_length=min_fragment_length,
        )

    Y, mask, metadata = batch(coordinates, seg_length=seg_length, keys=keys)
    frames_per_segment = mask.sum(axis=1)
    assert np.all(frames_per_segment >= min_fragment_length), fill(
        f"All segments must contain at least {min_fragment_length} frames of data, "
        f"but found segments with as few as {int(frames_per_segment.min())} frames."
    )
    Y = Y.astype(float)

    conf = batch(confidences, seg_length=seg_length, keys=keys)[0]
    if np.min(conf) < 0:
        conf = np.maximum(conf, 0)
        warnings.warn(fill("Negative confidence values are not allowed and will be set to 0."))
    conf = conf + conf_pseudocount

    if added_noise_level > 0:
        # Fixed seed keeps the formatted data reproducible across calls.
        rng = np.random.default_rng(42)
        Y += rng.uniform(-added_noise_level, added_noise_level, Y.shape)

    data = jax.device_put({"mask": mask, "Y": Y, "conf": conf})
    return data, metadata




[docs]
def get_typical_trajectories(
    coordinates,
    results,
    pre=5,
    post=15,
    min_frequency=0.005,
    min_duration=3,
    bodyparts=None,
    use_bodyparts=None,
    density_sample=True,
    sampling_options={"n_neighbors": 50},
):
    """Generate representative keypoint trajectories for each syllable.

    Parameters
    ----------
    coordinates: dict
        Dictionary mapping recording names to keypoint coordinates as ndarrays
        of shape (n_frames, n_bodyparts, 2).

    results: dict
        Dictionary containing modeling results for a dataset (see
        :py:func:`keypoint_moseq.fitting.extract_results`).

    pre: int, default=5, post: int, default=15
        Defines the temporal window around syllable onset for computing the
        average trajectory. Note that the window is independent of the actual
        duration of the syllable.

    min_frequency: float, default=0.005
        Minimum frequency of a syllable to plotted.

    min_duration: float, default=3
        Minimum duration of a syllable instance to be included in the
        trajectory average.

    bodyparts: list of str, default=None
        List of bodypart names in `coordinates`.

    use_bodyparts: list of str, default=None
        Ordered list of bodyparts to include in each trajectory. If None, all
        bodyparts will be included.

    density_sample : bool, default=True
        Whether to use density sampling when generating trajectories. If True,
        the trajectory is based on the most exemplary syllable instances,
        rather than being average across all instances.

    sampling_options: dict, default={'n_neighbors':50}
        Dictionary of options for sampling syllable instances (see
        :py:func:`keypoint_moseq.util.sample_instances`). Only used when
        `density_sample` is True. Must contain the key "n_neighbors". Any
        "mode" entry is overridden with "density". The dictionary itself is
        never modified.

    Returns
    -------
    representative_trajectories: dict
        Dictionary mapping syllable indexes to representative trajectories
        as arrays of shape (pre+post, n_bodyparts, [2 or 3]).

    Raises
    ------
    ValueError
        If no syllable has enough instances to generate a trajectory.
    """
    if bodyparts is not None and use_bodyparts is not None:
        coordinates = reindex_by_bodyparts(coordinates, bodyparts, use_bodyparts)

    syllables = {k: v["syllable"] for k, v in results.items()}
    centroids = {k: v["centroid"] for k, v in results.items()}
    headings = {k: v["heading"] for k, v in results.items()}

    min_instances = sampling_options["n_neighbors"] if density_sample else 1
    syllable_instances = get_syllable_instances(
        syllables,
        pre=pre,
        post=post,
        min_duration=min_duration,
        min_frequency=min_frequency,
        min_instances=min_instances,
    )

    if len(syllable_instances) == 0:
        raise ValueError(
            fill(
                "No syllables with sufficient instances to generate a trajectory. "
                "This usually occurs when there is not enough inut data or when "
                "all frames have the same syllable label (use "
                "`plot_syllable_frequencies` to check if this is the case)"
            )
        )

    if density_sample:
        # Build a new dict rather than assigning into `sampling_options`:
        # writing to the argument would alter the caller's dictionary and,
        # when the default is used, the default shared by all future calls.
        density_options = {**sampling_options, "mode": "density"}
        sampled_instances = sample_instances(
            syllable_instances,
            density_options["n_neighbors"],
            coordinates=coordinates,
            centroids=centroids,
            headings=headings,
            pre=pre,
            post=post,
            **density_options,
        )
    else:
        sampled_instances = syllable_instances

    trajectories = {
        syllable: get_instance_trajectories(
            instances,
            coordinates,
            pre=pre,
            post=post,
            centroids=centroids,
            headings=headings,
        )
        for syllable, instances in sampled_instances.items()
    }

    # The representative trajectory is the per-element median across instances.
    return {s: np.nanmedian(ts, axis=0) for s, ts in trajectories.items()}




[docs]
def syllable_similarity(
    coordinates,
    results,
    metric="cosine",
    pre=5,
    post=15,
    min_frequency=0.005,
    min_duration=3,
    bodyparts=None,
    use_bodyparts=None,
    density_sample=False,
    sampling_options={"n_neighbors": 50},
    **kwargs,
):
    """Compute pairwise distances between the typical trajectories of syllables.

    All parameters other than `metric` are forwarded unchanged to
    :py:func:`keypoint_moseq.util.get_typical_trajectories`; see that function
    for their meaning. Extra keyword arguments are accepted and ignored.

    Parameters
    ----------
    metric: str, default='cosine'
        Distance metric to use. See :py:func:`scipy.spatial.pdist` for options.

    Returns
    -------
    distances : ndarray of shape (n_syllables, n_syllables)
        Pairwise distances between the (flattened) typical trajectories of
        the syllables. Only syllables for which a typical trajectory could be
        generated are included.

    syllable_ixs : list of int
        Sorted syllable indexes corresponding to the rows and columns of
        `distances`.
    """
    trajectory_by_syllable = get_typical_trajectories(
        coordinates,
        results,
        pre=pre,
        post=post,
        min_frequency=min_frequency,
        min_duration=min_duration,
        bodyparts=bodyparts,
        use_bodyparts=use_bodyparts,
        density_sample=density_sample,
        sampling_options=sampling_options,
    )

    syllable_ixs = sorted(trajectory_by_syllable)

    # One row per syllable, with the whole trajectory flattened into a vector.
    stacked = np.stack([trajectory_by_syllable[ix] for ix in syllable_ixs])
    flattened = stacked.reshape(stacked.shape[0], -1)

    condensed = pdist(flattened, metric)
    return squareform(condensed), syllable_ixs




[docs]
def downsample_timepoints(data, downsample_rate):
    """
    Keep every `downsample_rate`-th timepoint of an array or of each array in a dict.

    Parameters
    ----------
    data: ndarray or dict
        Array of shape (n_frames, ...) or a dictionary with such arrays as
        values. Dictionaries are processed recursively, value by value.

    downsample_rate: int
        The downsampling rate (e.g., `downsample_rate=2` keeps every other frame).

    Returns
    -------
    downsampled_data: ndarray or dict
        Downsampled array, or a dictionary of downsampled arrays with the same
        keys as `data`.

    indexes: ndarray or dict
        Positions of the retained timepoints in the original numbering, with
        the same structure as `downsampled_data`.
    """
    if not isinstance(data, dict):
        kept = data[::downsample_rate]
        # The i-th retained frame came from original frame i * downsample_rate.
        return kept, np.arange(len(kept)) * downsample_rate

    per_key = {name: downsample_timepoints(arr, downsample_rate) for name, arr in data.items()}
    downsampled_data = {name: pair[0] for name, pair in per_key.items()}
    indexes = {name: pair[1] for name, pair in per_key.items()}
    return downsampled_data, indexes




[docs]
def check_video_paths(video_paths, keys):
    """
    Check if video paths are valid and match the keys.

    Every path in `video_paths` is checked (not only those whose key appears
    in `keys`). A video counts as readable if it can be opened and its last
    frame can be read.

    Parameters
    ----------
    video_paths: dict
        Dictionary mapping keys to video paths.

    keys: list
        List of keys that require a video path.

    Raises
    ------
    ValueError
        If any of the following are true:
        - a video path is not provided for a key in `keys`
        - a video isn't readable.
        - a video path does not exist.
        All problems found are reported together in a single message.
    """
    missing_keys = set(keys) - set(video_paths.keys())

    nonexistent_videos = []
    unreadable_videos = []
    for path in video_paths.values():
        if not os.path.exists(path):
            nonexistent_videos.append(path)
            continue
        # Catch `Exception` rather than using a bare `except`, so that
        # KeyboardInterrupt / SystemExit still propagate to the user.
        try:
            reader = OpenCVReader(path)
            try:
                # Reading the final frame detects truncated or badly encoded files.
                reader[reader.nframes - 1]
            finally:
                # Release the reader even when the frame read fails.
                reader.close()
        except Exception:
            unreadable_videos.append(path)

    error_messages = []

    if len(missing_keys) > 0:
        error_messages.append("The following keys require a video path: {}".format(missing_keys))
    if len(nonexistent_videos) > 0:
        error_messages.append("The following videos do not exist: {}".format(nonexistent_videos))
    if len(unreadable_videos) > 0:
        error_messages.append(
            "The following videos are not readable and must be reencoded: {}".format(
                unreadable_videos
            )
        )

    if len(error_messages) > 0:
        raise ValueError("\n\n".join(error_messages))




[docs]
def generate_syllable_mapping(results: dict, syllable_grouping: list[list[int]], runlength: bool = True) -> dict[int, int]:
    """
    Build a relabeling that merges groups of syllables and re-ranks by frequency.

    Each group in `syllable_grouping` is collapsed to a single new index, and
    every syllable that appears in no group forms a group of its own. Groups
    are then ordered by their summed frequency, so the most frequent group
    receives index 0, the next one index 1, and so on.

    Parameters
    ----------
    results: dict
        Dictionary containing modeling results for a dataset (see
        :py:func:`keypoint_moseq.fitting.extract_results`).

    syllable_grouping: list[list[int]]
        List of lists representing groups of syllables that should be mapped to a single index.

    runlength: bool, default=True
        If True, frequencies are quantified using the number of non-consecutive
        occurrences of each syllable. If False, frequency is quantified by
        total number of frames.

    Returns
    -------
    mapping: dict[int, int]
        A dictionary mapping each original syllable index to a new syllable index.

    Example
    -------
    >>> results = load_hdf5(results_path)
    >>> syllable_grouping = [[0, 1], [2, 5, 6]]
    >>> mapping = generate_syllable_mapping(results, syllable_grouping)
    >>> print(mapping)
    >>> # {0: 0, 1: 0, 2: 1, 3: 2, 4: 3, 5: 1, 6: 1}
    """
    label_sequences = {name: rec["syllable"] for name, rec in results.items()}
    frequencies = get_frequencies(label_sequences, runlength=runlength)

    # Syllables that belong to any user-specified group.
    grouped = {s for group in syllable_grouping for s in group}

    # (total frequency, members) for the user-specified groups first ...
    ranked = [(sum(frequencies[s] for s in group), group) for group in syllable_grouping]
    # ... followed by a singleton entry for every remaining syllable.
    ranked.extend(
        (frequencies[ix], [ix]) for ix in range(len(frequencies)) if ix not in grouped
    )

    # Highest frequency first; ties fall back to comparing the member lists.
    ranked = sorted(ranked, reverse=True)

    return {s: new_ix for new_ix, (_, members) in enumerate(ranked) for s in members}




[docs]
def apply_syllable_mapping(results: dict, mapping: dict[int, int]) -> dict:
    """
    Return a copy of `results` whose syllable labels are translated through `mapping`.

    Parameters
    ----------
    results: dict
        Dictionary containing modeling results for a dataset (see
        :py:func:`keypoint_moseq.fitting.extract_results`).

    mapping: dict[int, int]
        A dictionary mapping each original syllable index to a new syllable index.
        Every label that occurs in the "syllable" entries must be a key.

    Returns
    -------
    remapped_results: dict
        A dictionary with the same structure as `results`, but with relabeled
        syllables. All other entries are copies of the originals.
    """

    def _convert(field, values):
        # Only the "syllable" entry is relabeled; everything else is copied as-is.
        if field != "syllable":
            return np.copy(values)
        return np.array([mapping[label] for label in values])

    return {
        recording: {field: _convert(field, values) for field, values in fields.items()}
        for recording, fields in results.items()
    }




[docs]
def get_distance_to_medoid(coordinates: np.ndarray) -> np.ndarray:
    """Compute the Euclidean distance from each keypoint to the medoid (median position)
    of all keypoints at each frame.

    Missing keypoints (NaN coordinates) are ignored when computing the medoid, so
    a single missing keypoint does not invalidate the distances of the remaining
    keypoints in that frame. The distance of a missing keypoint itself is NaN, as
    are all distances in a frame where every keypoint is missing.

    Parameters
    ----------
    coordinates: ndarray of shape (n_frames, n_keypoints, keypoint_dim)
        Keypoint coordinates where keypoint_dim is 2 or 3.

    Returns
    -------
    distances: ndarray of shape (n_frames, n_keypoints)
        Euclidean distances from each keypoint to the medoid position at each frame.
    """
    with warnings.catch_warnings():
        # A frame with no valid keypoints has no medoid; NaN is the intended
        # result there, so numpy's "All-NaN slice" warning is just noise.
        warnings.simplefilter("ignore", category=RuntimeWarning)
        medoids = np.nanmedian(coordinates, axis=1, keepdims=True)  # (n_frames, 1, keypoint_dim)
    return np.linalg.norm(coordinates - medoids, axis=-1)  # (n_frames, n_keypoints)




[docs]
def find_medoid_distance_outliers(
    coordinates: np.ndarray, outlier_scale_factor: float = 6.0
) -> dict[str, np.ndarray]:
    """Identify keypoint distance outliers using Median Absolute Deviation (MAD).

    Keypoints are considered outliers when their distance to the medoid at a given timepoint
    exceeds the keypoint's median distance by more than `outlier_scale_factor` times the median
    absolute deviation (MAD) of that keypoint's distances. Only distances that are too large are
    flagged.

    Frames in which a keypoint's distance is undefined (NaN) are excluded from that keypoint's
    median and MAD, and are never flagged as outliers.

    Parameters
    ----------
    coordinates: ndarray of shape (n_frames, n_keypoints, keypoint_dim)
        Keypoint coordinates where keypoint_dim is 2 or 3. The full coordinate vector is
        passed to :py:func:`keypoint_moseq.util.get_distance_to_medoid`.

    outlier_scale_factor: float, default=6.0
        Multiplier used to set the outlier threshold. Higher values result in fewer outliers.

    Returns
    -------
    result: dict with the following items

        mask: ndarray of shape (n_frames, n_keypoints)
            Boolean array where True indicates outlier keypoints.

        thresholds: ndarray of shape (n_keypoints,)
            Distance thresholds used to classify outlier timepoints for each keypoint.
    """
    distances = get_distance_to_medoid(coordinates)  # (n_frames, n_keypoints)

    with warnings.catch_warnings():
        # A keypoint with no valid distance at all yields a NaN threshold; that
        # is the intended outcome, so silence numpy's "All-NaN slice" warning.
        warnings.simplefilter("ignore", category=RuntimeWarning)
        # NaN-aware statistics: with a plain median, one NaN distance would turn
        # the whole threshold into NaN and disable detection for that keypoint.
        medians = np.nanmedian(distances, axis=0)  # (n_keypoints,)
        MADs = np.nanmedian(np.abs(distances - medians[None, :]), axis=0)  # (n_keypoints,)

    outlier_thresholds = MADs * outlier_scale_factor + medians  # (n_keypoints,)

    with np.errstate(invalid="ignore"):
        # Comparisons involving NaN evaluate to False, i.e. "not an outlier".
        outlier_mask = distances > outlier_thresholds[None, :]  # (n_frames, n_keypoints)
    return {"mask": outlier_mask, "thresholds": outlier_thresholds}




[docs]
def plot_keypoint_traces(
    traces: list[np.ndarray],
    plot_title: Optional[str] = None,
    bodyparts: Optional[list[str]] = None,
    line_labels: Optional[list[str]] = None,
    thresholds: Optional[np.ndarray] = None,
    shading_mask: Optional[np.ndarray] = None,
) -> plt.Figure:
    """Plot per-keypoint traces over time, one stacked panel per keypoint.

    Every panel shows one line per array in `traces`. Optionally, a horizontal
    dashed threshold line is drawn and individual frames are shaded in grey
    (used to visualize outliers).

    Parameters
    ----------
    traces: list of ndarrays
        List of arrays, each with shape (n_frames, n_keypoints). Each array
        contributes one line to every panel.

    plot_title: str, optional
        Title to display at the top of the figure.

    bodyparts: list of str, optional
        Names of bodyparts corresponding to each keypoint. Used for subplot titles.
        Must have length equal to n_keypoints. Panels are titled
        "Keypoint <index>" when omitted.

    line_labels: list of str, optional
        Legend labels, one per array in `traces`. Lines are labeled
        "Line <index>" when omitted or empty.

    thresholds: ndarray of shape (n_keypoints,), optional
        Threshold values to plot as horizontal dashed lines for each keypoint.

    shading_mask: ndarray of shape (n_frames, n_keypoints), optional
        Boolean mask indicating frames to shade (e.g., outlier frames).
        Must have the same shape as the first array in `traces`.

    Returns
    -------
    fig: matplotlib.figure.Figure
        The created figure with subplots for each keypoint.

    Raises
    ------
    ValueError
        If `traces` is empty, the arrays disagree on the number of keypoints,
        or `bodyparts` / `shading_mask` do not match the traces.
    """
    # ---- input validation -------------------------------------------------
    if not traces:
        raise ValueError("traces cannot be empty")

    reference_shape = traces[0].shape
    n_keypoints = reference_shape[1]

    for i, candidate in enumerate(traces):
        found = candidate.shape[1]
        if found != n_keypoints:
            raise ValueError(
                f"All trace arrays must have same number of keypoints. "
                f"Array {i} has {found} keypoints, expected {n_keypoints}"
            )

    if bodyparts is not None and len(bodyparts) != n_keypoints:
        raise ValueError(
            f"Length of bodyparts list ({len(bodyparts)}) does not match "
            f"number of keypoints in traces ({n_keypoints})"
        )

    if shading_mask is not None and shading_mask.shape != reference_shape:
        raise ValueError(
            f"Shading mask shape {shading_mask.shape} must match traces shape {traces[0].shape}"
        )

    # ---- drawing ----------------------------------------------------------
    # squeeze=False always yields a 2D grid of axes, including for one keypoint.
    fig, axes_grid = plt.subplots(
        n_keypoints,
        1,
        figsize=(16, 3 * n_keypoints),
        constrained_layout=True,
        squeeze=False,
    )

    for keypoint_idx, ax in enumerate(axes_grid[:, 0]):
        if shading_mask is not None:
            # Each flagged frame gets a one-frame-wide grey band centred on it.
            for frame in np.flatnonzero(shading_mask[:, keypoint_idx]):
                ax.axvspan(frame - 0.5, frame + 0.5, alpha=0.1, color="grey")

        for line_idx, values in enumerate(traces):
            if line_labels:
                label = line_labels[line_idx]
            else:
                label = f"Line {line_idx}"
            ax.plot(values[:, keypoint_idx], label=label)

        if thresholds is not None:
            level = thresholds[keypoint_idx]
            ax.axhline(
                y=level,
                color="black",
                linestyle="--",
                alpha=0.7,
                label=f"Threshold ({level:.2f})",
            )

        ax.set_xlabel("Frame")
        ax.set_ylabel("Trace Value")

        if bodyparts is None:
            ax.set_title(f"Keypoint {keypoint_idx}")
        else:
            ax.set_title(f"{bodyparts[keypoint_idx]}")

        ax.legend(loc="upper right")
        ax.grid(True, alpha=0.3)

    if plot_title is not None:
        fig.suptitle(plot_title, fontsize=16)
    return fig




[docs]
def plot_medoid_distance_outliers(
    project_dir: str,
    recording_name: str,
    original_coordinates: np.ndarray,
    interpolated_coordinates: np.ndarray,
    outlier_mask,
    outlier_thresholds,
    bodyparts: list[str],
    overwrite=False,
    **kwargs,
):
    """Save a QA plot of distance-to-medoid before and after outlier interpolation.

    For each keypoint, the plot shows the distance to the medoid computed from
    the original and from the interpolated coordinates, together with the
    outlier threshold (dashed line) and grey shading on outlier frames.

    The output directory is always created. If the plot file already exists
    and `overwrite` is False, nothing else is done.

    Parameters
    ----------
    project_dir: str
        Path to the project directory where the plot will be saved.

    recording_name: str
        Name of the recording, used for the plot title and filename.

    original_coordinates: ndarray of shape (n_frames, n_keypoints, keypoint_dim)
        Original keypoint coordinates before interpolation.

    interpolated_coordinates: ndarray of shape (n_frames, n_keypoints, keypoint_dim)
        Keypoint coordinates after interpolation.

    outlier_mask: ndarray of shape (n_frames, n_keypoints)
        Boolean mask indicating outlier keypoints (True = outlier).

    outlier_thresholds: ndarray of shape (n_keypoints,)
        Distance thresholds for each keypoint above which points are considered outliers.

    bodyparts: list of str
        Names of bodyparts corresponding to each keypoint. Must have length equal to
        n_keypoints.

    overwrite: bool, default False
        Whether or not to overwrite outlier interpolation QA plots

    **kwargs
        Additional keyword arguments (ignored), usually overflow from **config().

    Returns
    -------
    None
        The plot is saved to 'QA/plots/keypoint_distance_outliers/{recording_name}.png'
        inside `project_dir`.
    """
    path_parts = ("QA", "plots", "keypoint_distance_outliers", f"{recording_name}.png")
    plot_path = os.path.join(project_dir, *path_parts)

    # Created before the early exit below, so the directory exists either way.
    os.makedirs(os.path.dirname(plot_path), exist_ok=True)

    already_plotted = os.path.exists(plot_path)
    if already_plotted and not overwrite:
        return

    # One (n_frames, n_keypoints) distance array per version of the coordinates.
    distance_traces = [
        get_distance_to_medoid(original_coordinates),
        get_distance_to_medoid(interpolated_coordinates),
    ]

    fig = plot_keypoint_traces(
        traces=distance_traces,
        plot_title=recording_name,
        bodyparts=bodyparts,
        line_labels=["Original", "Interpolated"],
        thresholds=outlier_thresholds,
        shading_mask=outlier_mask,
    )

    fig.savefig(plot_path, dpi=300)
    plt.close()




[docs]
def outlier_removal(coordinates, confidences, project_dir, overwrite=False, outlier_scale_factor=6.0, bodyparts=None, **kwargs):
    """Detect and interpolate outlier keypoints in every recording of a dataset.

    For each recording, outliers are identified from their distance to the
    medoid, the flagged keypoints are replaced by interpolated values, their
    confidences are set to 0, and a diagnostic plot is written.

    Both `coordinates` and `confidences` are updated in place; the same
    dictionaries are also returned.

    Parameters
    ----------
    coordinates: dict
        Dictionary mapping recording names to keypoint coordinates
    confidences: dict
        Dictionary mapping recording names to keypoint confidences. Must
        contain an entry for every recording in `coordinates`.
    project_dir: str
        Path to project directory for saving plots
    overwrite: bool, default False
        Whether or not to overwrite outlier interpolation QA plots
    outlier_scale_factor: float, default=6.0
        Multiplier used to set the outlier threshold
    bodyparts: list of str, default=None
        Names of bodyparts for plot labels
    **kwargs
        Additional configuration parameters, forwarded to
        :py:func:`keypoint_moseq.util.plot_medoid_distance_outliers`

    Returns
    -------
    coordinates: dict
        Updated coordinates with outliers interpolated
    confidences: dict
        Updated confidences with outlier values set to 0
    """
    for recording_name in coordinates:
        # Keep an untouched copy for the "before" trace in the QA plot.
        original = coordinates[recording_name].copy()

        detection = find_medoid_distance_outliers(original, outlier_scale_factor=outlier_scale_factor)
        is_outlier = detection["mask"]
        thresholds = detection["thresholds"]

        cleaned = interpolate_keypoints(original, is_outlier)
        coordinates[recording_name] = cleaned

        # Interpolated keypoints carry no evidence, so their confidence is zeroed.
        confidences[recording_name] = np.where(is_outlier, 0, confidences[recording_name])

        plot_medoid_distance_outliers(
            project_dir,
            recording_name,
            original,
            cleaned,
            is_outlier,
            thresholds,
            bodyparts=bodyparts,
            overwrite=overwrite,
            **kwargs
        )

    return coordinates, confidences



[docs]
def estimate_sigmasq_loc(Y: jnp.ndarray, mask: jnp.ndarray, filter_size: int = 30) -> float:
    """
    Automatically estimate `sigmasq_loc` (prior controlling the centroid movement across frames).

    The centroid of each frame is taken as the median over keypoints, frames
    where `mask` is false are replaced by NaN, the centroid trajectory is
    median-filtered along the time axis, and the frame-to-frame displacement
    of the filtered trajectory is measured.

    Parameters
    ----------
    Y : jax.ndarray
        Keypoint coordinates; shape=(batch, frames, keypoints, dimensions).
    mask : jax.ndarray
        Mask indicating valid frames; shape=(batch, frames).
    filter_size: int
        Kernel size for median filtering to smooth the centroid trajectory.

    Returns
    -------
    float
        Square of the mean distance between consecutive smoothed centroids,
        where NaN distances are excluded from the mean.
    """
    # Per-frame centroid = median across the keypoint axis; masked frames -> NaN.
    centroids = np.median(Y, axis=2)  # (batch, frames, dimensions)
    valid = mask[:, :, None]
    masked_centroids = np.where(valid, centroids, np.nan)

    # Smooth along the time axis only (window of 1 on batch and dimension axes).
    smoothed = median_filter(masked_centroids, size=(1, filter_size, 1))

    steps = np.diff(smoothed, axis=1)  # (batch, frames - 1, dimensions)
    step_lengths = np.linalg.norm(steps, axis=-1)  # (batch, frames - 1)

    mean_step = np.nanmean(step_lengths)
    return float(mean_step**2)