Documentation for `Exclusion.py`¶

Exclusion ¶

This file implements various exclusion and filtering criteria in a modular way that can be reused elsewhere, e.g. in controllers.

BoxHolder ¶

BoxHolder()

A class to allow quick lookup of boxes (e.g. exclusion items, targets, etc). Creates an interval tree on mz as this is likely to narrow things down quicker. Also has a method for returning an rt interval tree for a particular mz and an mz interval tree for a particular RT.

Initialise a BoxHolder object

Source code in vimms/Exclusion.py

def __init__(self):
    """
    Initialise a BoxHolder object
    """
    self.boxes_mz = IntervalTree()
    self.boxes_rt = IntervalTree()

add_box ¶

add_box(box)

Add a box to the IntervalTree

Parameters:

Name	Type	Description	Default
`box`		the box to add	required

Returns: None

Source code in vimms/Exclusion.py

def add_box(self, box):
    """
    Add a box to the IntervalTree

    Args:
        box: the box to add

    Returns: None

    """
    mz_from = box.from_mz
    mz_to = box.to_mz
    rt_from = box.from_rt
    rt_to = box.to_rt
    self.boxes_mz.addi(mz_from, mz_to, box)
    self.boxes_rt.addi(rt_from, rt_to, box)

check_point ¶

check_point(mz, rt)

Find the boxes that match this mz and rt value

Parameters:

Name	Type	Description	Default
`mz`		the m/z to check	required
`rt`		the RT to check	required

Returns: the list of hits (boxes that contain this point)

Source code in vimms/Exclusion.py

def check_point(self, mz, rt):
    """
    Find the boxes that match this mz and rt value

    Args:
        mz: the m/z to check
        rt: the RT to check

    Returns: the list of hits (boxes that contain this point)

    """
    regions = self.boxes_mz.at(mz)
    hits = set()
    for r in regions:
        if r.data.rt_match(rt):
            hits.add(r.data)
    return hits

get_subset_mz ¶

get_subset_mz(mz)

Create an interval tree based upon mz for all boxes active at m/z

Parameters:

Name	Type	Description	Default
`mz`		the m/z value to check	required

Returns: a new BoxHolder object containing the subset of boxes at m/z

Source code in vimms/Exclusion.py

def get_subset_mz(self, mz):
    """
    Create an interval tree based upon mz for all boxes active at m/z

    Args:
        mz: the m/z value to check

    Returns: a new BoxHolder object containing the subset of boxes at m/z

    """
    regions = self.boxes_mz.at(mz)
    it = BoxHolder()
    for r in regions:
        box = r.data
        it.add_box(box)
    return it

get_subset_rt ¶

get_subset_rt(rt)

Create an interval tree based upon mz for all boxes active at rt

Parameters:

Name	Type	Description	Default
`rt`		the RT to check	required

Returns: a new BoxHolder object containing the subset of boxes at RT

Source code in vimms/Exclusion.py

def get_subset_rt(self, rt):
    """
    Create an interval tree based upon mz for all boxes active at rt

    Args:
        rt: the RT to check

    Returns: a new BoxHolder object containing the subset of boxes at RT

    """
    regions = self.boxes_rt.at(rt)
    it = BoxHolder()
    for r in regions:
        box = r.data
        it.add_box(box)
    return it

is_in_box ¶

is_in_box(mz, rt)

Check if this mz and rt is in any box

Parameters:

Name	Type	Description	Default
`mz`		the m/z to check	required
`rt`		the RT to check	required

Returns: True if it's a match, False otherwise.

Source code in vimms/Exclusion.py

def is_in_box(self, mz, rt):
    """
    Check if this mz and rt is in *any* box

    Args:
        mz: the m/z to check
        rt: the RT to check

    Returns: True if it's a match, False otherwise.

    """
    hits = self.check_point(mz, rt)
    if len(hits) > 0:
        return True
    else:
        return False

is_in_box_mz ¶

is_in_box_mz(mz)

Check if an mz value is in any box

Parameters:

Name	Type	Description	Default
`mz`		the m/z to check	required

Returns: True if it's a match, False otherwise.

Source code in vimms/Exclusion.py

def is_in_box_mz(self, mz):
    """
    Check if an mz value is in any box

    Args:
        mz: the m/z to check

    Returns: True if it's a match, False otherwise.

    """
    regions = self.boxes_mz.at(mz)
    if len(regions) > 0:
        return True
    else:
        return False

is_in_box_rt ¶

is_in_box_rt(rt)

Check if an RT value is in any box

Parameters:

Name	Type	Description	Default
`rt`		the m/z to check	required

Returns: True if it's a match, False otherwise.

Source code in vimms/Exclusion.py

def is_in_box_rt(self, rt):
    """
    Check if an RT value is in any box

    Args:
        rt: the m/z to check

    Returns: True if it's a match, False otherwise.

    """
    regions = self.boxes_rt.at(rt)
    if len(regions) > 0:
        return True
    else:
        return False

DEWFilter ¶

DEWFilter(rt_tol)

Bases: ScoreFilter

A class that implements dynamic exclusion filter

Initialises a dynamic exclusion filter based on time only Args: rt_tol: the RT tolerance (in seconds)

Source code in vimms/Exclusion.py

def __init__(self, rt_tol):
    """
    Initialises a dynamic exclusion filter based on time only
    Args:
        rt_tol: the RT tolerance (in seconds)
    """
    self.rt_tol = rt_tol

filter ¶

filter(current_rt, rois)

Check whether intensity values are above or below the threshold Args: current_rt: the current RT value rois: a list of vimms.Roi.Roi objects.

Returns: an array of indicators for the filter

Source code in vimms/Exclusion.py

def filter(self, current_rt, rois):
    """
    Check whether intensity values are above or below the threshold
    Args:
        current_rt: the current RT value
        rois: a list of [vimms.Roi.Roi][] objects.

    Returns: an array of indicators for the filter
    """

    last_frag_rts = [roi.last_frag_rt for roi in rois]

    # Handles None values by converting to NaN for which all
    # comparisons return 0
    return np.logical_not(current_rt - np.array(last_frag_rts, dtype=np.double) <= self.rt_tol)

ExclusionItem ¶

ExclusionItem(from_mz, to_mz, from_rt, to_rt, frag_at)

A class to store the item to exclude when computing dynamic exclusion window

Creates a dynamic exclusion item

Parameters:

Name	Description	Default
`from_mz`	m/z lower bounding box	required
`to_mz`	m/z upper bounding box	required
`from_rt`	RT lower bounding box	required
`to_rt`	RT upper bounding box	required
`frag_at`	RT when this ExclusionItem is fragmented	required

Source code in vimms/Exclusion.py

def __init__(self, from_mz, to_mz, from_rt, to_rt, frag_at):
    """
    Creates a dynamic exclusion item

    Args:
        from_mz: m/z lower bounding box
        to_mz: m/z upper bounding box
        from_rt: RT lower bounding box
        to_rt: RT upper bounding box
        frag_at: RT when this ExclusionItem is fragmented
    """
    self.from_mz = from_mz
    self.to_mz = to_mz
    self.from_rt = from_rt
    self.to_rt = to_rt
    self.frag_at = frag_at
    self.mz = (self.from_mz + self.to_mz) / 2.0
    self.rt = self.frag_at
    self.counter = 0  # add a counter field

mz_match ¶

mz_match(mz)

Checks that a certain m/z point lies in this box Args: mz: the m/z value to check

Returns: True if it's a match, False otherwise.

Source code in vimms/Exclusion.py

def mz_match(self, mz):
    """
    Checks that a certain m/z point lies in this box
    Args:
        mz: the m/z value to check

    Returns: True if it's a match, False otherwise.

    """
    if mz >= self.from_mz and mz <= self.to_mz:
        return True
    else:
        return False

peak_in ¶

peak_in(mz, rt)

Checks that a peak described by its (mz, rt) values lies in this box. Args: mz: the m/z value to check rt: the RT value to check

Returns: True if it's a match, False otherwise.

Source code in vimms/Exclusion.py

def peak_in(self, mz, rt):
    """
    Checks that a peak described by its (mz, rt) values lies in this box.
    Args:
        mz: the m/z value to check
        rt: the RT value to check

    Returns: True if it's a match, False otherwise.

    """
    if self.rt_match(rt) and self.mz_match(mz):
        return True
    else:
        return False

rt_match ¶

rt_match(rt)

Checks that a certain RT point lies in this box Args: rt: the RT value to check

Returns: True if it's a match, False otherwise.

Source code in vimms/Exclusion.py

def rt_match(self, rt):
    """
    Checks that a certain RT point lies in this box
    Args:
        rt: the RT value to check

    Returns: True if it's a match, False otherwise.

    """
    if rt >= self.from_rt and rt <= self.to_rt:
        return True
    else:
        return False

LengthFilter ¶

LengthFilter(min_roi_length_for_fragmentation)

Bases: ScoreFilter

A class that implements a check on minimum length of ROI for fragmentation

Initialise a length filter

Parameters:

Name	Type	Description	Default
`min_roi_length_for_fragmentation`		the minimum length of ROI for fragmentation	required

Source code in vimms/Exclusion.py

def __init__(self, min_roi_length_for_fragmentation):
    """
    Initialise a length filter

    Args:
        min_roi_length_for_fragmentation: the minimum length of ROI for fragmentation
    """
    self.min_roi_length_for_fragmentation = min_roi_length_for_fragmentation

filter ¶

filter(roi_lengths)

Check that ROI lengths are above the threshold Args: roi_lengths: a numpy array of ROI lengths

Returns: an array of indicator whether the lengths are above threshold

Source code in vimms/Exclusion.py

def filter(self, roi_lengths):
    """
    Check that ROI lengths are above the threshold
    Args:
        roi_lengths: a numpy array of ROI lengths

    Returns: an array of indicator whether the lengths are above threshold

    """
    return roi_lengths >= self.min_roi_length_for_fragmentation

MinIntensityFilter ¶

MinIntensityFilter(min_ms1_intensity)

Bases: ScoreFilter

A class that implements minimum intensity filter

Initialises the minimum intensity filter Args: min_ms1_intensity: the minimum intensity to check

Source code in vimms/Exclusion.py

def __init__(self, min_ms1_intensity):
    """
    Initialises the minimum intensity filter
    Args:
        min_ms1_intensity: the minimum intensity to check
    """
    self.min_ms1_intensity = min_ms1_intensity

filter ¶

filter(intensities)

Check whether intensity values are above or below the threshold Args: intensities: an array of intensity values

Returns: an array of indicators for the filter

Source code in vimms/Exclusion.py

def filter(self, intensities):
    """
    Check whether intensity values are above or below the threshold
    Args:
        intensities: an array of intensity values

    Returns: an array of indicators for the filter

    """
    return np.array(intensities) > self.min_ms1_intensity

ScoreFilter ¶

Bases: ABC

Base class for various filters

SmartROIFilter ¶

Bases: ScoreFilter

A class that implements SmartROI filtering criteria. For more details, refer to our paper 'Rapid Development ...'

filter ¶

filter(rois)

Filter ROIs based on SmartROI rules.

Parameters:

Name	Type	Description	Default
`rois`		a list of [vimms.Roi.Roi] objects. if this is a normal ROI object, always return True for everything otherwise track the status based on the SmartROI rules	required

Returns: an array of indicator whether ROI can be fragmented or not.

Source code in vimms/Exclusion.py

def filter(self, rois):
    """
    Filter ROIs based on SmartROI rules.


    Args:
        rois: a list of [vimms.Roi.Roi] objects. if this is a normal ROI object,
              always return True for everything otherwise track the status based
              on the SmartROI rules

    Returns: an array of indicator whether ROI can be fragmented or not.

    """
    can_fragments = np.array([roi.can_fragment for roi in rois])
    return can_fragments

TopNExclusion ¶

TopNExclusion(
    mz_tol,
    rt_tol,
    exclude_after_n_times=1,
    exclude_t0=0,
    initial_exclusion_list=None,
)

A class that perform standard dynamic exclusion for Top-N. This is based on checked whether an m/z and RT value lies in certain exclusion boxes.

Initialise a Top-N dynamic exclusion object

Parameters:

Name	Type	Description	Default
`mz_tol`			required
`rt_tol`			required
`exclude_after_n_times`			`1`
`exclude_t0`			`0`
`initial_exclusion_list`			`None`

Source code in vimms/Exclusion.py

def __init__(
    self, mz_tol, rt_tol, exclude_after_n_times=1, exclude_t0=0, initial_exclusion_list=None
):
    """
    Initialise a Top-N dynamic exclusion object

    Args:
        mz_tol:
        rt_tol:
        exclude_after_n_times:
        exclude_t0:
        initial_exclusion_list:
    """
    self.mz_tol = mz_tol
    self.rt_tol = rt_tol
    self.exclude_after_n_times = exclude_after_n_times
    self.exclude_t0 = exclude_t0

    self.exclude_check = BoxHolder()
    self.dynamic_exclusion = BoxHolder()

    # Initialise 'dynamic_exclusion' with its initial value, if provided
    if initial_exclusion_list is not None:
        for initial in initial_exclusion_list:
            self.dynamic_exclusion.add_box(initial)

is_excluded ¶

is_excluded(mz, rt)

Checks if a pair of (mz, rt) value is currently excluded by dynamic exclusion window

Parameters:

Name	Description	Default
`mz`	m/z value	required
`rt`	RT value	required
`mz_tol`	m/z tolerance	required
`rt_tol`	rt_tolerance	required

Returns: True if excluded (with weight 0.0), False otherwise (weight 1.0).

Source code in vimms/Exclusion.py

def is_excluded(self, mz, rt):
    """
    Checks if a pair of (mz, rt) value is currently excluded by
    dynamic exclusion window

    Args:
        mz: m/z value
        rt: RT value
        mz_tol: m/z tolerance
        rt_tol: rt_tolerance

    Returns: True if excluded (with weight 0.0), False otherwise (weight 1.0).

    """
    # check the main dynamic exclusion list to see if this ion should be excluded
    dew_check = self.dynamic_exclusion.is_in_box(mz, rt)
    if dew_check:
        return True, 0.0

    # if not excluded, then check the initial list to see if we need to increment count
    found = False
    hits = self.exclude_check.check_point(mz, rt)
    if len(hits) > 0:  # if there are initial hits, increment them

        # here we increment all hits that contain this (mz, rt) point
        # and check if any of them has been excluded more times than the threshold
        for box in hits:
            box.increment_counter()
            if box.counter >= self.exclude_after_n_times:
                found = True

    # if some boxes have hit threshold that were reached, exclude this ion
    if found:
        x = self._get_exclusion_item(mz, rt, self.mz_tol, self.rt_tol)
        self.dynamic_exclusion.add_box(x)
        return True, 0.0

    # finally this ion is not excluded if it is not in either the main or initial lists
    return False, 1.0

update ¶

update(current_scan, ms2_tasks)

For every scheduled MS2 scan, add its precursor m/z for initial exclusion check A tolerance of initial_t0 is used

Parameters:

Name	Type	Description	Default
`current_scan`		the current MS1 scan	required
`ms2_tasks`		scheduled ms2 tasks	required

Returns: None

Source code in vimms/Exclusion.py

def update(self, current_scan, ms2_tasks):
    """
    For every scheduled MS2 scan, add its precursor m/z for initial exclusion check
    A tolerance of initial_t0 is used

    Args:
        current_scan: the current MS1 scan
        ms2_tasks: scheduled ms2 tasks

    Returns: None

    """
    rt = current_scan.rt
    for task in ms2_tasks:
        for precursor in task.get("precursor_mz"):
            mz = precursor.precursor_mz

            # new way of checking DEW -- with an initial boxholder to check first
            if self.exclude_t0 > 0:
                x = self._get_exclusion_item(mz, rt, self.mz_tol, self.exclude_t0)
                self.exclude_check.add_box(x)

            else:  # fallback to the old way by adding directly to the DEW boxholder
                x = self._get_exclusion_item(mz, rt, self.mz_tol, self.rt_tol)
                self.dynamic_exclusion.add_box(x)

WeightedDEWExclusion ¶

WeightedDEWExclusion(mz_tol, rt_tol, exclusion_t_0)

Bases: TopNExclusion

A class that perform weighted dynamic exclusion for Top-N. This is further described in our paper 'Rapid Development ...'

Initialises a weighted dynamic exclusion object Args: rt_tol: the RT tolerance (in seconds) exclusion_t_0: WeightedDEW parameter

Source code in vimms/Exclusion.py

def __init__(self, mz_tol, rt_tol, exclusion_t_0):
    """
    Initialises a weighted dynamic exclusion object
    Args:
        rt_tol: the RT tolerance (in seconds)
        exclusion_t_0: WeightedDEW parameter
    """
    super().__init__(mz_tol, rt_tol)
    self.exclusion_t_0 = exclusion_t_0
    if self.exclusion_t_0 > self.rt_tol:
        raise ValueError("exclusion_t_0 must be lte rt_tol")

WeightedDEWFilter ¶

WeightedDEWFilter(exclusion)

Bases: ScoreFilter

A class that implements weighted dynamic exclusion filter

Initialises a weighted dynamic exclusion filter

Parameters:

Name	Type	Description	Default
`exclusion`		a vimms.Exclusion.ExclusionItem object	required

Source code in vimms/Exclusion.py

def __init__(self, exclusion):
    """
    Initialises a weighted dynamic exclusion filter

    Args:
        exclusion: a [vimms.Exclusion.ExclusionItem][] object
    """
    self.exclusion = exclusion

filter ¶

filter(current_rt, rois)

Check whether ROIs are excluded or not based on weighted dynamic exclusion filter Args: current_rt: the current RT value rois: a list of vimms.Roi.Roi objects.

Returns: a numpy array of weights for each ROI.

Source code in vimms/Exclusion.py

def filter(self, current_rt, rois):
    """
    Check whether ROIs are excluded or not based on weighted dynamic exclusion filter
    Args:
        current_rt: the current RT value
        rois: a list of [vimms.Roi.Roi][] objects.

    Returns: a numpy array of weights for each ROI.

    """
    weights = []
    for roi in rois:
        last_mz, last_rt, last_intensity = roi.get_last_datum()
        is_exc, weight = self.exclusion.is_excluded(last_mz, last_rt)
        weights.append(weight)
    return np.array(weights)

compute_weight ¶

compute_weight(current_rt, frag_at, rt_tol, exclusion_t_0)

Compute the weight for current RT at frag_at given the RT tolerance and other parameters. Args: current_rt: the current RT value frag_at: the retention time when fragmentation last occured rt_tol: RT tolerance (in seconds) exclusion_t_0: weighted DEW parameter

Returns: a new weight

Source code in vimms/Exclusion.py

def compute_weight(current_rt, frag_at, rt_tol, exclusion_t_0):
    """
    Compute the weight for current RT at frag_at given the RT tolerance and other parameters.
    Args:
        current_rt: the current RT value
        frag_at: the retention time when fragmentation last occured
        rt_tol: RT tolerance (in seconds)
        exclusion_t_0: weighted DEW parameter

    Returns: a new weight

    """
    if frag_at is None:
        # never been fragmented before, always include (weight 1.0)
        return False, 1.0
    elif current_rt >= frag_at + rt_tol:
        # outside the windows of rt_tol, always include (weight > 1.0)
        return False, 1.0
    elif current_rt <= frag_at + exclusion_t_0:
        # fragmented but within exclusion_t_0, always exclude (weight 0.0)
        return True, 0.0
    else:
        # compute weight according to the WeightedDEW scheme
        weight = (current_rt - (exclusion_t_0 + frag_at)) / (rt_tol - exclusion_t_0)
        if weight > 1:
            logger.warning(
                "exclusion weight %f is greater than 1 ("
                "current_rt %f exclusion_t_0 %f frag_at %f "
                "rt_tol %f)" % (weight, current_rt, exclusion_t_0, frag_at, rt_tol)
            )
        # assert weight <= 1, weight
        return True, weight

Documentation for Exclusion.py¶

Exclusion ¶

BoxHolder ¶

add_box ¶

check_point ¶

get_subset_mz ¶

get_subset_rt ¶

is_in_box ¶

is_in_box_mz ¶

is_in_box_rt ¶

DEWFilter ¶

filter ¶

ExclusionItem ¶

mz_match ¶

peak_in ¶

rt_match ¶

LengthFilter ¶

filter ¶

MinIntensityFilter ¶

filter ¶

ScoreFilter ¶

SmartROIFilter ¶

filter ¶

TopNExclusion ¶

is_excluded ¶

update ¶

WeightedDEWExclusion ¶

WeightedDEWFilter ¶

filter ¶

compute_weight ¶

Documentation for `Exclusion.py`¶