# development/doxygen/refiners_8py_source.html

import functools

import numpy as np

import collections

import copy


from tracking.validation.plot import ValidationPlot, compose_axis_label

from tracking.validation.fom import ValidationFiguresOfMerit

from tracking.validation.classification import ClassificationAnalysis

from tracking.validation.pull import PullAnalysis

from tracking.validation.tolerate_missing_key_formatter import TolerateMissingKeyFormatter

from tracking.root_utils import root_cd, root_save_name


import ROOT


import logging


def get_logger():
    """Return the logger that is registered under this module's name."""
    module_logger = logging.getLogger(__name__)
    return module_logger


# Module-wide formatter instance; the refiners in this file call formatter.format(...)
# to expand their name / title / description templates.
formatter = TolerateMissingKeyFormatter()


class Refiner:
    """Base class of the refiners that post-process a dictionary of peeled crops.

    An instance wraps a plain refiner function. It can be used as a
    descriptor on a harvesting module, called to register itself on a
    harvesting module (decoration), or called to carry out the refinement.
    """

    def __init__(self, refiner_function=None):
        """Remember the function that carries out the refinement.

        Parameters:
            refiner_function: callable invoked by refine() as
                ``refiner_function(harvesting_module, *args, **kwds)``.
        """
        self.refiner_function = refiner_function

    def __get__(self, harvesting_module, cls=None):
        """Descriptor access to the refiner.

        Accessed on the class (harvesting_module is None) the refiner itself
        is returned. Accessed on an instance, a function is returned that
        calls refine() with that instance as the harvesting module.
        """
        if harvesting_module is None:
            # Looked up on the class itself
            return self

        # Looked up on an instance - capture the refine method right away
        refine_method = self.refine

        def bound_refine(*args, **kwds):
            return refine_method(harvesting_module, *args, **kwds)

        return bound_refine

    def __call__(self, harvesting_module, crops=None, *args, **kwds):
        """Decorate a harvesting module or refine crops, depending on the arguments.

             r = Refiner()
             r(harvester) # decoration
             r(harvester, crops, args, keywords) # refinement

        Without crops the refiner appends itself to ``harvesting_module.refiners``
        and returns the harvesting module. With crops the call is forwarded
        to refine() and its result is returned.
        """
        if crops is not None:
            # Refinement: hand everything over to refine()
            return self.refine(harvesting_module, crops, *args, **kwds)

        # Decoration: register this refiner with the harvesting module
        harvesting_module.refiners.append(self)
        return harvesting_module

    def refine(self, harvesting_module, *args, **kwds):
        """Call the wrapped refiner function; its return value is discarded."""
        refiner_function = self.refiner_function
        refiner_function(harvesting_module, *args, **kwds)


class SaveFiguresOfMeritRefiner(Refiner):
    """Refiner that condenses every crop part into one figure of merit.

    Each part of the crops is reduced to a single value by an aggregation
    function and the values are collected in a ValidationFiguresOfMerit
    object, which is optionally written to a TDirectory and always printed.
    Constructor arguments that are left empty fall back to the ``default_*``
    class attributes below.
    """

    # Template for the name of the figures of merit object
    default_name = "{module.id}_figures_of_merit{groupby_key}"

    # Template for the title
    default_title = "Figures of merit in {module.title}"

    # Template for the contact
    default_contact = "{module.contact}"

    # Template for the description
    default_description = "Figures of merit are the {aggregation.__name__} of {keys}"

    # Template for the check instruction
    default_check = "Check for reasonable values"

    # Template for the key under which each aggregated part is stored
    default_key = "{aggregation.__name__}_{part_name}"

    @staticmethod
    def mean(xs):
        """Return numpy.nanmean of the given values."""
        return np.nanmean(xs)

    # Aggregation applied when none is given to the constructor
    default_aggregation = mean

    def __init__(self,
                 name=None,
                 title=None,
                 contact=None,
                 description=None,
                 check=None,
                 key=None,
                 aggregation=None,
                 ):
        """Store the configuration of this refiner.

        Parameters:
            name, title, contact, description, check, key: optional templates
                replacing the corresponding ``default_*`` class attribute.
            aggregation: optional callable reducing one crop part to a value.
        """
        super().__init__()

        # Templates, expanded in refine()
        self.name = name
        self.title = title
        self.contact = contact
        self.description = description
        self.check = check
        self.key = key

        # Callable that reduces each part to its figure of merit
        self.aggregation = aggregation

    def refine(self,
               harvesting_module,
               crops,
               tdirectory=None,
               groupby_part_name=None,
               groupby_value=None,
               **kwds):
        """Aggregate every crop part and publish the figures of merit.

        Parameters:
            harvesting_module: module available as ``{module}`` in the templates.
            crops: mapping of part names to values, iterated through
                iter_items_sorted_for_key.
            tdirectory: if truthy, the figures of merit are written there.
            groupby_part_name, groupby_value: group information available in
                the templates; concatenated into ``{groupby_key}``.
            **kwds: accepted but not used.
        """
        aggregation = self.aggregation or self.default_aggregation

        if groupby_part_name:
            groupby_key = '_' + groupby_part_name + groupby_value
        else:
            groupby_key = ""

        replacement_dict = {
            "refiner": self,
            "module": harvesting_module,
            "aggregation": aggregation,
            "groupby_key": groupby_key,
            "groupby": groupby_part_name,  # deprecated
            "groupby_value": groupby_value,  # deprecated
        }

        name = formatter.format(self.name or self.default_name, **replacement_dict)
        title = formatter.format(self.title or self.default_title, **replacement_dict)
        contact = formatter.format(self.contact or self.default_contact, **replacement_dict)

        figures_of_merit = ValidationFiguresOfMerit(name, contact=contact, title=title)

        # The key template is the same for every part, only part_name varies
        key_template = self.key or self.default_key
        for part_name, parts in iter_items_sorted_for_key(crops):
            key = formatter.format(key_template, part_name=part_name, **replacement_dict)
            figures_of_merit[key] = aggregation(parts)

        # Description and check may refer to the keys that were just filled
        keys = list(figures_of_merit.keys())
        description = formatter.format(self.description or self.default_description,
                                       keys=keys,
                                       **replacement_dict)
        check = formatter.format(self.check or self.default_check,
                                 keys=keys,
                                 **replacement_dict)

        figures_of_merit.description = description
        figures_of_merit.check = check

        if tdirectory:
            figures_of_merit.write(tdirectory)

        print(figures_of_merit)


class SaveHistogramsRefiner(Refiner):
    """Refiner that draws one histogram per crop part.

    Every part of the crops is filled into its own ValidationPlot, optionally
    stacked by another part and optionally fitted. Constructor arguments that
    are left empty fall back to the ``default_*`` class attributes below.
    """

    # Template for the name of each histogram
    default_name = "{module.id}_{part_name}_histogram{groupby_key}{stackby_key}"

    # Template for the title of each histogram
    default_title = "Histogram of {part_name}{groupby_key}{stackby_key} from {module.title}"

    # Template for the contact
    default_contact = "{module.contact}"

    # Template for the description
    default_description = "This is a histogram of {part_name}{groupby_key}{stackby_key}."

    # Template for the check instruction
    default_check = "Check if the distribution is reasonable"

    def __init__(self,
                 name=None,
                 title=None,
                 contact=None,
                 description=None,
                 check=None,
                 lower_bound=None,
                 upper_bound=None,
                 bins=None,
                 outlier_z_score=None,
                 allow_discrete=False,
                 stackby="",
                 fit=None,
                 fit_z_score=None):
        """Store the configuration of this refiner.

        Parameters:
            name, title, contact, description, check: optional templates
                replacing the corresponding ``default_*`` class attribute.
            lower_bound, upper_bound, bins, outlier_z_score, allow_discrete:
                forwarded unchanged to ``ValidationPlot.hist``.
            stackby: name of the crop part used to stack the histograms;
                empty for no stacking.
            fit: name of the fit to apply; falsy for no fit.
            fit_z_score: passed as ``z_score`` to the fit unless it is None.
        """
        super().__init__()

        # Templates, expanded in refine()
        self.name = name
        self.title = title
        self.contact = contact
        self.description = description
        self.check = check

        # Histogram layout, handed to ValidationPlot.hist
        self.lower_bound = lower_bound
        self.upper_bound = upper_bound
        self.bins = bins
        self.outlier_z_score = outlier_z_score
        self.allow_discrete = allow_discrete

        # Name of the part to stack by
        self.stackby = stackby

        # Fit configuration
        self.fit = fit
        self.fit_z_score = fit_z_score

    def refine(self,
               harvesting_module,
               crops,
               tdirectory=None,
               groupby_part_name=None,
               groupby_value=None,
               **kwds):
        """Create, decorate and optionally write a histogram for every crop part.

        Parameters:
            harvesting_module: module available as ``{module}`` in the templates.
            crops: mapping of part names to values; must contain the
                ``stackby`` part if one is configured.
            tdirectory: if truthy, each histogram is written there.
            groupby_part_name, groupby_value: group information concatenated
                into ``{groupby_key}`` for the templates.
            **kwds: accepted but not used.
        """
        stackby = self.stackby
        stackby_parts = crops[stackby] if stackby else None

        if groupby_part_name:
            groupby_key = ' in group ' + groupby_part_name + groupby_value
        else:
            groupby_key = ""

        replacement_dict = {
            "refiner": self,
            "module": harvesting_module,
            "stackby_key": ' stacked by ' + stackby if stackby else "",
            "groupby_key": groupby_key,
        }

        contact = formatter.format(self.contact or self.default_contact, **replacement_dict)

        # The templates do not depend on the part, so pick them once
        name_template = self.name or self.default_name
        title_template = self.title or self.default_title
        description_template = self.description or self.default_description
        check_template = self.check or self.default_check

        # Likewise the fit configuration is the same for all histograms
        fit_kwds = {} if self.fit_z_score is None else {"z_score": self.fit_z_score}

        for part_name, parts in iter_items_sorted_for_key(crops):
            name = formatter.format(name_template, part_name=part_name, **replacement_dict)
            title = formatter.format(title_template, part_name=part_name, **replacement_dict)
            description = formatter.format(description_template, part_name=part_name, **replacement_dict)
            check = formatter.format(check_template, part_name=part_name, **replacement_dict)

            histogram = ValidationPlot(name)
            histogram.hist(parts,
                           lower_bound=self.lower_bound,
                           upper_bound=self.upper_bound,
                           bins=self.bins,
                           outlier_z_score=self.outlier_z_score,
                           allow_discrete=self.allow_discrete,
                           stackby=stackby_parts)

            histogram.title = title
            histogram.contact = contact
            histogram.description = description
            histogram.check = check

            histogram.xlabel = compose_axis_label(part_name)

            if self.fit:
                # Prefer a dedicated fit_<name> method of the plot and fall
                # back to the generic fit method if there is none.
                try:
                    fit_method = getattr(histogram, 'fit_' + str(self.fit))
                except AttributeError:
                    histogram.fit(str(self.fit), **fit_kwds)
                else:
                    fit_method(**fit_kwds)

            if tdirectory:
                histogram.write(tdirectory)


class Plot2DRefiner(Refiner):
    """Refiner for profile histograms and 2D scatterplots.

    For every combination of a selected y part and a selected x part a
    ValidationPlot is created, either as a profile or as a scatter plot
    depending on ``plot_kind``. This class reads ``default_name``,
    ``default_title``, ``default_contact``, ``default_description`` and
    ``default_check`` but does not define them itself; subclasses have to
    provide them.
    """

    # Kind of plot to draw: "profile" or "scatter"
    plot_kind = "profile"

    def __init__(self,
                 y,
                 x=None,
                 name=None,
                 title=None,
                 contact=None,
                 description=None,
                 check=None,
                 stackby=None,
                 y_unit=None,
                 y_binary=None,
                 y_log=None,
                 lower_bound=None,
                 upper_bound=None,
                 bins=None,
                 outlier_z_score=None,
                 fit=None,
                 fit_z_score=None,
                 skip_single_valued=False,
                 allow_discrete=False):
        """Store the configuration of this refiner.

        Parameters:
            y: selection of the crop parts plotted on the y axis.
            x: selection of the crop parts plotted on the x axis; the y parts
                are excluded from this selection.
            name, title, contact, description, check: optional templates
                replacing the corresponding ``default_*`` class attribute.
            stackby: name of the crop part used for stacking; falsy for none.
            y_unit: unit passed to compose_axis_label for the y axis.
            y_binary, y_log, bins, allow_discrete: forwarded to
                ``ValidationPlot.profile`` only.
            lower_bound, upper_bound, outlier_z_score: forwarded to both
                ``ValidationPlot.profile`` and ``ValidationPlot.scatter``.
            fit: name of the fit applied to profiles; falsy for no fit.
            fit_z_score: passed as ``z_score`` to the fit unless it is None.
            skip_single_valued: skip combinations where x or y holds only one
                distinct value.
        """
        super().__init__()

        # Templates, expanded in refine()
        self.name = name
        self.title = title
        self.description = description
        self.check = check
        self.contact = contact

        # Selection of the parts for the two axes
        self.x = x
        self.y = y

        # Name of the part to stack by
        self.stackby = stackby

        # Unit shown on the y axis
        self.y_unit = y_unit

        # Plot layout, handed to the ValidationPlot
        self.lower_bound = lower_bound
        self.upper_bound = upper_bound
        self.bins = bins
        self.y_binary = y_binary
        self.y_log = y_log
        self.outlier_z_score = outlier_z_score
        self.allow_discrete = allow_discrete

        # Fit configuration
        self.fit = fit
        self.fit_z_score = fit_z_score

        # Switch to drop plots of constant quantities
        self.skip_single_valued = skip_single_valued

    def refine(self,
               harvesting_module,
               crops,
               tdirectory=None,
               groupby_part_name=None,
               groupby_value=None,
               **kwds):
        """Create, decorate and optionally write a plot for every y / x combination.

        Parameters:
            harvesting_module: module available as ``{module}`` in the templates.
            crops: mapping of part names to values; must contain the
                ``stackby`` part if one is configured.
            tdirectory: if truthy, each plot is written there.
            groupby_part_name, groupby_value: group information concatenated
                into ``{groupby_key}`` for the templates.
            **kwds: accepted but not used.
        """
        stackby = self.stackby
        stackby_parts = crops[stackby] if stackby else None

        replacement_dict = dict(
            refiner=self,
            module=harvesting_module,
            stackby_key=' stacked by ' + stackby if stackby else "",
            groupby_key=' in group ' + groupby_part_name + groupby_value if groupby_part_name else "",
        )

        contact = self.contact or self.default_contact
        contact = formatter.format(contact, **replacement_dict)

        y_crops = select_crop_parts(crops, select=self.y)
        x_crops = select_crop_parts(crops, select=self.x, exclude=self.y)

        # The templates are independent of the part names, so resolve them once
        name_template = self.name or self.default_name
        title_template = self.title or self.default_title
        description_template = self.description or self.default_description
        check_template = self.check or self.default_check

        # Keyword arguments of the fit; kept in their own variable so that
        # the **kwds parameter of this method is not overwritten.
        fit_kwds = {} if self.fit_z_score is None else {"z_score": self.fit_z_score}

        for y_part_name, y_parts in iter_items_sorted_for_key(y_crops):
            for x_part_name, x_parts in iter_items_sorted_for_key(x_crops):

                if self.skip_single_valued and not self.has_more_than_one_value(x_parts):
                    get_logger().info('Skipping "%s" by "%s" profile because x has only a single value "%s"',
                                      y_part_name,
                                      x_part_name,
                                      x_parts[0])
                    continue

                if self.skip_single_valued and not self.has_more_than_one_value(y_parts):
                    get_logger().info('Skipping "%s" by "%s" profile because y has only a single value "%s"',
                                      y_part_name,
                                      x_part_name,
                                      y_parts[0])
                    continue

                part_names = dict(x_part_name=x_part_name, y_part_name=y_part_name)
                name = formatter.format(name_template, **part_names, **replacement_dict)
                title = formatter.format(title_template, **part_names, **replacement_dict)
                description = formatter.format(description_template, **part_names, **replacement_dict)
                check = formatter.format(check_template, **part_names, **replacement_dict)

                profile_plot = ValidationPlot(name)

                plot_kind = self.plot_kind
                if plot_kind == "profile":
                    profile_plot.profile(x_parts,
                                         y_parts,
                                         lower_bound=self.lower_bound,
                                         upper_bound=self.upper_bound,
                                         bins=self.bins,
                                         y_binary=self.y_binary,
                                         y_log=self.y_log,
                                         outlier_z_score=self.outlier_z_score,
                                         allow_discrete=self.allow_discrete,
                                         stackby=stackby_parts)

                    if self.fit:
                        # Prefer a dedicated fit_<name> method of the plot and
                        # fall back to the generic fit method if it is missing.
                        # Only AttributeError signals a missing method; other
                        # exceptions (e.g. KeyboardInterrupt) must propagate.
                        fit_method_name = 'fit_' + str(self.fit)
                        try:
                            fit_method = getattr(profile_plot, fit_method_name)
                        except AttributeError:
                            profile_plot.fit(str(self.fit), **fit_kwds)
                        else:
                            fit_method(**fit_kwds)

                elif plot_kind == "scatter":
                    # Note that no fit is applied to scatter plots
                    profile_plot.scatter(x_parts,
                                         y_parts,
                                         lower_bound=self.lower_bound,
                                         upper_bound=self.upper_bound,
                                         outlier_z_score=self.outlier_z_score,
                                         stackby=stackby_parts)

                profile_plot.title = title
                profile_plot.contact = contact
                profile_plot.description = description
                profile_plot.check = check

                profile_plot.xlabel = compose_axis_label(x_part_name)
                profile_plot.ylabel = compose_axis_label(y_part_name, self.y_unit)

                if tdirectory:
                    profile_plot.write(tdirectory)

    @staticmethod
    def has_more_than_one_value(xs):
        """Check if a sequence contains an element that differs from its first one.

        Raises:
            IndexError: if xs is empty, because the first element is read.
        """
        first_x = xs[0]
        return any(x != first_x for x in xs)


class SaveProfilesRefiner(Plot2DRefiner):
    """Plot2DRefiner specialisation that draws profile histograms.

    Only supplies the plot kind and the default templates that
    Plot2DRefiner.refine reads from the class.
    """

    # Selects the profile branch in Plot2DRefiner.refine
    plot_kind = "profile"

    # Template for the name of each profile plot
    default_name = "{module.id}_{y_part_name}_by_{x_part_name}_profile{groupby_key}{stackby_key}"

    # Template for the title of each profile plot
    default_title = "Profile of {y_part_name} by {x_part_name} from {module.title}"

    # Template for the description
    default_description = "This is a profile of {y_part_name} over {x_part_name}."

    # Template for the check instruction
    default_check = "Check if the trend line is reasonable."

    # Template for the contact
    default_contact = "{module.contact}"


class SaveScatterRefiner(Plot2DRefiner):
    """Plot2DRefiner specialisation that draws 2D scatter plots.

    Only supplies the plot kind and the default templates that
    Plot2DRefiner.refine reads from the class.
    """

    # Selects the scatter branch in Plot2DRefiner.refine
    plot_kind = "scatter"

    # Template for the name of each scatter plot
    default_name = "{module.id}_{y_part_name}_by_{x_part_name}_scatter{groupby_key}{stackby_key}"

    # Template for the title of each scatter plot
    default_title = "Scatter of {y_part_name} by {x_part_name} from {module.title}"

    # Template for the description
    default_description = "This is a scatter of {y_part_name} over {x_part_name}."

    # Template for the check instruction
    default_check = "Check if the distributions is reasonable."

    # Template for the contact
    default_contact = "{module.contact}"


class SaveClassificationAnalysisRefiner(Refiner):
    """Refiner for truth-classification analyses.

    Looks up a truth part and one or more estimate parts in the crops and
    runs a ClassificationAnalysis for each estimate against the truth.
    """

    # Template for the contact
    default_contact = "{module.contact}"

    # Template for the name of the crop part holding the truth
    default_truth_name = "{part_name}_truth"

    # Template for the name of the crop part holding the estimate
    default_estimate_name = "{part_name}_estimate"

    def __init__(self,
                 part_name=None,
                 contact=None,
                 estimate_name=None,
                 truth_name=None,
                 cut_direction=None,
                 cut=None,
                 lower_bound=None,
                 upper_bound=None,
                 outlier_z_score=None,
                 allow_discrete=False,
                 unit=None):
        """Store the configuration of this refiner.

        Parameters:
            part_name: value substituted for ``{part_name}`` in the truth and
                estimate name templates.
            contact: optional template replacing ``default_contact``.
            estimate_name: template of the estimate part name, or an iterable
                of such templates; None selects ``default_estimate_name``.
            truth_name: template of the truth part name; None selects
                ``default_truth_name``.
            cut_direction, cut, lower_bound, upper_bound, outlier_z_score,
                allow_discrete, unit: forwarded unchanged to
                ClassificationAnalysis.
        """
        # Initialise the base class like the other refiners do, so that the
        # refiner_function attribute exists on every Refiner instance.
        super().__init__()

        # Base name used to derive the truth and estimate part names
        self.part_name = part_name

        # Template for the contact
        self.contact = contact

        # Templates for the names of the crop parts to compare
        self.estimate_name = estimate_name
        self.truth_name = truth_name

        # Settings handed to the ClassificationAnalysis
        self.cut = cut
        self.cut_direction = cut_direction
        self.lower_bound = lower_bound
        self.upper_bound = upper_bound
        self.outlier_z_score = outlier_z_score
        self.allow_discrete = allow_discrete
        self.unit = unit

    def refine(self,
               harvesting_module,
               crops,
               tdirectory=None,
               groupby_part_name=None,
               groupby_value=None,
               **kwds):
        """Run and optionally write a classification analysis per estimate.

        Parameters:
            harvesting_module: module available as ``{module}`` in the
                contact template.
            crops: mapping of part names to values; must contain the truth
                part and every estimate part.
            tdirectory: if truthy, each analysis is written there.
            groupby_part_name, groupby_value: group information made
                available to the contact template.
            **kwds: accepted but not used.

        Raises:
            KeyError: presumably, if a truth or estimate part is missing from
                crops (depends on the type of crops).
        """
        replacement_dict = dict(
            refiner=self,
            module=harvesting_module,
            groupby_key='_' + groupby_part_name + groupby_value if groupby_part_name else "",
            groupby=groupby_part_name,  # deprecated
            groupby_value=groupby_value,  # deprecated
        )

        contact = self.contact or self.default_contact
        contact = formatter.format(contact, **replacement_dict)

        if self.truth_name is not None:
            truth_name = self.truth_name
        else:
            truth_name = self.default_truth_name

        truth_name = formatter.format(truth_name, part_name=self.part_name)
        truths = crops[truth_name]

        if self.estimate_name is not None:
            estimate_name_templates = self.estimate_name
        else:
            estimate_name_templates = self.default_estimate_name

        # A single template is treated as a list with one entry
        if isinstance(estimate_name_templates, str):
            estimate_name_templates = [estimate_name_templates, ]

        for estimate_name_template in estimate_name_templates:
            estimate_name = formatter.format(estimate_name_template, part_name=self.part_name)
            estimates = crops[estimate_name]

            classification_analysis = ClassificationAnalysis(quantity_name=estimate_name,
                                                             contact=contact,
                                                             cut_direction=self.cut_direction,
                                                             cut=self.cut,
                                                             lower_bound=self.lower_bound,
                                                             upper_bound=self.upper_bound,
                                                             outlier_z_score=self.outlier_z_score,
                                                             allow_discrete=self.allow_discrete,
                                                             unit=self.unit)

            classification_analysis.analyse(estimates, truths)

            if tdirectory:
                classification_analysis.write(tdirectory)


class SavePullAnalysisRefiner(Refiner):
    """Refiner for pull analyses.

    For every configured part name the truth, estimate and (if present)
    variance parts are looked up in the crops and handed to a PullAnalysis.
    """

    # Template for the base name of the plots
    default_name = "{module.id}_{quantity_name}"

    # Template for the contact
    default_contact = "{module.contact}"

    # Template appended to the title of the plots
    default_title_postfix = " from {module.title}"

    # Template for the name of the crop part holding the truth
    default_truth_name = "{part_name}_truth"

    # Template for the name of the crop part holding the estimate
    default_estimate_name = "{part_name}_estimate"

    # Template for the name of the crop part holding the variance
    default_variance_name = "{part_name}_variance"

    def __init__(self,
                 name=None,
                 contact=None,
                 title_postfix=None,
                 part_name=None,
                 part_names=None,
                 truth_name=None,
                 estimate_name=None,
                 variance_name=None,
                 quantity_name=None,
                 aux_names=None,
                 unit=None,
                 outlier_z_score=None,
                 absolute=False,
                 which_plots=None):
        """Store the configuration of this refiner.

        Parameters:
            name, contact, title_postfix: optional templates replacing the
                corresponding ``default_*`` class attribute.
            part_name: single base name to analyse; appended to part_names.
            part_names: iterable of base names to analyse.
            truth_name, estimate_name, variance_name: optional templates for
                the crop part names; None selects the class default.
            quantity_name: name passed to PullAnalysis; if falsy the part
                name is used instead.
            aux_names: selection of auxiliary crop parts passed to the
                analysis; None means no auxiliaries.
            unit, outlier_z_score, absolute: forwarded to PullAnalysis.
            which_plots: forwarded to ``PullAnalysis.analyse``.
        """
        # Initialise the base class like the other refiners do, so that the
        # refiner_function attribute exists on every Refiner instance.
        super().__init__()

        if aux_names is None:
            aux_names = []

        # Templates, expanded in refine()
        self.name = name
        self.contact = contact
        self.title_postfix = title_postfix

        # Base names to analyse. The given list is copied so that appending
        # part_name below does not modify the caller's list.
        self.part_names = list(part_names) if part_names is not None else []
        if part_name is not None:
            self.part_names.append(part_name)

        # Templates for the names of the crop parts to look up
        self.truth_name = truth_name
        self.estimate_name = estimate_name
        self.variance_name = variance_name

        # Name of the quantity shown in the plots
        self.quantity_name = quantity_name

        # Unit of the quantity
        self.unit = unit

        # Names of the auxiliary parts
        self.aux_names = aux_names

        # Settings handed to the PullAnalysis
        self.outlier_z_score = outlier_z_score
        self.absolute = absolute
        self.which_plots = which_plots

    def refine(self,
               harvesting_module,
               crops,
               tdirectory=None,
               groupby_part_name=None,
               groupby_value=None,
               **kwds):
        """Run and optionally write a pull analysis for every part name.

        Parameters:
            harvesting_module: module available as ``{module}`` in the templates.
            crops: mapping of part names to values; must contain the truth
                and estimate part of every part name. A missing variance part
                (KeyError) is tolerated and passed on as None.
            tdirectory: if truthy, each analysis is written there.
            groupby_part_name, groupby_value: group information made
                available to the templates.
            **kwds: accepted but not used.
        """
        replacement_dict = dict(
            refiner=self,
            module=harvesting_module,
            # stackby_key='_' + stackby if stackby else "",
            groupby_key='_' + groupby_part_name + groupby_value if groupby_part_name else "",
            groupby=groupby_part_name,  # deprecated
            groupby_value=groupby_value,  # deprecated
        )

        contact = self.contact or self.default_contact
        contact = formatter.format(contact, **replacement_dict)

        # Keep the unformatted templates outside of the loop. Formatting into
        # the same variable would make every later part reuse the name that
        # was already expanded for the first part.
        name_template = self.name or self.default_name

        title_postfix_template = self.title_postfix
        if title_postfix_template is None:
            title_postfix_template = self.default_title_postfix

        if self.truth_name is not None:
            truth_name_template = self.truth_name
        else:
            truth_name_template = self.default_truth_name

        if self.estimate_name is not None:
            estimate_name_template = self.estimate_name
        else:
            estimate_name_template = self.default_estimate_name

        if self.variance_name is not None:
            variance_name_template = self.variance_name
        else:
            variance_name_template = self.default_variance_name

        if self.aux_names:
            auxiliaries = select_crop_parts(crops, self.aux_names)
        else:
            auxiliaries = {}

        which_plots = self.which_plots

        for part_name in self.part_names:
            name = formatter.format(name_template, part_name=part_name, **replacement_dict)
            # {subplot_name}, {subplot_title} and {quantity_name} are not
            # expanded here - presumably PullAnalysis fills them in.
            plot_name = name + "_{subplot_name}"

            title_postfix = formatter.format(title_postfix_template, part_name=part_name, **replacement_dict)
            plot_title = "{subplot_title} of {quantity_name}" + title_postfix

            truth_name = formatter.format(truth_name_template, part_name=part_name)
            estimate_name = formatter.format(estimate_name_template, part_name=part_name)
            variance_name = formatter.format(variance_name_template, part_name=part_name)

            truths = crops[truth_name]
            estimates = crops[estimate_name]
            try:
                variances = crops[variance_name]
            except KeyError:
                # The variance is optional
                variances = None

            quantity_name = self.quantity_name or part_name

            pull_analysis = PullAnalysis(quantity_name,
                                         unit=self.unit,
                                         absolute=self.absolute,
                                         outlier_z_score=self.outlier_z_score,
                                         plot_name=plot_name,
                                         plot_title=plot_title)

            pull_analysis.analyse(truths,
                                  estimates,
                                  variances,
                                  auxiliaries=auxiliaries,
                                  which_plots=which_plots)

            pull_analysis.contact = contact

            if tdirectory:
                pull_analysis.write(tdirectory)


class SaveTreeRefiner(Refiner):
    """Refiner that stores the crops in a ROOT TTree.

    Every crop part becomes one branch of the tree. Constructor arguments
    that are left empty fall back to the ``default_*`` class attributes.
    """

    # Template for the name of the tree
    default_name = "{module.id}_tree"

    # Template for the title of the tree
    default_title = "Tree of {module.id}"

    def __init__(self,
                 name=None,
                 title=None):
        """Store the optional name and title templates of the tree."""
        super().__init__()

        # Template for the name of the tree
        self.name = name

        # Template for the title of the tree
        self.title = title

    def refine(self,
               harvesting_module,
               crops,
               tdirectory=None,
               groupby_part_name=None,
               groupby_value=None,
               **kwds):
        """Create the TTree inside tdirectory, fill one branch per part and write it.

        Parameters:
            harvesting_module: module available as ``{module}`` in the templates.
            crops: mapping of part names to values, iterated through
                iter_items_sorted_for_key.
            tdirectory: directory handed to root_cd while the tree is built.
            groupby_part_name, groupby_value: group information made
                available to the templates.
            **kwds: accepted but not used.
        """
        if groupby_part_name:
            groupby_key = '_' + groupby_part_name + groupby_value
        else:
            groupby_key = ""

        replacement_dict = {
            "refiner": self,
            "module": harvesting_module,
            "groupby_key": groupby_key,
            "groupby": groupby_part_name,  # deprecated
            "groupby_value": groupby_value,  # deprecated
        }

        with root_cd(tdirectory):
            name = formatter.format(self.name or self.default_name, **replacement_dict)
            title = formatter.format(self.title or self.default_title, **replacement_dict)

            output_ttree = ROOT.TTree(root_save_name(name), title)
            for part_name, parts in iter_items_sorted_for_key(crops):
                self.add_branch(output_ttree, part_name, parts)

            output_ttree.FlushBaskets()
            output_ttree.Write()

    def add_branch(self, output_ttree, part_name, parts):
        """Add a branch of doubles named part_name to the tree and fill it with parts."""
        # One element buffer the branch reads its value from
        input_value = np.zeros(1, dtype=float)

        tbranch = output_ttree.Branch(part_name, input_value, f'{part_name}/D')

        # On filling of the first branch we need to use the fill method of the TTree
        # For all other branches we can use the one of the branch
        # #justrootthings
        if output_ttree.GetNbranches() == 1:
            fill = output_ttree.Fill
        else:
            fill = tbranch.Fill

        for value in parts:
            input_value[0] = value
            fill()

        output_ttree.GetEntry(0)
        output_ttree.ResetBranchAddress(tbranch)
        # No subbranches here but we drop the buffers just in case.
        also_subbranches = True
        output_ttree.DropBranchFromCache(tbranch, also_subbranches)


class FilterRefiner(Refiner):
    """Refiner that filters the crops before passing them to a wrapped refiner."""

    def __init__(self, wrapped_refiner, filter=None, on=None):
        """Store the wrapped refiner and the filter configuration.

        Parameters:
            wrapped_refiner: callable invoked with the filtered crops.
            filter: filter handed to filter_crops; defaults to numpy.nonzero.
            on: passed to filter_crops as ``part_name``.
        """
        # Initialise the base class like the other refiners do, so that the
        # refiner_function attribute exists on every Refiner instance.
        super().__init__()

        # Refiner that receives the filtered crops
        self.wrapped_refiner = wrapped_refiner

        # Filter to apply; select the nonzero entries by default
        self.filter = np.nonzero if filter is None else filter

        # Name of the part the filter is evaluated on
        self.on = on

    def refine(self, harvesting_module, crops, *args, **kwds):
        """Filter the crops and forward them with all other arguments to the wrapped refiner."""
        filtered_crops = filter_crops(crops, self.filter, part_name=self.on)
        self.wrapped_refiner(harvesting_module, filtered_crops, *args, **kwds)


class SelectRefiner(Refiner):
    """Refiner that selects a subset of the crop parts for a wrapped refiner."""

    def __init__(self, wrapped_refiner, select=None, exclude=None):
        """Store the wrapped refiner and the selection.

        Parameters:
            wrapped_refiner: callable invoked with the selected crops.
            select: passed to select_crop_parts as ``select``; None becomes
                an empty list.
            exclude: passed to select_crop_parts as ``exclude``; None becomes
                an empty list.
        """
        # Initialise the base class like the other refiners do, so that the
        # refiner_function attribute exists on every Refiner instance.
        super().__init__()

        # Refiner that receives the selected crops
        self.wrapped_refiner = wrapped_refiner

        # Parts to select
        self.select = [] if select is None else select

        # Parts to exclude
        self.exclude = [] if exclude is None else exclude

    def refine(self, harvesting_module, crops, *args, **kwds):
        """Select the crop parts and forward them with all other arguments to the wrapped refiner."""
        selected_crops = select_crop_parts(crops, select=self.select, exclude=self.exclude)
        self.wrapped_refiner(harvesting_module, selected_crops, *args, **kwds)


class GroupByRefiner(Refiner):
    """Refiner that splits the crops into groups and runs a wrapped refiner on each group.

    A groupby specification is one of

    * None: no grouping, the wrapped refiner receives all crops once,
    * a part name: one group per unique value of that part,
    * a tuple (part name, cuts): one group per interval between the cuts.
    """

    # Whether the part used for grouping is removed from the crops handed on
    default_exclude_by = True

    def __init__(self,
                 wrapped_refiner,
                 by=None,
                 exclude_by=None):
        """Store the wrapped refiner and the grouping configuration.

        Parameters:
            wrapped_refiner: callable invoked once per non-empty group.
            by: a single groupby specification or a list of them; None
                becomes an empty list.
            exclude_by: overrides ``default_exclude_by`` unless it is None.
        """
        # Initialise the base class like the other refiners do, so that the
        # refiner_function attribute exists on every Refiner instance.
        super().__init__()

        if by is None:
            by = []

        # Refiner that receives the grouped crops
        self.wrapped_refiner = wrapped_refiner

        # Groupby specification(s)
        self.by = by

        # Switch to exclude the groupby part from the crops handed on
        self.exclude_by = exclude_by if exclude_by is not None else self.default_exclude_by

    def refine(self,
               harvesting_module,
               crops,
               groupby_part_name=None,
               groupby_value=None,
               *args,
               **kwds):
        """Call the wrapped refiner for every non-empty group of every specification.

        Parameters:
            harvesting_module: forwarded to the wrapped refiner.
            crops: mapping of part names to values; must contain every part
                named in the groupby specifications.
            groupby_part_name, groupby_value: accepted but ignored; the
                wrapped refiner receives the values determined here.
            *args, **kwds: forwarded to the wrapped refiner.

        Raises:
            ValueError: if a groupby specification is neither None, a string
                nor a tuple.
        """
        by = self.by

        # A single name to do the group by
        # NOTE(review): __init__ replaces by=None with an empty list, so the
        # None case below is only reachable if self.by is reassigned after
        # construction - confirm whether by=None should mean "no grouping".
        if isinstance(by, str) or by is None:
            # Wrap it into a list and continue with the general case
            by = [by, ]

        for groupby_spec in by:
            if groupby_spec is None:
                # No grouping requested: hand on all crops, with None as the
                # group name and value to indicate that everything was selected.
                self.wrapped_refiner(harvesting_module,
                                     crops,
                                     *args,
                                     groupby_part_name=None,
                                     groupby_value=None,
                                     **kwds)
                continue

            elif isinstance(groupby_spec, str):
                # One group per unique value of the part
                part_name = groupby_spec
                groupby_parts = crops[part_name]
                unique_values, index_of_values = np.unique(groupby_parts, return_inverse=True)
                # The label used to carry a stray closing bracket (" = 1]").
                # NOTE(review): the cut labels below have no leading space
                # while these do; names built from them differ accordingly.
                groupby_values = [f" = {value}" for value in unique_values]

            elif isinstance(groupby_spec, tuple):
                # One group per interval defined by the cuts
                part_name = groupby_spec[0]
                cuts = groupby_spec[1]

                groupby_parts = crops[part_name]

                # Take care of nans: with infinity as the last cut the index
                # beyond the last bin is left over for the "is nan" group.
                digitization_cuts = list(np.sort(cuts))
                if digitization_cuts[-1] != np.inf:
                    digitization_cuts.append(np.inf)
                index_of_values = np.digitize(groupby_parts, digitization_cuts, right=True)

                groupby_values = [f"below {digitization_cuts[0]}"]
                bin_bounds = list(zip(digitization_cuts, digitization_cuts[1:]))
                for lower_bound, upper_bound in bin_bounds:
                    if lower_bound == upper_bound:
                        # degenerated bin case
                        groupby_values.append(f"= {lower_bound}")
                    elif upper_bound == np.inf:
                        groupby_values.append(f"above {lower_bound}")
                    else:
                        groupby_values.append(f"between {lower_bound} and {upper_bound}")
                groupby_values.append("is nan")
                assert len(groupby_values) == len(digitization_cuts) + 1

            else:
                raise ValueError(f"Unknown groupby specification {groupby_spec}")

            # Exclude the groupby variable if desired
            selected_crops = select_crop_parts(crops, exclude=part_name if self.exclude_by else None)

            for index_of_value, value_label in enumerate(groupby_values):
                indices_for_value = index_of_values == index_of_value
                if not np.any(indices_for_value):
                    # Nothing falls into this group
                    continue

                filtered_crops = filter_crops(selected_crops, indices_for_value)

                self.wrapped_refiner(harvesting_module,
                                     filtered_crops,
                                     *args,
                                     groupby_part_name=part_name,
                                     groupby_value=value_label,
                                     **kwds)


class CdRefiner(Refiner):
    """Meta refiner that runs the wrapped refiner inside a (sub)directory.

    The folder name and the groupby addition are format templates that are
    filled through the module level ``formatter`` with the fields
    ``groupby`` (the groupby part name), ``groupby_value`` and, for the
    folder name only, ``groupby_addition``.
    """

    # Folder name template used when no folder name was configured and
    # refine() is called without a groupby value.
    default_folder_name = ""

    # Groupby addition template used when none was configured.
    default_groupby_addition = "_groupby_{groupby}_{groupby_value}"

    def __init__(self, wrapped_refiner, folder_name=None, groupby_addition=None):
        """Store the wrapped refiner and the optional name templates.

        wrapped_refiner  -- callable invoked from within the target directory
        folder_name      -- folder name template, None selects a default in refine()
        groupby_addition -- groupby addition template, None selects the class default
        """
        self.wrapped_refiner = wrapped_refiner
        self.folder_name = folder_name
        self.groupby_addition = groupby_addition

    def refine(self,
               harvesting_module,
               crops,
               tdirectory=None,
               groupby_part_name=None,
               groupby_value=None,
               *args,
               **kwds):
        """Change into the formatted folder and call the wrapped refiner there.

        The wrapped refiner receives the object yielded by the inner
        ``root_cd`` as ``tdirectory``; the groupby information and all
        remaining arguments are forwarded unchanged.
        """
        folder_template = self.folder_name
        if folder_template is None:
            # Without an explicit folder name a groupby value alone decides the folder.
            folder_template = self.default_folder_name if groupby_value is None else "{groupby_addition}"

        addition_template = self.groupby_addition
        if addition_template is None:
            addition_template = self.default_groupby_addition

        without_groupby = groupby_part_name is None and groupby_value is None
        if without_groupby:
            addition = ""
        else:
            addition = formatter.format(addition_template,
                                        groupby=groupby_part_name,
                                        groupby_value=groupby_value)

        formatted_folder = formatter.format(folder_template,
                                            groupby_addition=addition,
                                            groupby=groupby_part_name,
                                            groupby_value=groupby_value)

        # Every path segment is passed through root_save_name individually,
        # the '/' separators are kept.
        save_path = '/'.join(map(root_save_name, formatted_folder.split('/')))

        # First enter the directory handed in, then the folder below it.
        with root_cd(tdirectory), root_cd(save_path) as sub_tdirectory:
            self.wrapped_refiner(harvesting_module,
                                 crops,
                                 *args,
                                 tdirectory=sub_tdirectory,
                                 groupby_part_name=groupby_part_name,
                                 groupby_value=groupby_value,
                                 **kwds)


class ExpertLevelRefiner(Refiner):
    """Meta refiner that runs the wrapped refiner only for matching expert levels.

    The expert level is read from ``harvesting_module.expert_level`` and
    compared strictly against the configured bounds.
    """

    def __init__(self, wrapped_refiner, above_expert_level=None, below_expert_level=None):
        """Store the wrapped refiner and the optional bounds.

        wrapped_refiner    -- callable invoked when the expert level is accepted
        above_expert_level -- if not None, the expert level must be strictly greater
        below_expert_level -- if not None, the expert level must be strictly smaller
        """
        self.wrapped_refiner = wrapped_refiner
        self.above_expert_level = above_expert_level
        self.below_expert_level = below_expert_level

    def refine(self, harvesting_module, crops, *args, **kwds):
        """Forward to the wrapped refiner if the expert level passes all set bounds."""
        exclusive_lower = self.above_expert_level
        exclusive_upper = self.below_expert_level

        if exclusive_lower is not None and not harvesting_module.expert_level > exclusive_lower:
            return

        if exclusive_upper is not None and not harvesting_module.expert_level < exclusive_upper:
            return

        self.wrapped_refiner(harvesting_module, crops, *args, **kwds)


# Meta refiner decorators

def groupby(refiner=None, **kwds):
    """Wrap a refiner into a GroupByRefiner, directly or as a decorator.

    Called with a refiner, the GroupByRefiner around it is returned.
    Called without one, a decorator is returned that performs the wrapping
    later. The keyword arguments are handed to the GroupByRefiner constructor.
    """
    def group_decorator(wrapped_refiner):
        return GroupByRefiner(wrapped_refiner, **kwds)

    return group_decorator if refiner is None else group_decorator(refiner)


def select(refiner=None, **kwds):
    """Wrap a refiner into a SelectRefiner, directly or as a decorator.

    Called with a refiner, the SelectRefiner around it is returned.
    Called without one, a decorator is returned that performs the wrapping
    later. The keyword arguments are handed to the SelectRefiner constructor.
    """
    def select_decorator(wrapped_refiner):
        return SelectRefiner(wrapped_refiner, **kwds)

    return select_decorator if refiner is None else select_decorator(refiner)


def filter(refiner=None, **kwds):
    """Wrap a refiner into a FilterRefiner, directly or as a decorator.

    Called with a refiner, the FilterRefiner around it is returned.
    Called without one, a decorator is returned that performs the wrapping
    later. The keyword arguments are handed to the FilterRefiner constructor.
    """
    def filter_decorator(wrapped_refiner):
        return FilterRefiner(wrapped_refiner, **kwds)

    return filter_decorator if refiner is None else filter_decorator(refiner)


def cd(refiner=None, **kwds):
    """Wrap a refiner into a CdRefiner, directly or as a decorator.

    Called with a refiner, the CdRefiner around it is returned.
    Called without one, a decorator is returned that performs the wrapping
    later. The keyword arguments are handed to the CdRefiner constructor.
    """
    def cd_decorator(wrapped_refiner):
        return CdRefiner(wrapped_refiner, **kwds)

    return cd_decorator if refiner is None else cd_decorator(refiner)


def context(refiner=None,
            above_expert_level=None, below_expert_level=None,
            folder_name=None, folder_groupby_addition=None,
            filter=None, filter_on=None,
            groupby=None, exclude_groupby=None,
            select=None, exclude=None):
    """Stack the requested meta refiners around a refiner.

    Only the meta refiners whose options are set are applied. From the
    outermost to the innermost layer these are: ExpertLevelRefiner,
    FilterRefiner, GroupByRefiner, CdRefiner, SelectRefiner, followed by
    the refiner itself. A CdRefiner is also inserted whenever ``groupby``
    is given. A result that is not a Refiner instance is wrapped into a
    plain Refiner.

    Called with a refiner, the stacked refiner is returned after
    functools.wraps copied the metadata of the original onto it.
    Called without one, a decorator doing the stacking is returned.
    """
    use_selection = not (select is None and exclude is None)
    use_folder = not (folder_name is None and groupby is None and folder_groupby_addition is None)
    use_groupby = groupby is not None
    use_filter = not (filter is None and filter_on is None)
    use_expert_level = not (above_expert_level is None and below_expert_level is None)

    def context_decorator(wrapped_refiner):
        # The layers are added innermost first, hence in the reverse order
        # of their later execution.
        if use_selection:
            wrapped_refiner = SelectRefiner(wrapped_refiner,
                                            select=select,
                                            exclude=exclude)

        if use_folder:
            wrapped_refiner = CdRefiner(wrapped_refiner,
                                        folder_name=folder_name,
                                        groupby_addition=folder_groupby_addition)

        if use_groupby:
            wrapped_refiner = GroupByRefiner(wrapped_refiner,
                                             by=groupby,
                                             exclude_by=exclude_groupby)

        if use_filter:
            wrapped_refiner = FilterRefiner(wrapped_refiner,
                                            filter=filter,
                                            on=filter_on)

        if use_expert_level:
            wrapped_refiner = ExpertLevelRefiner(wrapped_refiner,
                                                 above_expert_level=above_expert_level,
                                                 below_expert_level=below_expert_level)

        if not isinstance(wrapped_refiner, Refiner):
            wrapped_refiner = Refiner(wrapped_refiner)

        return wrapped_refiner

    if refiner is None:
        return context_decorator

    # NOTE(review): functools.wraps also merges refiner.__dict__ into the
    # result. If refiner is itself a meta refiner this presumably overwrites
    # attributes such as wrapped_refiner on the outermost layer -- confirm.
    return functools.wraps(refiner)(context_decorator(refiner))


def refiner_with_context(refiner_factory):
    """Extend a refiner factory by the keyword options of context().

    The returned function takes the context options as named keyword
    parameters and hands every other keyword argument to the factory.
    The created refiner is then passed through context() together with
    the context options. functools.wraps copies the metadata of the
    factory onto the returned function.
    """
    @functools.wraps(refiner_factory)
    def module_decorator_with_context(above_expert_level=None, below_expert_level=None,
                                      folder_name=None, folder_groupby_addition=None,
                                      filter=None, filter_on=None,
                                      groupby=None, exclude_groupby=None,
                                      select=None, exclude=None,
                                      **kwds_for_refiner_factory):
        refiner = refiner_factory(**kwds_for_refiner_factory)

        context_options = {
            "above_expert_level": above_expert_level,
            "below_expert_level": below_expert_level,
            "folder_name": folder_name,
            "folder_groupby_addition": folder_groupby_addition,
            "filter": filter,
            "filter_on": filter_on,
            "groupby": groupby,
            "exclude_groupby": exclude_groupby,
            "select": select,
            "exclude": exclude,
        }
        return context(refiner, **context_options)

    return module_decorator_with_context


@refiner_with_context
def save_fom(**refiner_kwds):
    """Create a SaveFiguresOfMeritRefiner from the given keyword arguments.

    The refiner_with_context decorator consumes the context options
    before the remaining keyword arguments reach this factory.
    """
    return SaveFiguresOfMeritRefiner(**refiner_kwds)


@refiner_with_context
def save_histograms(**refiner_kwds):
    """Create a SaveHistogramsRefiner from the given keyword arguments.

    The refiner_with_context decorator consumes the context options
    before the remaining keyword arguments reach this factory.
    """
    return SaveHistogramsRefiner(**refiner_kwds)


@refiner_with_context
def save_profiles(**refiner_kwds):
    """Create a SaveProfilesRefiner from the given keyword arguments.

    The refiner_with_context decorator consumes the context options
    before the remaining keyword arguments reach this factory.
    """
    return SaveProfilesRefiner(**refiner_kwds)


@refiner_with_context
def save_scatters(**refiner_kwds):
    """Create a SaveScatterRefiner from the given keyword arguments.

    The refiner_with_context decorator consumes the context options
    before the remaining keyword arguments reach this factory.
    """
    return SaveScatterRefiner(**refiner_kwds)


@refiner_with_context
def save_classification_analysis(**refiner_kwds):
    """Create a SaveClassificationAnalysisRefiner from the given keyword arguments.

    The refiner_with_context decorator consumes the context options
    before the remaining keyword arguments reach this factory.
    """
    return SaveClassificationAnalysisRefiner(**refiner_kwds)


@refiner_with_context
def save_pull_analysis(**refiner_kwds):
    """Create a SavePullAnalysisRefiner from the given keyword arguments.

    The refiner_with_context decorator consumes the context options
    before the remaining keyword arguments reach this factory.
    """
    return SavePullAnalysisRefiner(**refiner_kwds)


@refiner_with_context
def save_tree(**refiner_kwds):
    """Create a SaveTreeRefiner from the given keyword arguments.

    The refiner_with_context decorator consumes the context options
    before the remaining keyword arguments reach this factory.
    """
    return SaveTreeRefiner(**refiner_kwds)


def select_crop_parts(crops, select=None, exclude=None):
    """Return the crops restricted to the selected and not excluded parts.

    crops   -- mutable mapping from part names to parts
    select  -- part name, collection of part names, or a mapping used for
               renaming: its keys are part names or callables, its values
               the new part names. A callable key is invoked with all
               original crops as keyword arguments and its result is
               stored under the new name.
    exclude -- part name or collection of part names to drop

    If neither a selection nor an exclusion is given, the crops object
    itself is returned. Otherwise a shallow copy is modified and returned.
    Selected names that are absent from the crops only cause a logged
    warning. Crops that are not a mutable mapping raise a ValueError.
    """
    select = [] if select is None else select
    exclude = [] if exclude is None else exclude

    # A single name is treated like a one-element list
    if isinstance(select, str):
        select = [select]
    if isinstance(exclude, str):
        exclude = [exclude]

    if not isinstance(crops, collections.abc.MutableMapping):
        raise ValueError(f"Unrecognised crop {crops} of type {type(crops)}")

    available_names = list(crops.keys())

    if not select and not exclude:
        return crops

    names_to_drop = set()

    if select:
        names_to_drop.update(name for name in available_names if name not in select)

        # Callable selection items are computed later and hence are not
        # expected among the available part names.
        unavailable_names = [name for name in select
                             if not isinstance(name, collections.abc.Callable) and name not in available_names]
        if unavailable_names:
            get_logger().warning("Cannot select %s, because they are not in crop part names %s",
                                 unavailable_names, sorted(available_names))

    if exclude:
        names_to_drop.update(name for name in available_names if name in exclude)

    # Work on a shallow copy to leave the given crops untouched
    selected_crops = copy.copy(crops)
    for dropped_name in names_to_drop:
        del selected_crops[dropped_name]

    if isinstance(select, collections.abc.Mapping):
        # The selection doubles as a rename mapping
        for old_name, new_name in list(select.items()):
            if isinstance(old_name, collections.abc.Callable):
                selected_crops[new_name] = old_name(**crops)
            elif old_name in selected_crops:
                selected_crops[new_name] = selected_crops.pop(old_name)

    return selected_crops


def filter_crops(crops, filter_function, part_name=None):
    """Return the crops reduced to the entries picked by a filter.

    crops           -- numpy array or mutable mapping from part names to parts
    filter_function -- either a numpy array that is used directly as index,
                       or a callable that receives crops[part_name] and
                       returns the index
    part_name       -- key of the part handed to a callable filter

    For a numpy array the indexed array is returned. For a mutable mapping
    a shallow copy is returned in which every part is replaced by its
    indexed version. Any other crops type raises a ValueError.
    """
    if isinstance(filter_function, np.ndarray):
        picked = filter_function
    else:
        picked = filter_function(crops[part_name])

    if isinstance(crops, np.ndarray):
        return crops[picked]

    if isinstance(crops, collections.abc.MutableMapping):
        # Work on a shallow copy to leave the given crops untouched
        filtered_crops = copy.copy(crops)
        for name, values in tuple(crops.items()):
            filtered_crops[name] = values[picked]
        return filtered_crops

    raise ValueError(f"Unrecognised crop {crops} of type {type(crops)}")


def iter_items_sorted_for_key(crops):
    """Return the (key, value) pairs of the crops, sorted by key for a dict.

    If the crops are a dict, a generator over the pairs in sorted key
    order is returned. For every other type the list of crops.items() is
    returned as is, so the class of the crops has to take care of the order.
    """
    if not isinstance(crops, dict):
        return list(crops.items())

    return ((key, crops[key]) for key in sorted(crops.keys()))

tracking.harvest.refiners.CdRefiner
Definition: refiners.py:1039

tracking.harvest.refiners.CdRefiner.default_folder_name
str default_folder_name
Folder name to be used if no folder name is given and no groupby selection is active.
Definition: refiners.py:1043

tracking.harvest.refiners.CdRefiner.__init__
def __init__(self, wrapped_refiner, folder_name=None, groupby_addition=None)
Definition: refiners.py:1050

tracking.harvest.refiners.CdRefiner.folder_name
folder_name
cached value of the folder name
Definition: refiners.py:1056

tracking.harvest.refiners.CdRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, *args, **kwds)
Definition: refiners.py:1067

tracking.harvest.refiners.CdRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:1054

tracking.harvest.refiners.CdRefiner.groupby_addition
groupby_addition
cached value of the suffix for a groupby selection
Definition: refiners.py:1058

tracking.harvest.refiners.CdRefiner.default_groupby_addition
str default_groupby_addition
Default suffix for a groupby selection.
Definition: refiners.py:1045

tracking.harvest.refiners.ExpertLevelRefiner
Definition: refiners.py:1107

tracking.harvest.refiners.ExpertLevelRefiner.below_expert_level
below_expert_level
cached value of the exclusive upper bound of the expert level
Definition: refiners.py:1118

tracking.harvest.refiners.ExpertLevelRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:1114

tracking.harvest.refiners.ExpertLevelRefiner.refine
def refine(self, harvesting_module, crops, *args, **kwds)
Definition: refiners.py:1120

tracking.harvest.refiners.ExpertLevelRefiner.__init__
def __init__(self, wrapped_refiner, above_expert_level=None, below_expert_level=None)
Definition: refiners.py:1110

tracking.harvest.refiners.ExpertLevelRefiner.above_expert_level
above_expert_level
cached value of the exclusive lower bound of the expert level
Definition: refiners.py:1116

tracking.harvest.refiners.FilterRefiner
Definition: refiners.py:893

tracking.harvest.refiners.FilterRefiner.on
on
cached value of the part name to filter on
Definition: refiners.py:909

tracking.harvest.refiners.FilterRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:900

tracking.harvest.refiners.FilterRefiner.refine
def refine(self, harvesting_module, crops, *args, **kwds)
Definition: refiners.py:911

tracking.harvest.refiners.FilterRefiner.filter
filter
cached value of the filter
Definition: refiners.py:904

tracking.harvest.refiners.FilterRefiner.__init__
def __init__(self, wrapped_refiner, filter=None, on=None)
Definition: refiners.py:896

tracking.harvest.refiners.GroupByRefiner
Definition: refiners.py:939

tracking.harvest.refiners.GroupByRefiner.by
by
cached value of the group-by classifier
Definition: refiners.py:955

tracking.harvest.refiners.GroupByRefiner.__init__
def __init__(self, wrapped_refiner, by=None, exclude_by=None)
Definition: refiners.py:948

tracking.harvest.refiners.GroupByRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:953

tracking.harvest.refiners.GroupByRefiner.exclude_by
exclude_by
cached value of the exclude-by classifier
Definition: refiners.py:957

tracking.harvest.refiners.GroupByRefiner.default_exclude_by
bool default_exclude_by
default value of the exclude-by classifier
Definition: refiners.py:943

tracking.harvest.refiners.GroupByRefiner.refine
def refine(self, harvesting_module, crops, groupby_part_name=None, groupby_value=None, *args, **kwds)
Definition: refiners.py:965

tracking.harvest.refiners.Plot2DRefiner
Definition: refiners.py:312

tracking.harvest.refiners.Plot2DRefiner.title
title
cached user-defined title for this profile histogram / scatterplot
Definition: refiners.py:344

tracking.harvest.refiners.Plot2DRefiner.y_log
y_log
cached flag for logarithmic y axis for this profile histogram / scatterplot
Definition: refiners.py:371

tracking.harvest.refiners.Plot2DRefiner.description
description
cached user-defined description for this profile histogram / scatterplot
Definition: refiners.py:347

tracking.harvest.refiners.Plot2DRefiner.contact
contact
cached user-defined contact person for this profile histogram / scatterplot
Definition: refiners.py:351

tracking.harvest.refiners.Plot2DRefiner.fit
fit
cached fit for this profile histogram / scatterplot
Definition: refiners.py:379

tracking.harvest.refiners.Plot2DRefiner.upper_bound
upper_bound
cached upper bound for this profile histogram / scatterplot
Definition: refiners.py:365

tracking.harvest.refiners.Plot2DRefiner.y
y
cached value of ordinate
Definition: refiners.py:356

tracking.harvest.refiners.Plot2DRefiner.outlier_z_score
outlier_z_score
cached Z-score (for outlier detection) for this profile histogram / scatterplot
Definition: refiners.py:374

tracking.harvest.refiners.Plot2DRefiner.y_binary
y_binary
cached flag for probability y axis (range 0.0 to 1.0)
Definition: refiners.py:369

tracking.harvest.refiners.Plot2DRefiner.skip_single_valued
skip_single_valued
cached flag to skip single-valued bins for this profile histogram / scatterplot
Definition: refiners.py:384

tracking.harvest.refiners.Plot2DRefiner.allow_discrete
allow_discrete
cached flag to allow discrete values for this profile histogram / scatterplot
Definition: refiners.py:376

tracking.harvest.refiners.Plot2DRefiner.plot_kind
str plot_kind
by default, this refiner is for profile histograms
Definition: refiners.py:315

tracking.harvest.refiners.Plot2DRefiner.fit_z_score
fit_z_score
cached fit Z-score (for outlier detection) for this profile histogram / scatterplot
Definition: refiners.py:381

tracking.harvest.refiners.Plot2DRefiner.stackby
stackby
cached stacking selection for this profile histogram / scatterplot
Definition: refiners.py:358

tracking.harvest.refiners.Plot2DRefiner.y_unit
y_unit
cached measurement unit for ordinate
Definition: refiners.py:360

tracking.harvest.refiners.Plot2DRefiner.__init__
def __init__(self, y, x=None, name=None, title=None, contact=None, description=None, check=None, stackby=None, y_unit=None, y_binary=None, y_log=None, lower_bound=None, upper_bound=None, bins=None, outlier_z_score=None, fit=None, fit_z_score=None, skip_single_valued=False, allow_discrete=False)
Definition: refiners.py:336

tracking.harvest.refiners.Plot2DRefiner.x
x
cached value of abscissa
Definition: refiners.py:354

tracking.harvest.refiners.Plot2DRefiner.has_more_than_one_value
def has_more_than_one_value(xs)
Definition: refiners.py:505

tracking.harvest.refiners.Plot2DRefiner.name
name
cached user-defined name for this profile histogram / scatterplot
Definition: refiners.py:342

tracking.harvest.refiners.Plot2DRefiner.bins
bins
cached number of bins for this profile histogram / scatterplot
Definition: refiners.py:367

tracking.harvest.refiners.Plot2DRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:392

tracking.harvest.refiners.Plot2DRefiner.lower_bound
lower_bound
cached lower bound for this profile histogram / scatterplot
Definition: refiners.py:363

tracking.harvest.refiners.Plot2DRefiner.check
check
cached user-defined user-check action for this profile histogram / scatterplot
Definition: refiners.py:349

tracking.harvest.refiners.Refiner
Definition: refiners.py:34

tracking.harvest.refiners.Refiner.refiner_function
refiner_function
cached copy of the instance's refiner function
Definition: refiners.py:40

tracking.harvest.refiners.Refiner.__init__
def __init__(self, refiner_function=None)
Definition: refiners.py:37

tracking.harvest.refiners.Refiner.refine
def refine(self, harvesting_module, *args, **kwds)
Definition: refiners.py:69

tracking.harvest.refiners.Refiner.__get__
def __get__(self, harvesting_module, cls=None)
Definition: refiners.py:42

tracking.harvest.refiners.Refiner.__call__
def __call__(self, harvesting_module, crops=None, *args, **kwds)
Definition: refiners.py:55

tracking.harvest.refiners.SaveClassificationAnalysisRefiner
Definition: refiners.py:549

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.truth_name
truth_name
cached truth-values-collection name for this truth-classification analysis
Definition: refiners.py:581

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.cut
cut
cached threshold of estimates for this truth-classification analysis
Definition: refiners.py:584

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.contact
contact
cached contact person for this truth-classification analysis
Definition: refiners.py:577

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.upper_bound
upper_bound
cached upper bound of estimates for this truth-classification analysis
Definition: refiners.py:591

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.outlier_z_score
outlier_z_score
cached Z-score (for outlier detection) of estimates for this truth-classification analysis
Definition: refiners.py:593

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.allow_discrete
allow_discrete
cached discrete-value flag of estimates for this truth-classification analysis
Definition: refiners.py:595

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.unit
unit
cached measurement unit of estimates for this truth-classification analysis
Definition: refiners.py:597

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.estimate_name
estimate_name
cached estimates-collection name for this truth-classification analysis
Definition: refiners.py:579

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.cut_direction
cut_direction
cached cut direction (> or <) of estimates for this truth-classification analysis
Definition: refiners.py:586

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.__init__
def __init__(self, part_name=None, contact=None, estimate_name=None, truth_name=None, cut_direction=None, cut=None, lower_bound=None, upper_bound=None, outlier_z_score=None, allow_discrete=False, unit=None)
Definition: refiners.py:571

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.default_estimate_name
str default_estimate_name
default name for the truth-classification analysis estimates collection
Definition: refiners.py:558

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.part_name
part_name
cached part name for this truth-classification analysis
Definition: refiners.py:575

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.default_truth_name
str default_truth_name
default name for the truth-classification analysis truth-values collection
Definition: refiners.py:556

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:605

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.lower_bound
lower_bound
cached lower bound of estimates for this truth-classification analysis
Definition: refiners.py:589

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.default_contact
str default_contact
default contact person for this truth-classification analysis
Definition: refiners.py:553

tracking.harvest.refiners.SaveFiguresOfMeritRefiner
Definition: refiners.py:74

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.title
title
cached title of the figure of merit
Definition: refiners.py:113

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.description
description
cached description of the figure of merit
Definition: refiners.py:116

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.contact
contact
cached contact person of the figure of merit
Definition: refiners.py:120

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.__init__
def __init__(self, name=None, title=None, contact=None, description=None, check=None, key=None, aggregation=None)
Definition: refiners.py:105

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_name
str default_name
default name for this refiner
Definition: refiners.py:77

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.mean
def mean(xs)
return the mean of the parts, ignoring NaNs
Definition: refiners.py:91

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_description
str default_description
default description for this refiner
Definition: refiners.py:83

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_aggregation
def default_aggregation
default aggregation is the mean of the parts
Definition: refiners.py:95

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_key
str default_key
default key name for this refiner
Definition: refiners.py:87

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_check
str default_check
default user-check action for this refiner
Definition: refiners.py:85

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.aggregation
aggregation
cached copy of the crops-aggregation method
Definition: refiners.py:125

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_title
str default_title
default title for this refiner
Definition: refiners.py:79

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.key
key
cached copy of the figures-of-merit key
Definition: refiners.py:123

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.name
name
cached name of the figure of merit
Definition: refiners.py:111

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:133

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.check
check
cached user-check action of the figure of merit
Definition: refiners.py:118

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_contact
str default_contact
default contact person for this refiner
Definition: refiners.py:81

tracking.harvest.refiners.SaveHistogramsRefiner
Definition: refiners.py:180

tracking.harvest.refiners.SaveHistogramsRefiner.title
title
cached user-defined title for this histogram
Definition: refiners.py:214

tracking.harvest.refiners.SaveHistogramsRefiner.description
description
cached user-defined description for this histogram
Definition: refiners.py:217

tracking.harvest.refiners.SaveHistogramsRefiner.contact
contact
cached user-defined contact person for this histogram
Definition: refiners.py:221

tracking.harvest.refiners.SaveHistogramsRefiner.fit
fit
cached fit for this histogram
Definition: refiners.py:238

tracking.harvest.refiners.SaveHistogramsRefiner.upper_bound
upper_bound
cached upper bound for this histogram
Definition: refiners.py:226

tracking.harvest.refiners.SaveHistogramsRefiner.outlier_z_score
outlier_z_score
cached Z-score (for outlier detection) for this histogram
Definition: refiners.py:231

tracking.harvest.refiners.SaveHistogramsRefiner.default_name
str default_name
default name for this histogram
Definition: refiners.py:183

tracking.harvest.refiners.SaveHistogramsRefiner.allow_discrete
allow_discrete
cached flag to allow discrete values for this histogram
Definition: refiners.py:233

tracking.harvest.refiners.SaveHistogramsRefiner.__init__
def __init__(self, name=None, title=None, contact=None, description=None, check=None, lower_bound=None, upper_bound=None, bins=None, outlier_z_score=None, allow_discrete=False, stackby="", fit=None, fit_z_score=None)
Definition: refiners.py:206

tracking.harvest.refiners.SaveHistogramsRefiner.fit_z_score
fit_z_score
cached fit Z-score (for outlier detection) for this histogram
Definition: refiners.py:240

tracking.harvest.refiners.SaveHistogramsRefiner.stackby
stackby
cached stacking selection for this histogram
Definition: refiners.py:235

tracking.harvest.refiners.SaveHistogramsRefiner.default_description
str default_description
default description for this histogram
Definition: refiners.py:189

tracking.harvest.refiners.SaveHistogramsRefiner.default_check
str default_check
default user-check action for this histogram
Definition: refiners.py:191

tracking.harvest.refiners.SaveHistogramsRefiner.default_title
str default_title
default title for this histogram
Definition: refiners.py:185

tracking.harvest.refiners.SaveHistogramsRefiner.name
name
cached user-defined name for this histogram
Definition: refiners.py:212

tracking.harvest.refiners.SaveHistogramsRefiner.bins
bins
cached number of bins for this histogram
Definition: refiners.py:228

tracking.harvest.refiners.SaveHistogramsRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:248

tracking.harvest.refiners.SaveHistogramsRefiner.lower_bound
lower_bound
cached lower bound for this histogram
Definition: refiners.py:224

tracking.harvest.refiners.SaveHistogramsRefiner.check
check
cached user-defined user-check action for this histogram
Definition: refiners.py:219

tracking.harvest.refiners.SaveHistogramsRefiner.default_contact
str default_contact
default contact person for this histogram
Definition: refiners.py:187

tracking.harvest.refiners.SaveProfilesRefiner
Definition: refiners.py:515

tracking.harvest.refiners.SavePullAnalysisRefiner
Definition: refiners.py:657

tracking.harvest.refiners.SavePullAnalysisRefiner.variance_name
variance_name
cached name for the pull analysis variances collection
Definition: refiners.py:712

tracking.harvest.refiners.SavePullAnalysisRefiner.truth_name
truth_name
cached name for the pull analysis truth-values collection
Definition: refiners.py:708

tracking.harvest.refiners.SavePullAnalysisRefiner.default_variance_name
str default_variance_name
default name for the pull analysis variances collection
Definition: refiners.py:672

tracking.harvest.refiners.SavePullAnalysisRefiner.quantity_name
quantity_name
cached name of the quantity for the pull analysis
Definition: refiners.py:715

tracking.harvest.refiners.SavePullAnalysisRefiner.contact
contact
cached contact person for this pull analysis
Definition: refiners.py:695

tracking.harvest.refiners.SavePullAnalysisRefiner.outlier_z_score
outlier_z_score
cached Z-score (for outlier detection) for the pull analysis
Definition: refiners.py:723

tracking.harvest.refiners.SavePullAnalysisRefiner.default_name
str default_name
default name for this pull analysis
Definition: refiners.py:661

tracking.harvest.refiners.SavePullAnalysisRefiner.part_names
part_names
cached array of part names for this pull analysis
Definition: refiners.py:700

tracking.harvest.refiners.SavePullAnalysisRefiner.unit
unit
cached measurement unit for the pull analysis
Definition: refiners.py:717

tracking.harvest.refiners.SavePullAnalysisRefiner.aux_names
aux_names
cached auxiliary names for the pull analysis
Definition: refiners.py:720

tracking.harvest.refiners.SavePullAnalysisRefiner.estimate_name
estimate_name
cached name for the pull analysis estimates collection
Definition: refiners.py:710

tracking.harvest.refiners.SavePullAnalysisRefiner.title_postfix
title_postfix
cached suffix for the title of this pull analysis
Definition: refiners.py:697

tracking.harvest.refiners.SavePullAnalysisRefiner.__init__
def __init__(self, name=None, contact=None, title_postfix=None, part_name=None, part_names=None, truth_name=None, estimate_name=None, variance_name=None, quantity_name=None, aux_names=None, unit=None, outlier_z_score=None, absolute=False, which_plots=None)
Definition: refiners.py:688

tracking.harvest.refiners.SavePullAnalysisRefiner.default_title_postfix
str default_title_postfix
default suffix for the title of this pull analysis
Definition: refiners.py:665

tracking.harvest.refiners.SavePullAnalysisRefiner.default_estimate_name
str default_estimate_name
default name for the pull analysis estimates collection
Definition: refiners.py:670

tracking.harvest.refiners.SavePullAnalysisRefiner.name
name
cached name for this pull analysis
Definition: refiners.py:693

tracking.harvest.refiners.SavePullAnalysisRefiner.default_truth_name
str default_truth_name
default name for the pull analysis truth-values collection
Definition: refiners.py:668

tracking.harvest.refiners.SavePullAnalysisRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:735

tracking.harvest.refiners.SavePullAnalysisRefiner.which_plots
which_plots
cached list of plots produced by the pull analysis
Definition: refiners.py:727

tracking.harvest.refiners.SavePullAnalysisRefiner.absolute
absolute
cached absolute-value-comparison flag for the pull analysis
Definition: refiners.py:725

tracking.harvest.refiners.SavePullAnalysisRefiner.default_contact
str default_contact
default contact person for this pull analysis
Definition: refiners.py:663

tracking.harvest.refiners.SaveScatterRefiner
Definition: refiners.py:532

tracking.harvest.refiners.SaveTreeRefiner
Definition: refiners.py:817

tracking.harvest.refiners.SaveTreeRefiner.title
title
cached title for this TTree
Definition: refiners.py:834

tracking.harvest.refiners.SaveTreeRefiner.default_name
str default_name
default name for this TTree
Definition: refiners.py:821

tracking.harvest.refiners.SaveTreeRefiner.__init__
def __init__(self, name=None, title=None)
Definition: refiners.py:827

tracking.harvest.refiners.SaveTreeRefiner.add_branch
def add_branch(self, output_ttree, part_name, parts)
Definition: refiners.py:867

tracking.harvest.refiners.SaveTreeRefiner.default_title
str default_title
default title for this TTree
Definition: refiners.py:823

tracking.harvest.refiners.SaveTreeRefiner.name
name
cached name for this TTree
Definition: refiners.py:832

tracking.harvest.refiners.SaveTreeRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:842

tracking.harvest.refiners.SelectRefiner
Definition: refiners.py:917

tracking.harvest.refiners.SelectRefiner.__init__
def __init__(self, wrapped_refiner, select=None, exclude=None)
Definition: refiners.py:920

tracking.harvest.refiners.SelectRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:927

tracking.harvest.refiners.SelectRefiner.refine
def refine(self, harvesting_module, crops, *args, **kwds)
Definition: refiners.py:933

tracking.harvest.refiners.SelectRefiner.exclude
exclude
cached value of the exclusion flag
Definition: refiners.py:931

tracking.harvest.refiners.SelectRefiner.select
select
cached value of the selector
Definition: refiners.py:929

tracking.validation.classification.ClassificationAnalysis
Definition: classification.py:25

tracking.validation.fom.ValidationFiguresOfMerit
Definition: fom.py:19

tracking.validation.plot.ValidationPlot
Definition: plot.py:159

tracking.validation.pull.PullAnalysis
Definition: pull.py:26

tracking.root_utils
Definition: root_utils.py:1

tracking.validation.classification
Definition: classification.py:1

tracking.validation.fom
Definition: fom.py:1

tracking.validation.plot
Definition: plot.py:1

tracking.validation.pull
Definition: pull.py:1

tracking.validation.tolerate_missing_key_formatter
Definition: tolerate_missing_key_formatter.py:1