release-08-01-10/doxygen/refiners_8py_source.html

 import functools

 import numpy as np

 import collections

 import copy


 from tracking.validation.plot import ValidationPlot, compose_axis_label

 from tracking.validation.fom import ValidationFiguresOfMerit

 from tracking.validation.classification import ClassificationAnalysis

 from tracking.validation.pull import PullAnalysis

 from tracking.validation.tolerate_missing_key_formatter import TolerateMissingKeyFormatter

 from tracking.root_utils import root_cd, root_save_name


 import ROOT


 import logging


 def get_logger():
     """Return the logger that is registered under this module's name."""
     module_logger = logging.getLogger(__name__)
     return module_logger


 # Module-level formatter instance shared by the refiners in this file; they
 # call formatter.format(...) to fill in their name/title/description templates.
 formatter = TolerateMissingKeyFormatter()


 class Refiner(object):
     """Callable wrapper that applies a refiner function to harvested crops.

     An instance can be used in three ways, all of which end up in `refine`:

     * called with only a harvesting module, it appends itself to the module's
       ``refiners`` list and returns the module (decoration mode),
     * called with a harvesting module and crops, it refines the crops,
     * accessed as an attribute of a harvesting module instance, it yields a
       callable that already has that module bound as first argument.
     """

     def __init__(self, refiner_function=None):
         """Store the function that does the refinement.

         Parameters
         ----------
         refiner_function : callable, optional
             Invoked by `refine` as
             ``refiner_function(harvesting_module, *args, **kwds)``.
         """
         # Function delegated to by refine(). Subclasses that override
         # refine() construct the base with the default None.
         self.refiner_function = refiner_function

     def __get__(self, harvesting_module, cls=None):
         """Descriptor access: bind the refiner to a harvesting module.

         Returns the refiner itself on class access and a callable with the
         harvesting module pre-bound as first argument on instance access.
         """
         if harvesting_module is None:
             # Class access
             return self

         # Instance access
         refine = self.refine

         def bound_call(*args, **kwds):
             return refine(harvesting_module, *args, **kwds)

         return bound_call

     def __call__(self, harvesting_module, crops=None, *args, **kwds):
         """Decorate a harvesting module or refine its crops.

              r = Refiner()
              r(harvester) # decoration
              r(harvester, crops, args, keywords) # refinement

         Without crops the refiner is appended to ``harvesting_module.refiners``
         and the module is returned. With crops the call is forwarded to
         `refine` and its result is returned.
         """
         if crops is None:
             # Decoration mode
             harvesting_module.refiners.append(self)
             return harvesting_module

         # Refining mode
         return self.refine(harvesting_module, crops, *args, **kwds)

     def refine(self, harvesting_module, *args, **kwds):
         """Apply the instance's refiner function to the given arguments."""
         self.refiner_function(harvesting_module, *args, **kwds)


 class SaveFiguresOfMeritRefiner(Refiner):
     """Refiner that aggregates every crop part into one figure of merit.

     Each part of the crops is reduced with the aggregation function and stored
     in a `ValidationFiguresOfMerit` object, which is printed and, if a
     directory is given, written to it. All text attributes are templates that
     are filled by the module-level ``formatter``.
     """

     # Template for the name of the figures of merit object
     default_name = "{module.id}_figures_of_merit{groupby_key}"

     # Template for the title
     default_title = "Figures of merit in {module.title}"

     # Template for the contact
     default_contact = "{module.contact}"

     # Template for the description
     default_description = "Figures of merit are the {aggregation.__name__} of {keys}"

     # Template for the check instruction
     default_check = "Check for reasonable values"

     # Template for the key under which each aggregated part is stored
     default_key = "{aggregation.__name__}_{part_name}"

     @staticmethod
     def mean(xs):
         """Return the mean of xs ignoring NaN entries (``np.nanmean``)."""
         return np.nanmean(xs)

     # Aggregation used when none is passed to the constructor
     default_aggregation = mean

     def __init__(self,
                  name=None,
                  title=None,
                  contact=None,
                  description=None,
                  check=None,
                  key=None,
                  aggregation=None,
                  ):
         """Constructor for this refiner.

         Every argument left at None (or otherwise falsy) is replaced by the
         corresponding ``default_*`` class attribute when `refine` runs.
         """
         super(SaveFiguresOfMeritRefiner, self).__init__()

         # Name template of the figures of merit object
         self.name = name
         # Title template
         self.title = title
         # Description template
         self.description = description
         # Check template
         self.check = check
         # Contact template
         self.contact = contact
         # Template of the key for each aggregated part
         self.key = key
         # Callable reducing the values of one part to a single value
         self.aggregation = aggregation

     def refine(self,
                harvesting_module,
                crops,
                tdirectory=None,
                groupby_part_name=None,
                groupby_value=None,
                **kwds):
         """Aggregate all parts of the crops and save the figures of merit.

         The result is written to ``tdirectory`` if one is given and is always
         printed. Additional keyword arguments are accepted and ignored.
         """
         name = self.name or self.default_name
         title = self.title or self.default_title
         contact = self.contact or self.default_contact
         description = self.description or self.default_description
         check = self.check or self.default_check
         key_template = self.key or self.default_key

         aggregation = self.aggregation or self.default_aggregation

         replacement_dict = dict(
             refiner=self,
             module=harvesting_module,
             aggregation=aggregation,
             groupby_key='_' + groupby_part_name + groupby_value if groupby_part_name else "",
             groupby=groupby_part_name,  # deprecated
             groupby_value=groupby_value,  # deprecated
         )

         name = formatter.format(name, **replacement_dict)
         title = formatter.format(title, **replacement_dict)
         contact = formatter.format(contact, **replacement_dict)

         figures_of_merit = ValidationFiguresOfMerit(name,
                                                     contact=contact,
                                                     title=title)

         for part_name, parts in iter_items_sorted_for_key(crops):
             key = formatter.format(key_template, part_name=part_name, **replacement_dict)
             figures_of_merit[key] = aggregation(parts)

         # The description and check templates may refer to the collected keys,
         # hence they are formatted only after the aggregation loop.
         keys = list(figures_of_merit.keys())

         description = formatter.format(description, keys=keys, **replacement_dict)
         check = formatter.format(check, keys=keys, **replacement_dict)

         figures_of_merit.description = description
         figures_of_merit.check = check

         if tdirectory:
             figures_of_merit.write(tdirectory)

         print(figures_of_merit)


 class SaveHistogramsRefiner(Refiner):
     """Refiner that creates one histogram per crop part.

     For every part of the crops a `ValidationPlot` is filled through its
     ``hist`` method, optionally fitted, and written to the given directory.
     All text attributes are templates filled by the module-level
     ``formatter``.
     """

     # Template for the histogram name
     default_name = "{module.id}_{part_name}_histogram{groupby_key}{stackby_key}"

     # Template for the histogram title
     default_title = "Histogram of {part_name}{groupby_key}{stackby_key} from {module.title}"

     # Template for the contact
     default_contact = "{module.contact}"

     # Template for the description
     default_description = "This is a histogram of {part_name}{groupby_key}{stackby_key}."

     # Template for the check instruction
     default_check = "Check if the distribution is reasonable"

     def __init__(self,
                  name=None,
                  title=None,
                  contact=None,
                  description=None,
                  check=None,
                  lower_bound=None,
                  upper_bound=None,
                  bins=None,
                  outlier_z_score=None,
                  allow_discrete=False,
                  stackby="",
                  fit=None,
                  fit_z_score=None):
         """Constructor for this refiner.

         ``name``, ``title``, ``contact``, ``description`` and ``check`` are
         templates that fall back to the ``default_*`` class attributes.
         ``lower_bound``, ``upper_bound``, ``bins``, ``outlier_z_score`` and
         ``allow_discrete`` are forwarded to ``ValidationPlot.hist``.
         ``stackby`` names the crop part handed to ``hist`` as ``stackby``.
         ``fit`` selects a fit (see `refine`) and ``fit_z_score`` is passed to
         it as ``z_score`` when not None.
         """
         super(SaveHistogramsRefiner, self).__init__()

         # Name template of the histograms
         self.name = name
         # Title template
         self.title = title
         # Description template
         self.description = description
         # Check template
         self.check = check
         # Contact template
         self.contact = contact

         # Options forwarded to ValidationPlot.hist
         self.lower_bound = lower_bound
         self.upper_bound = upper_bound
         self.bins = bins
         self.outlier_z_score = outlier_z_score
         self.allow_discrete = allow_discrete

         # Name of the crop part to stack the histograms by
         self.stackby = stackby

         # Name of the fit to apply and its optional z-score argument
         self.fit = fit
         self.fit_z_score = fit_z_score

     def refine(self,
                harvesting_module,
                crops,
                tdirectory=None,
                groupby_part_name=None,
                groupby_value=None,
                **kwds):
         """Create, optionally fit and save a histogram for each crop part.

         If ``fit`` is set, the plot method ``fit_<fit>`` is called when it
         exists; otherwise the generic ``fit`` method of the plot is called
         with the fit name as first argument. Additional keyword arguments are
         accepted and ignored.
         """
         stackby = self.stackby
         if stackby:
             stackby_parts = crops[stackby]
         else:
             stackby_parts = None

         replacement_dict = dict(
             refiner=self,
             module=harvesting_module,
             stackby_key=' stacked by ' + stackby if stackby else "",
             groupby_key=' in group ' + groupby_part_name + groupby_value if groupby_part_name else "",
         )

         contact = self.contact or self.default_contact
         contact = formatter.format(contact, **replacement_dict)

         for part_name, parts in iter_items_sorted_for_key(crops):
             name = self.name or self.default_name
             title = self.title or self.default_title
             description = self.description or self.default_description
             check = self.check or self.default_check

             name = formatter.format(name, part_name=part_name, **replacement_dict)
             title = formatter.format(title, part_name=part_name, **replacement_dict)
             description = formatter.format(description, part_name=part_name, **replacement_dict)
             check = formatter.format(check, part_name=part_name, **replacement_dict)

             histogram = ValidationPlot(name)
             histogram.hist(parts,
                            lower_bound=self.lower_bound,
                            upper_bound=self.upper_bound,
                            bins=self.bins,
                            outlier_z_score=self.outlier_z_score,
                            allow_discrete=self.allow_discrete,
                            stackby=stackby_parts)

             histogram.title = title
             histogram.contact = contact
             histogram.description = description
             histogram.check = check

             histogram.xlabel = compose_axis_label(part_name)

             if self.fit:
                 # Use a dedicated name so the **kwds parameter is not clobbered.
                 if self.fit_z_score is None:
                     fit_kwds = dict()
                 else:
                     fit_kwds = dict(z_score=self.fit_z_score)

                 fit_method_name = 'fit_' + str(self.fit)
                 try:
                     fit_method = getattr(histogram, fit_method_name)
                 except AttributeError:
                     # No specialised fit method; fall back to the generic one.
                     histogram.fit(str(self.fit), **fit_kwds)
                 else:
                     fit_method(**fit_kwds)

             if tdirectory:
                 histogram.write(tdirectory)


 class Plot2DRefiner(Refiner):
     """Refiner for profile histograms and 2D scatterplots.

     For every combination of a selected y part and a selected x part a
     `ValidationPlot` is created, filled according to ``plot_kind`` and written
     to the given directory. The ``default_name``, ``default_title``,
     ``default_contact``, ``default_description`` and ``default_check``
     templates read by `refine` are not defined on this class; the subclasses
     in this file provide them.
     """

     # Kind of plot to produce: "profile" or "scatter"
     plot_kind = "profile"

     def __init__(self,
                  y,
                  x=None,
                  name=None,
                  title=None,
                  contact=None,
                  description=None,
                  check=None,
                  stackby=None,
                  y_unit=None,
                  y_binary=None,
                  y_log=None,
                  lower_bound=None,
                  upper_bound=None,
                  bins=None,
                  outlier_z_score=None,
                  fit=None,
                  fit_z_score=None,
                  skip_single_valued=False,
                  allow_discrete=False):
         """Constructor for this refiner.

         ``y`` and ``x`` are selections passed to ``select_crop_parts`` to pick
         the parts for the y and x axis; parts selected for y are excluded from
         x. ``name``, ``title``, ``contact``, ``description`` and ``check`` are
         templates falling back to the ``default_*`` class attributes. The
         remaining options are forwarded to the plotting and fitting calls in
         `refine`. With ``skip_single_valued`` set, combinations in which x or
         y holds only one distinct value are skipped.
         """
         super().__init__()

         # Name template of the plots
         self.name = name
         # Title template
         self.title = title
         # Description template
         self.description = description
         # Check template
         self.check = check
         # Contact template
         self.contact = contact

         # Selection of the parts for the x axis
         self.x = x
         # Selection of the parts for the y axis
         self.y = y
         # Name of the crop part to stack the plots by
         self.stackby = stackby
         # Unit passed to compose_axis_label for the y axis
         self.y_unit = y_unit

         # Options forwarded to the plotting call
         self.lower_bound = lower_bound
         self.upper_bound = upper_bound
         self.bins = bins
         self.y_binary = y_binary
         self.y_log = y_log
         self.outlier_z_score = outlier_z_score
         self.allow_discrete = allow_discrete

         # Name of the fit to apply to profiles and its optional z-score
         self.fit = fit
         self.fit_z_score = fit_z_score

         # Whether to skip combinations with a single-valued x or y part
         self.skip_single_valued = skip_single_valued

     def refine(self,
                harvesting_module,
                crops,
                tdirectory=None,
                groupby_part_name=None,
                groupby_value=None,
                **kwds):
         """Create and save a profile or scatter plot for each (y, x) pair.

         Fits are only applied for ``plot_kind == "profile"``: the plot method
         ``fit_<fit>`` is called when it exists, otherwise the generic ``fit``
         method with the fit name as first argument. Additional keyword
         arguments are accepted and ignored.
         """
         stackby = self.stackby
         if stackby:
             stackby_parts = crops[stackby]
         else:
             stackby_parts = None

         replacement_dict = dict(
             refiner=self,
             module=harvesting_module,
             stackby_key=' stacked by ' + stackby if stackby else "",
             groupby_key=' in group ' + groupby_part_name + groupby_value if groupby_part_name else "",
         )

         contact = self.contact or self.default_contact
         contact = formatter.format(contact, **replacement_dict)

         y_crops = select_crop_parts(crops, select=self.y)
         x_crops = select_crop_parts(crops, select=self.x, exclude=self.y)

         for y_part_name, y_parts in iter_items_sorted_for_key(y_crops):
             for x_part_name, x_parts in iter_items_sorted_for_key(x_crops):

                 if self.skip_single_valued and not self.has_more_than_one_value(x_parts):
                     get_logger().info('Skipping "%s" by "%s" profile because x has only a single value "%s"',
                                       y_part_name,
                                       x_part_name,
                                       x_parts[0])
                     continue

                 if self.skip_single_valued and not self.has_more_than_one_value(y_parts):
                     get_logger().info('Skipping "%s" by "%s" profile because y has only a single value "%s"',
                                       y_part_name,
                                       x_part_name,
                                       y_parts[0])
                     continue

                 name = self.name or self.default_name
                 title = self.title or self.default_title
                 description = self.description or self.default_description
                 check = self.check or self.default_check

                 name = formatter.format(name,
                                         x_part_name=x_part_name,
                                         y_part_name=y_part_name,
                                         **replacement_dict)

                 title = formatter.format(title,
                                          x_part_name=x_part_name,
                                          y_part_name=y_part_name,
                                          **replacement_dict)

                 description = formatter.format(description,
                                                x_part_name=x_part_name,
                                                y_part_name=y_part_name,
                                                **replacement_dict)

                 check = formatter.format(check,
                                          x_part_name=x_part_name,
                                          y_part_name=y_part_name,
                                          **replacement_dict)

                 profile_plot = ValidationPlot(name)

                 plot_kind = self.plot_kind
                 if plot_kind == "profile":
                     profile_plot.profile(x_parts,
                                          y_parts,
                                          lower_bound=self.lower_bound,
                                          upper_bound=self.upper_bound,
                                          bins=self.bins,
                                          y_binary=self.y_binary,
                                          y_log=self.y_log,
                                          outlier_z_score=self.outlier_z_score,
                                          allow_discrete=self.allow_discrete,
                                          stackby=stackby_parts)

                     if self.fit:
                         # Use a dedicated name so the **kwds parameter is not clobbered.
                         if self.fit_z_score is None:
                             fit_kwds = dict()
                         else:
                             fit_kwds = dict(z_score=self.fit_z_score)

                         fit_method_name = 'fit_' + str(self.fit)
                         try:
                             fit_method = getattr(profile_plot, fit_method_name)
                         except AttributeError:
                             # Only a missing specialised fit method triggers the
                             # generic fallback; interrupts and other errors propagate.
                             profile_plot.fit(str(self.fit), **fit_kwds)
                         else:
                             fit_method(**fit_kwds)

                 elif plot_kind == "scatter":
                     profile_plot.scatter(x_parts,
                                          y_parts,
                                          lower_bound=self.lower_bound,
                                          upper_bound=self.upper_bound,
                                          outlier_z_score=self.outlier_z_score,
                                          stackby=stackby_parts)

                 profile_plot.title = title
                 profile_plot.contact = contact
                 profile_plot.description = description
                 profile_plot.check = check

                 profile_plot.xlabel = compose_axis_label(x_part_name)
                 profile_plot.ylabel = compose_axis_label(y_part_name, self.y_unit)

                 if tdirectory:
                     profile_plot.write(tdirectory)

     @staticmethod
     def has_more_than_one_value(xs):
         """Check if any element of xs compares unequal to the first element.

         Indexes ``xs[0]``, so an empty sequence raises ``IndexError``.
         """
         first_x = xs[0]
         return any(x != first_x for x in xs)


 class SaveProfilesRefiner(Plot2DRefiner):
     """Plot2DRefiner specialisation that produces profile histograms."""

     # Selects the profile branch of Plot2DRefiner.refine
     plot_kind = "profile"

     # Contact template
     default_contact = "{module.contact}"

     # Name template of the profile plots
     default_name = "{module.id}_{y_part_name}_by_{x_part_name}_profile{groupby_key}{stackby_key}"

     # Title template
     default_title = "Profile of {y_part_name} by {x_part_name} from {module.title}"

     # Description template
     default_description = "This is a profile of {y_part_name} over {x_part_name}."

     # Check template
     default_check = "Check if the trend line is reasonable."


 class SaveScatterRefiner(Plot2DRefiner):
     """Plot2DRefiner specialisation that produces 2D scatter plots."""

     # Selects the scatter branch of Plot2DRefiner.refine
     plot_kind = "scatter"

     # Contact template
     default_contact = "{module.contact}"

     # Name template of the scatter plots
     default_name = "{module.id}_{y_part_name}_by_{x_part_name}_scatter{groupby_key}{stackby_key}"

     # Title template
     default_title = "Scatter of {y_part_name} by {x_part_name} from {module.title}"

     # Description template
     default_description = "This is a scatter of {y_part_name} over {x_part_name}."

     # Check template
     default_check = "Check if the distributions is reasonable."


 class SaveClassificationAnalysisRefiner(Refiner):
     """Refiner for truth-classification analyses.

     For every estimate name a `ClassificationAnalysis` is run on the estimate
     and truth parts of the crops and written to the given directory.
     """

     # Contact template
     default_contact = "{module.contact}"

     # Template for the name of the crop part holding the truth
     default_truth_name = "{part_name}_truth"

     # Template for the name of the crop part holding the estimate
     default_estimate_name = "{part_name}_estimate"

     def __init__(self,
                  part_name=None,
                  contact=None,
                  estimate_name=None,
                  truth_name=None,
                  cut_direction=None,
                  cut=None,
                  lower_bound=None,
                  upper_bound=None,
                  outlier_z_score=None,
                  allow_discrete=False,
                  unit=None):
         """Constructor for this refiner.

         ``part_name`` fills the ``{part_name}`` placeholder of the truth and
         estimate name templates. ``estimate_name`` may be a single template
         string or an iterable of them. ``truth_name`` and ``estimate_name``
         fall back to the ``default_*`` class attributes when None. The
         remaining options are forwarded to `ClassificationAnalysis`.
         """
         # Initialise the base class like the sibling refiners do.
         super(SaveClassificationAnalysisRefiner, self).__init__()

         # Value for the {part_name} placeholder
         self.part_name = part_name
         # Contact template
         self.contact = contact
         # Template(s) for the estimate part name(s)
         self.estimate_name = estimate_name
         # Template for the truth part name
         self.truth_name = truth_name

         # Options forwarded to ClassificationAnalysis
         self.cut = cut
         self.cut_direction = cut_direction
         self.lower_bound = lower_bound
         self.upper_bound = upper_bound
         self.outlier_z_score = outlier_z_score
         self.allow_discrete = allow_discrete
         self.unit = unit

     def refine(self,
                harvesting_module,
                crops,
                tdirectory=None,
                groupby_part_name=None,
                groupby_value=None,
                **kwds):
         """Run and save a classification analysis for each estimate.

         Raises ``KeyError``-style lookup errors from ``crops`` if the truth
         or an estimate part is missing. Additional keyword arguments are
         accepted and ignored.
         """
         replacement_dict = dict(
             refiner=self,
             module=harvesting_module,
             groupby_key='_' + groupby_part_name + groupby_value if groupby_part_name else "",
             groupby=groupby_part_name,  # deprecated
             groupby_value=groupby_value,  # deprecated
         )

         contact = self.contact or self.default_contact
         contact = formatter.format(contact, **replacement_dict)

         if self.truth_name is not None:
             truth_name = self.truth_name
         else:
             truth_name = self.default_truth_name

         truth_name = formatter.format(truth_name, part_name=self.part_name)
         truths = crops[truth_name]

         if self.estimate_name is not None:
             estimate_name = self.estimate_name
         else:
             estimate_name = self.default_estimate_name

         # Accept a single template as well as a collection of templates.
         if isinstance(estimate_name, str):
             estimate_names = [estimate_name, ]
         else:
             estimate_names = estimate_name

         for estimate_template in estimate_names:
             estimate_name = formatter.format(estimate_template, part_name=self.part_name)
             estimates = crops[estimate_name]

             classification_analysis = ClassificationAnalysis(quantity_name=estimate_name,
                                                              contact=contact,
                                                              cut_direction=self.cut_direction,
                                                              cut=self.cut,
                                                              lower_bound=self.lower_bound,
                                                              upper_bound=self.upper_bound,
                                                              outlier_z_score=self.outlier_z_score,
                                                              allow_discrete=self.allow_discrete,
                                                              unit=self.unit)

             classification_analysis.analyse(estimates, truths)

             if tdirectory:
                 classification_analysis.write(tdirectory)


 class SavePullAnalysisRefiner(Refiner):
     """Refiner for pull analyses.

     For every configured part name a `PullAnalysis` is run on the truth,
     estimate and (if present) variance parts of the crops and written to the
     given directory.
     """

     # Name template of the analysis plots
     default_name = "{module.id}_{quantity_name}"

     # Contact template
     default_contact = "{module.contact}"

     # Template appended to the plot titles
     default_title_postfix = " from {module.title}"

     # Template for the name of the crop part holding the truth
     default_truth_name = "{part_name}_truth"

     # Template for the name of the crop part holding the estimate
     default_estimate_name = "{part_name}_estimate"

     # Template for the name of the crop part holding the variance
     default_variance_name = "{part_name}_variance"

     def __init__(self,
                  name=None,
                  contact=None,
                  title_postfix=None,
                  part_name=None,
                  part_names=None,
                  truth_name=None,
                  estimate_name=None,
                  variance_name=None,
                  quantity_name=None,
                  aux_names=None,
                  unit=None,
                  outlier_z_score=None,
                  absolute=False,
                  which_plots=None):
         """Constructor for this refiner.

         ``part_names`` and ``part_name`` together give the parts to analyse;
         ``part_name`` is appended after the entries of ``part_names``. The
         ``*_name`` templates fall back to the ``default_*`` class attributes
         when None. ``aux_names`` selects auxiliary crop parts handed to the
         analysis. The remaining options are forwarded to `PullAnalysis`.
         """
         # Initialise the base class like the sibling refiners do.
         super(SavePullAnalysisRefiner, self).__init__()

         if aux_names is None:
             aux_names = []

         # Name template of the analysis plots
         self.name = name
         # Contact template
         self.contact = contact
         # Template appended to the plot titles
         self.title_postfix = title_postfix

         # Part names to analyse. Copy the given sequence so that appending
         # part_name below does not modify the caller's list.
         self.part_names = list(part_names) if part_names is not None else []
         if part_name is not None:
             self.part_names.append(part_name)

         # Templates for the truth, estimate and variance part names
         self.truth_name = truth_name
         self.estimate_name = estimate_name
         self.variance_name = variance_name

         # Name of the analysed quantity; the part name is used when falsy
         self.quantity_name = quantity_name
         # Unit forwarded to PullAnalysis
         self.unit = unit
         # Selection of auxiliary crop parts
         self.aux_names = aux_names
         # Options forwarded to PullAnalysis
         self.outlier_z_score = outlier_z_score
         self.absolute = absolute
         # Forwarded to PullAnalysis.analyse
         self.which_plots = which_plots

     def refine(self,
                harvesting_module,
                crops,
                tdirectory=None,
                groupby_part_name=None,
                groupby_value=None,
                **kwds):
         """Run and save a pull analysis for each configured part name.

         A missing variance part (``KeyError``) is tolerated and passed on as
         None; missing truth or estimate parts are not handled. Additional
         keyword arguments are accepted and ignored.
         """
         replacement_dict = dict(
             refiner=self,
             module=harvesting_module,
             groupby_key='_' + groupby_part_name + groupby_value if groupby_part_name else "",
             groupby=groupby_part_name,  # deprecated
             groupby_value=groupby_value,  # deprecated
         )

         contact = self.contact or self.default_contact
         contact = formatter.format(contact, **replacement_dict)

         # Keep the unformatted template: it has to be formatted afresh for
         # every part name, otherwise all parts would reuse the first name.
         name_template = self.name or self.default_name

         title_postfix_template = self.title_postfix
         if title_postfix_template is None:
             title_postfix_template = self.default_title_postfix

         if self.truth_name is not None:
             truth_name_template = self.truth_name
         else:
             truth_name_template = self.default_truth_name

         if self.estimate_name is not None:
             estimate_name_template = self.estimate_name
         else:
             estimate_name_template = self.default_estimate_name

         if self.variance_name is not None:
             variance_name_template = self.variance_name
         else:
             variance_name_template = self.default_variance_name

         if self.aux_names:
             auxiliaries = select_crop_parts(crops, self.aux_names)
         else:
             auxiliaries = {}

         for part_name in self.part_names:
             name = formatter.format(name_template, part_name=part_name, **replacement_dict)
             # The remaining placeholders are passed on unformatted to PullAnalysis.
             plot_name = name + "_{subplot_name}"

             title_postfix = formatter.format(title_postfix_template, part_name=part_name, **replacement_dict)
             plot_title = "{subplot_title} of {quantity_name}" + title_postfix

             truth_name = formatter.format(truth_name_template, part_name=part_name)
             estimate_name = formatter.format(estimate_name_template, part_name=part_name)
             variance_name = formatter.format(variance_name_template, part_name=part_name)

             truths = crops[truth_name]
             estimates = crops[estimate_name]
             try:
                 variances = crops[variance_name]
             except KeyError:
                 # The variance part is optional.
                 variances = None

             quantity_name = self.quantity_name or part_name

             pull_analysis = PullAnalysis(quantity_name,
                                          unit=self.unit,
                                          absolute=self.absolute,
                                          outlier_z_score=self.outlier_z_score,
                                          plot_name=plot_name,
                                          plot_title=plot_title)

             pull_analysis.analyse(truths,
                                   estimates,
                                   variances,
                                   auxiliaries=auxiliaries,
                                   which_plots=self.which_plots)

             pull_analysis.contact = contact

             if tdirectory:
                 pull_analysis.write(tdirectory)


 class SaveTreeRefiner(Refiner):
     """Refiner that stores the crops in a ROOT TTree.

     Every part of the crops becomes one branch of type double (``/D``).
     """

     # Name template of the tree
     default_name = "{module.id}_tree"

     # Title template of the tree
     default_title = "Tree of {module.id}"

     def __init__(self,
                  name=None,
                  title=None):
         """Constructor for this refiner.

         ``name`` and ``title`` are templates that fall back to the
         ``default_*`` class attributes when falsy.
         """
         super(SaveTreeRefiner, self).__init__()

         # Name template of the tree
         self.name = name
         # Title template of the tree
         self.title = title

     def refine(self,
                harvesting_module,
                crops,
                tdirectory=None,
                groupby_part_name=None,
                groupby_value=None,
                **kwds):
         """Create the TTree inside ``tdirectory``, fill it and write it.

         Additional keyword arguments are accepted and ignored.
         """
         replacement_dict = dict(
             refiner=self,
             module=harvesting_module,
             groupby_key='_' + groupby_part_name + groupby_value if groupby_part_name else "",
             groupby=groupby_part_name,  # deprecated
             groupby_value=groupby_value,  # deprecated
         )

         with root_cd(tdirectory):
             name = self.name or self.default_name
             title = self.title or self.default_title

             name = formatter.format(name, **replacement_dict)
             title = formatter.format(title, **replacement_dict)

             output_ttree = ROOT.TTree(root_save_name(name), title)
             for part_name, parts in iter_items_sorted_for_key(crops):
                 self.add_branch(output_ttree, part_name, parts)

             output_ttree.FlushBaskets()
             output_ttree.Write()

     def add_branch(self, output_ttree, part_name, parts):
         """Add a TBranch named ``part_name`` to the TTree and fill it with ``parts``."""
         # One-element buffer that the branch reads its value from on each fill.
         input_value = np.zeros(1, dtype=float)

         branch_type_spec = '%s/D' % part_name
         tbranch = output_ttree.Branch(part_name, input_value, branch_type_spec)

         if output_ttree.GetNbranches() == 1:
             # On filling of the first branch we need to use the fill method of the TTree
             # For all other branches we can use the one of the branch
             # #justrootthings
             for value in parts:
                 input_value[0] = value
                 output_ttree.Fill()

         else:
             for value in parts:
                 input_value[0] = value
                 tbranch.Fill()

         output_ttree.GetEntry(0)
         output_ttree.ResetBranchAddress(tbranch)
         also_subbranches = True  # No subbranches here but we drop the buffers just in case.
         output_ttree.DropBranchFromCache(tbranch, also_subbranches)


 class FilterRefiner(Refiner):
     """Refiner that filters the crops before handing them to another refiner."""

     def __init__(self, wrapped_refiner, filter=None, on=None):
         """Constructor for this refiner.

         Parameters
         ----------
         wrapped_refiner : callable
             Called as ``wrapped_refiner(harvesting_module, filtered_crops, ...)``.
         filter : callable, optional
             Filter passed to ``filter_crops``; defaults to ``np.nonzero``.
         on : optional
             Passed to ``filter_crops`` as ``part_name``.
         """
         # Initialise the base class like the sibling refiners do.
         super(FilterRefiner, self).__init__()

         # Refiner that receives the filtered crops
         self.wrapped_refiner = wrapped_refiner

         # Filter handed to filter_crops
         if filter is None:
             self.filter = np.nonzero
         else:
             self.filter = filter

         # Part name handed to filter_crops
         self.on = on

     def refine(self, harvesting_module, crops, *args, **kwds):
         """Filter the crops and forward them with all other arguments to the wrapped refiner."""
         filtered_crops = filter_crops(crops, self.filter, part_name=self.on)
         self.wrapped_refiner(harvesting_module, filtered_crops, *args, **kwds)


 class SelectRefiner(Refiner):
     """Refiner that selects parts of the crops before handing them to another refiner."""

     def __init__(self, wrapped_refiner, select=None, exclude=None):
         """Constructor for this refiner.

         Parameters
         ----------
         wrapped_refiner : callable
             Called as ``wrapped_refiner(harvesting_module, selected_crops, ...)``.
         select : optional
             Passed to ``select_crop_parts`` as ``select``; defaults to an empty list.
         exclude : optional
             Passed to ``select_crop_parts`` as ``exclude``; defaults to an empty list.
         """
         # Initialise the base class like the sibling refiners do.
         super(SelectRefiner, self).__init__()

         if select is None:
             select = []
         if exclude is None:
             exclude = []

         # Refiner that receives the selected crops
         self.wrapped_refiner = wrapped_refiner

         # Selection handed to select_crop_parts
         self.select = select

         # Exclusion handed to select_crop_parts
         self.exclude = exclude

     def refine(self, harvesting_module, crops, *args, **kwds):
         """Select the crop parts and forward them with all other arguments to the wrapped refiner."""
         selected_crops = select_crop_parts(crops, select=self.select, exclude=self.exclude)
         self.wrapped_refiner(harvesting_module, selected_crops, *args, **kwds)


 class GroupByRefiner(Refiner):
     """Refiner for grouping

     Splits the crops into groups according to the ``by`` specification and
     calls the wrapped refiner once per non-empty group.
     """

     # default value of the exclude-by classifier
     default_exclude_by = True

     def __init__(self,
                  wrapped_refiner,
                  by=None,
                  exclude_by=None):
         """Constructor for this refiner

         Parameters:
             wrapped_refiner: callable invoked for every group
             by: a single group-by specification or a list of them; each
                 specification is None (no grouping), a part name (group by
                 unique values) or a tuple ``(part_name, cuts)`` (group by bins)
             exclude_by: whether the group-by part is removed from the crops
                 handed on; ``default_exclude_by`` is used if None
         """
         if by is None:
             by = []

         # cached value of the wrapped refiner
         self.wrapped_refiner = wrapped_refiner

         # cached value of the group-by classifier
         self.by = by

         # cached value of the exclude-by classifier
         self.exclude_by = exclude_by if exclude_by is not None else self.default_exclude_by

     def refine(self,
                harvesting_module,
                crops,
                groupby_part_name=None,
                groupby_value=None,
                *args,
                **kwds):
         """Process this grouping

         The incoming ``groupby_part_name`` and ``groupby_value`` are not used;
         they are replaced by the values determined for each group.

         Raises:
             ValueError: if a group-by specification is neither None, a string
                 nor a tuple
         """
         by = self.by

         # A single name to do the group by: wrap it into a list and continue
         # with the general case
         if isinstance(by, str) or by is None:
             by = [by, ]

         for groupby_spec in by:
             if groupby_spec is None:
                 # No grouping requested: hand over all crops and use None as
                 # groupby_value to indicate that all values have been selected
                 self.wrapped_refiner(harvesting_module,
                                      crops,
                                      *args,
                                      groupby_part_name=None,
                                      groupby_value=None,
                                      **kwds)
                 continue

             elif isinstance(groupby_spec, str):
                 part_name = groupby_spec
                 groupby_parts = crops[part_name]
                 unique_values, index_of_values = np.unique(groupby_parts, return_inverse=True)
                 # NOTE(review): the trailing "]" in the label looks unintended,
                 # but it is kept since the label is handed on to the wrapped refiner.
                 groupby_values = [" = {value}]".format(value=value) for value in unique_values]

             elif isinstance(groupby_spec, tuple):
                 part_name = groupby_spec[0]
                 cuts = groupby_spec[1]

                 groupby_parts = crops[part_name]

                 # Close the binning with +inf so that only values which do not
                 # compare below any cut (nan) end up behind the last bin.
                 # An empty cut list is accepted as well.
                 digitization_cuts = list(np.sort(cuts))
                 if not digitization_cuts or digitization_cuts[-1] != np.inf:
                     digitization_cuts.append(np.inf)
                 index_of_values = np.digitize(groupby_parts, digitization_cuts, right=True)

                 # One label per index returned by np.digitize
                 groupby_values = ["below {upper_bound}".format(upper_bound=digitization_cuts[0])]
                 for lower_bound, upper_bound in zip(digitization_cuts, digitization_cuts[1:]):
                     if lower_bound == upper_bound:
                         # degenerated bin case
                         groupby_values.append("= {lower_bound}".format(lower_bound=lower_bound))
                     elif upper_bound == np.inf:
                         groupby_values.append("above {lower_bound}".format(lower_bound=lower_bound))
                     else:
                         groupby_values.append("between {lower_bound} and {upper_bound}".format(lower_bound=lower_bound,
                                                                                                upper_bound=upper_bound))
                 groupby_values.append("is nan")
                 assert len(groupby_values) == len(digitization_cuts) + 1

             else:
                 raise ValueError("Unknown groupby specification %s" % groupby_spec)

             # Exclude the groupby variable if desired
             selected_crops = select_crop_parts(crops, exclude=part_name if self.exclude_by else None)
             for index_of_value, groupby_value in enumerate(groupby_values):
                 indices_for_value = index_of_values == index_of_value
                 # Skip groups without any entry
                 if not np.any(indices_for_value):
                     continue

                 filtered_crops = filter_crops(selected_crops, indices_for_value)

                 self.wrapped_refiner(harvesting_module,
                                      filtered_crops,
                                      *args,
                                      groupby_part_name=part_name,
                                      groupby_value=groupby_value,
                                      **kwds)


 class CdRefiner(Refiner):
     """Refiner for change-directory

     Calls the wrapped refiner inside a (sub)directory whose name is built
     from the folder name template and the active groupby selection.
     """

     # Folder name used if no folder name is given and no groupby value is active
     default_folder_name = ""

     # Default suffix for a groupby selection
     default_groupby_addition = "_groupby_{groupby}_{groupby_value}"

     def __init__(self,
                  wrapped_refiner,
                  folder_name=None,
                  groupby_addition=None):
         """Constructor for this refiner

         Parameters:
             wrapped_refiner: callable invoked inside the directory
             folder_name: template of the folder name; may refer to
                 ``{groupby_addition}``, ``{groupby}`` and ``{groupby_value}``
             groupby_addition: template of the groupby suffix; may refer to
                 ``{groupby}`` and ``{groupby_value}``
         """
         # cached value of the wrapped refiner
         self.wrapped_refiner = wrapped_refiner

         # cached value of the folder name
         self.folder_name = folder_name

         # cached value of the suffix for a groupby selection
         self.groupby_addition = groupby_addition

     def refine(self,
                harvesting_module,
                crops,
                tdirectory=None,
                groupby_part_name=None,
                groupby_value=None,
                *args,
                **kwds):
         """Process the change-directory

         Formats the folder name, enters ``tdirectory`` and the folder below it
         and calls the wrapped refiner with the entered folder as ``tdirectory``.
         """
         folder_name = self.folder_name
         if folder_name is None:
             if groupby_value is not None:
                 # Without an explicit name the folder is named after the group
                 folder_name = "{groupby_addition}"
             else:
                 folder_name = self.default_folder_name

         groupby_addition = self.groupby_addition
         if groupby_addition is None:
             groupby_addition = self.default_groupby_addition

         if groupby_part_name is None and groupby_value is None:
             # No groupby active: no suffix at all
             groupby_addition = ""
         else:
             groupby_addition = formatter.format(groupby_addition,
                                                 groupby=groupby_part_name,
                                                 groupby_value=groupby_value)

         folder_name = formatter.format(folder_name,
                                        groupby_addition=groupby_addition,
                                        groupby=groupby_part_name,
                                        groupby_value=groupby_value)

         # Convert every path component separately so the "/" separators survive
         folder_name = '/'.join(root_save_name(name) for name in folder_name.split('/'))

         with root_cd(tdirectory):
             with root_cd(folder_name) as tdirectory:
                 self.wrapped_refiner(harvesting_module,
                                      crops,
                                      *args,
                                      tdirectory=tdirectory,
                                      groupby_part_name=groupby_part_name,
                                      groupby_value=groupby_value,
                                      **kwds)


 class ExpertLevelRefiner(Refiner):
     """Refiner for expert-level categorization

     Calls the wrapped refiner only if the expert level of the harvesting
     module lies within the configured exclusive bounds.
     """

     def __init__(self, wrapped_refiner, above_expert_level=None, below_expert_level=None):
         """Constructor for this refiner

         Parameters:
             wrapped_refiner: callable invoked if the expert level matches
             above_expert_level: refine only if the module's expert level is
                 strictly greater than this value; no lower limit if None
             below_expert_level: refine only if the module's expert level is
                 strictly less than this value; no upper limit if None
         """
         # cached value of the wrapped refiner
         self.wrapped_refiner = wrapped_refiner

         # cached value of the exclusive lower bound of the expert level
         self.above_expert_level = above_expert_level

         # cached value of the exclusive upper bound of the expert level
         self.below_expert_level = below_expert_level

     def refine(self, harvesting_module, crops, *args, **kwds):
         """Process the expert-level categorization"""
         above_expert_level = self.above_expert_level
         below_expert_level = self.below_expert_level

         proceed = True
         if above_expert_level is not None:
             proceed = proceed and harvesting_module.expert_level > above_expert_level

         if below_expert_level is not None:
             proceed = proceed and harvesting_module.expert_level < below_expert_level

         if proceed:
             self.wrapped_refiner(harvesting_module, crops, *args, **kwds)


 # Meta refiner decorators

 def groupby(refiner=None, **kwds):
     """Wrap a refiner into a GroupByRefiner.

     Called without a refiner, a decorator is returned that performs the
     wrapping; otherwise the refiner is wrapped right away. All keyword
     arguments are passed on to the GroupByRefiner constructor.
     """
     def group_decorator(wrapped_refiner):
         return GroupByRefiner(wrapped_refiner, **kwds)

     return group_decorator if refiner is None else group_decorator(refiner)


 def select(refiner=None, **kwds):
     """Wrap a refiner into a SelectRefiner.

     Called without a refiner, a decorator is returned that performs the
     wrapping; otherwise the refiner is wrapped right away. All keyword
     arguments are passed on to the SelectRefiner constructor.
     """
     def select_decorator(wrapped_refiner):
         return SelectRefiner(wrapped_refiner, **kwds)

     return select_decorator if refiner is None else select_decorator(refiner)


 def filter(refiner=None, **kwds):
     """Wrap a refiner into a FilterRefiner.

     Called without a refiner, a decorator is returned that performs the
     wrapping; otherwise the refiner is wrapped right away. All keyword
     arguments are passed on to the FilterRefiner constructor.
     """
     def filter_decorator(wrapped_refiner):
         return FilterRefiner(wrapped_refiner, **kwds)

     return filter_decorator if refiner is None else filter_decorator(refiner)


 def cd(refiner=None, **kwds):
     """Wrap a refiner into a CdRefiner.

     Called without a refiner, a decorator is returned that performs the
     wrapping; otherwise the refiner is wrapped right away. All keyword
     arguments are passed on to the CdRefiner constructor.
     """
     def cd_decorator(wrapped_refiner):
         return CdRefiner(wrapped_refiner, **kwds)

     return cd_decorator if refiner is None else cd_decorator(refiner)


 def context(refiner=None,
             above_expert_level=None, below_expert_level=None,
             folder_name=None, folder_groupby_addition=None,
             filter=None, filter_on=None,
             groupby=None, exclude_groupby=None,
             select=None, exclude=None):
     """Stack the requested meta refiners around a refiner.

     Only those meta refiners are added for which at least one of the
     related arguments is given. Called without a refiner, the decorator
     doing the stacking is returned instead.
     """

     def is_given(*values):
         # True as soon as one of the values has been set by the caller
         return any(value is not None for value in values)

     def context_decorator(wrapped_refiner):
         # Apply meta refiners in the reverse order that they shall be executed
         stacked = wrapped_refiner

         if is_given(exclude, select):
             stacked = SelectRefiner(stacked, select=select, exclude=exclude)

         # A groupby needs a directory change as well to separate the groups
         if is_given(folder_name, groupby, folder_groupby_addition):
             stacked = CdRefiner(stacked,
                                 folder_name=folder_name,
                                 groupby_addition=folder_groupby_addition)

         if is_given(groupby):
             stacked = GroupByRefiner(stacked, by=groupby, exclude_by=exclude_groupby)

         if is_given(filter, filter_on):
             stacked = FilterRefiner(stacked, filter=filter, on=filter_on)

         if is_given(above_expert_level, below_expert_level):
             stacked = ExpertLevelRefiner(stacked,
                                          above_expert_level=above_expert_level,
                                          below_expert_level=below_expert_level)

         # Plain functions are promoted to a Refiner
         if not isinstance(stacked, Refiner):
             stacked = Refiner(stacked)

         return stacked

     if refiner is None:
         return context_decorator

     return functools.wraps(refiner)(context_decorator(refiner))


 def refiner_with_context(refiner_factory):
     """Extend a refiner factory by the keyword arguments of ``context``.

     The returned function splits off the context related keyword arguments,
     creates the refiner from the remaining ones with the factory and wraps
     it by means of ``context``.
     """
     @functools.wraps(refiner_factory)
     def module_decorator_with_context(above_expert_level=None, below_expert_level=None,
                                       folder_name=None, folder_groupby_addition=None,
                                       filter=None, filter_on=None,
                                       groupby=None, exclude_groupby=None,
                                       select=None, exclude=None,
                                       **kwds_for_refiner_factory):
         # Everything that is not a context option belongs to the factory
         bare_refiner = refiner_factory(**kwds_for_refiner_factory)

         context_options = dict(
             above_expert_level=above_expert_level,
             below_expert_level=below_expert_level,
             folder_name=folder_name,
             folder_groupby_addition=folder_groupby_addition,
             filter=filter,
             filter_on=filter_on,
             groupby=groupby,
             exclude_groupby=exclude_groupby,
             select=select,
             exclude=exclude,
         )
         return context(bare_refiner, **context_options)

     return module_decorator_with_context


 @refiner_with_context
 def save_fom(**kwds):
     """Create a SaveFiguresOfMeritRefiner from the given keyword arguments."""
     fom_refiner = SaveFiguresOfMeritRefiner(**kwds)
     return fom_refiner


 @refiner_with_context
 def save_histograms(**kwds):
     """Create a SaveHistogramsRefiner from the given keyword arguments."""
     histograms_refiner = SaveHistogramsRefiner(**kwds)
     return histograms_refiner


 @refiner_with_context
 def save_profiles(**kwds):
     """Create a SaveProfilesRefiner from the given keyword arguments."""
     profiles_refiner = SaveProfilesRefiner(**kwds)
     return profiles_refiner


 @refiner_with_context
 def save_scatters(**kwds):
     """Create a SaveScatterRefiner from the given keyword arguments."""
     scatter_refiner = SaveScatterRefiner(**kwds)
     return scatter_refiner


 @refiner_with_context
 def save_classification_analysis(**kwds):
     """Create a SaveClassificationAnalysisRefiner from the given keyword arguments."""
     classification_refiner = SaveClassificationAnalysisRefiner(**kwds)
     return classification_refiner


 @refiner_with_context
 def save_pull_analysis(**kwds):
     """Create a SavePullAnalysisRefiner from the given keyword arguments."""
     pull_refiner = SavePullAnalysisRefiner(**kwds)
     return pull_refiner


 @refiner_with_context
 def save_tree(**kwds):
     """Create a SaveTreeRefiner from the given keyword arguments."""
     tree_refiner = SaveTreeRefiner(**kwds)
     return tree_refiner


 def select_crop_parts(crops, select=None, exclude=None):
     """Restrict the crops to a selection of their parts.

     Parameters:
         crops: mutable mapping from part names to parts
         select: part name, list of part names or mapping from part names to
             new part names; the keys of such a mapping may also be callables
             which are called with the crops as keyword arguments and whose
             result is stored under the new part name
         exclude: part name or list of part names to be dropped

     Returns:
         The crops object itself if neither a selection nor an exclusion is
         given, otherwise a shallow copy containing only the remaining parts.

     Raises:
         ValueError: if the crops are not a mutable mapping
     """
     # The abstract base classes have to be taken from collections.abc;
     # their aliases in the collections namespace were removed in Python 3.10.
     from collections.abc import Callable, Mapping, MutableMapping

     if not isinstance(crops, MutableMapping):
         raise ValueError("Unrecognised crop %s of type %s" % (crops, type(crops)))

     if select is None:
         select = []
     if exclude is None:
         exclude = []

     # A single name is a short hand for a list of one name
     if isinstance(select, str):
         select = [select, ]
     if isinstance(exclude, str):
         exclude = [exclude, ]

     if not select and not exclude:
         return crops

     part_names = list(crops.keys())
     dropped_part_names = set()

     if select:
         dropped_part_names.update(name for name in part_names if name not in select)

         # if the selection item is a callable function do not count it as not selectable yet
         select_not_in_part_names = [name for name in select
                                     if not isinstance(name, Callable) and name not in part_names]
         if select_not_in_part_names:
             get_logger().warning("Cannot select %s, because they are not in crop part names %s",
                                  select_not_in_part_names, sorted(part_names))

     if exclude:
         dropped_part_names.update(name for name in part_names if name in exclude)

     # Make a shallow copy to leave the crops of the caller untouched
     selected_crops = copy.copy(crops)
     for part_name in dropped_part_names:
         del selected_crops[part_name]

     if isinstance(select, Mapping):
         # select is a rename mapping
         for part_name, new_part_name in list(select.items()):
             if isinstance(part_name, Callable):
                 # Computed part: evaluated on the complete, unselected crops
                 selected_crops[new_part_name] = part_name(**crops)
             elif part_name in selected_crops:
                 selected_crops[new_part_name] = selected_crops.pop(part_name)

     return selected_crops


 def filter_crops(crops, filter_function, part_name=None):
     """Reduce the crops to the entries picked by a filter.

     Parameters:
         crops: numpy array or mutable mapping from part names to indexable parts
         filter_function: either a numpy array that is used directly as index,
             or a callable that is applied to ``crops[part_name]`` and returns
             the index
         part_name: key of the part the callable filter is evaluated on

     Returns:
         The indexed array for array crops, otherwise a shallow copy of the
         crops in which every part has been indexed.

     Raises:
         ValueError: if the crops are neither a numpy array nor a mutable mapping
     """
     # The abstract base classes have to be taken from collections.abc;
     # their aliases in the collections namespace were removed in Python 3.10.
     from collections.abc import MutableMapping

     if isinstance(filter_function, np.ndarray):
         filter_indices = filter_function
     else:
         filter_indices = filter_function(crops[part_name])

     if isinstance(crops, np.ndarray):
         return crops[filter_indices]

     if isinstance(crops, MutableMapping):
         # Make a shallow copy to leave the crops of the caller untouched
         filtered_crops = copy.copy(crops)
         for name, parts in list(crops.items()):
             filtered_crops[name] = parts[filter_indices]
         return filtered_crops

     raise ValueError("Unrecognised crop %s of type %s" % (crops, type(crops)))


 def iter_items_sorted_for_key(crops):
     """Iterate over the (key, value) pairs of the crops.

     Plain dictionaries (and subclasses) are traversed in the order of their
     sorted keys. For every other type the order of its ``items()`` is kept,
     since such a class has to take care of the sorting itself.
     """
     if not isinstance(crops, dict):
         return list(crops.items())

     ordered_keys = sorted(crops.keys())
     return ((key, crops[key]) for key in ordered_keys)

tracking.harvest.refiners.CdRefiner
Definition: refiners.py:1040

tracking.harvest.refiners.CdRefiner.__init__
def __init__(self, wrapped_refiner, folder_name=None, groupby_addition=None)
Definition: refiners.py:1051

tracking.harvest.refiners.CdRefiner.folder_name
folder_name
cached value of the folder name
Definition: refiners.py:1057

tracking.harvest.refiners.CdRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, *args, **kwds)
Definition: refiners.py:1068

tracking.harvest.refiners.CdRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:1055

tracking.harvest.refiners.CdRefiner.default_groupby_addition
string default_groupby_addition
Default suffix for a groupby selection.
Definition: refiners.py:1046

tracking.harvest.refiners.CdRefiner.groupby_addition
groupby_addition
cached value of the suffix for a groupby selection
Definition: refiners.py:1059

tracking.harvest.refiners.CdRefiner.default_folder_name
string default_folder_name
Folder name to be used if no folder name is given and no groupby selection is active.
Definition: refiners.py:1044

tracking.harvest.refiners.ExpertLevelRefiner
Definition: refiners.py:1108

tracking.harvest.refiners.ExpertLevelRefiner.below_expert_level
below_expert_level
cached value of the exclusive upper bound of the expert level (refine only below this level)
Definition: refiners.py:1119

tracking.harvest.refiners.ExpertLevelRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:1115

tracking.harvest.refiners.ExpertLevelRefiner.refine
def refine(self, harvesting_module, crops, *args, **kwds)
Definition: refiners.py:1121

tracking.harvest.refiners.ExpertLevelRefiner.__init__
def __init__(self, wrapped_refiner, above_expert_level=None, below_expert_level=None)
Definition: refiners.py:1111

tracking.harvest.refiners.ExpertLevelRefiner.above_expert_level
above_expert_level
cached value of the exclusive lower bound of the expert level (refine only above this level)
Definition: refiners.py:1117

tracking.harvest.refiners.FilterRefiner
Definition: refiners.py:893

tracking.harvest.refiners.FilterRefiner.on
on
cached value of the part name to filter on
Definition: refiners.py:909

tracking.harvest.refiners.FilterRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:900

tracking.harvest.refiners.FilterRefiner.refine
def refine(self, harvesting_module, crops, *args, **kwds)
Definition: refiners.py:911

tracking.harvest.refiners.FilterRefiner.filter
filter
cached value of the filter
Definition: refiners.py:904

tracking.harvest.refiners.FilterRefiner.__init__
def __init__(self, wrapped_refiner, filter=None, on=None)
Definition: refiners.py:896

tracking.harvest.refiners.GroupByRefiner
Definition: refiners.py:939

tracking.harvest.refiners.GroupByRefiner.by
by
cached value of the group-by classifier
Definition: refiners.py:955

tracking.harvest.refiners.GroupByRefiner.__init__
def __init__(self, wrapped_refiner, by=None, exclude_by=None)
Definition: refiners.py:948

tracking.harvest.refiners.GroupByRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:953

tracking.harvest.refiners.GroupByRefiner.exclude_by
exclude_by
cached value of the exclude-by classifier
Definition: refiners.py:957

tracking.harvest.refiners.GroupByRefiner.default_exclude_by
bool default_exclude_by
default value of the exclude-by classifier
Definition: refiners.py:943

tracking.harvest.refiners.GroupByRefiner.refine
def refine(self, harvesting_module, crops, groupby_part_name=None, groupby_value=None, *args, **kwds)
Definition: refiners.py:965

tracking.harvest.refiners.Plot2DRefiner
Definition: refiners.py:312

tracking.harvest.refiners.Plot2DRefiner.title
title
cached user-defined title for this profile histogram / scatterplot
Definition: refiners.py:344

tracking.harvest.refiners.Plot2DRefiner.y_log
y_log
cached flag for logarithmic y axis for this profile histogram / scatterplot
Definition: refiners.py:371

tracking.harvest.refiners.Plot2DRefiner.description
description
cached user-defined description for this profile histogram / scatterplot
Definition: refiners.py:347

tracking.harvest.refiners.Plot2DRefiner.contact
contact
cached user-defined contact person for this profile histogram / scatterplot
Definition: refiners.py:351

tracking.harvest.refiners.Plot2DRefiner.fit
fit
cached fit for this profile histogram / scatterplot
Definition: refiners.py:379

tracking.harvest.refiners.Plot2DRefiner.upper_bound
upper_bound
cached upper bound for this profile histogram / scatterplot
Definition: refiners.py:365

tracking.harvest.refiners.Plot2DRefiner.y
y
cached value of ordinate
Definition: refiners.py:356

tracking.harvest.refiners.Plot2DRefiner.outlier_z_score
outlier_z_score
cached Z-score (for outlier detection) for this profile histogram / scatterplot
Definition: refiners.py:374

tracking.harvest.refiners.Plot2DRefiner.y_binary
y_binary
cached flag for probability y axis (range 0.0 .. 1.0) for this profile histogram / scatterplot
Definition: refiners.py:369

tracking.harvest.refiners.Plot2DRefiner.skip_single_valued
skip_single_valued
cached flag to skip single-valued bins for this profile histogram / scatterplot
Definition: refiners.py:384

tracking.harvest.refiners.Plot2DRefiner.allow_discrete
allow_discrete
cached flag to allow discrete values for this profile histogram / scatterplot
Definition: refiners.py:376

tracking.harvest.refiners.Plot2DRefiner.fit_z_score
fit_z_score
cached fit Z-score (for outlier detection) for this profile histogram / scatterplot
Definition: refiners.py:381

tracking.harvest.refiners.Plot2DRefiner.stackby
stackby
cached stacking selection for this profile histogram / scatterplot
Definition: refiners.py:358

tracking.harvest.refiners.Plot2DRefiner.y_unit
y_unit
cached measurement unit for ordinate
Definition: refiners.py:360

tracking.harvest.refiners.Plot2DRefiner.__init__
def __init__(self, y, x=None, name=None, title=None, contact=None, description=None, check=None, stackby=None, y_unit=None, y_binary=None, y_log=None, lower_bound=None, upper_bound=None, bins=None, outlier_z_score=None, fit=None, fit_z_score=None, skip_single_valued=False, allow_discrete=False)
Definition: refiners.py:336

tracking.harvest.refiners.Plot2DRefiner.x
x
cached value of abscissa
Definition: refiners.py:354

tracking.harvest.refiners.Plot2DRefiner.plot_kind
string plot_kind
by default, this refiner is for profile histograms
Definition: refiners.py:315

tracking.harvest.refiners.Plot2DRefiner.has_more_than_one_value
def has_more_than_one_value(xs)
Definition: refiners.py:505

tracking.harvest.refiners.Plot2DRefiner.name
name
cached user-defined name for this profile histogram / scatterplot
Definition: refiners.py:342

tracking.harvest.refiners.Plot2DRefiner.bins
bins
cached number of bins for this profile histogram / scatterplot
Definition: refiners.py:367

tracking.harvest.refiners.Plot2DRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:392

tracking.harvest.refiners.Plot2DRefiner.lower_bound
lower_bound
cached lower bound for this profile histogram / scatterplot
Definition: refiners.py:363

tracking.harvest.refiners.Plot2DRefiner.check
check
cached user-defined user-check action for this profile histogram / scatterplot
Definition: refiners.py:349

tracking.harvest.refiners.Refiner
Definition: refiners.py:34

tracking.harvest.refiners.Refiner.refiner_function
refiner_function
cached copy of the instance's refiner function
Definition: refiners.py:40

tracking.harvest.refiners.Refiner.__init__
def __init__(self, refiner_function=None)
Definition: refiners.py:37

tracking.harvest.refiners.Refiner.refine
def refine(self, harvesting_module, *args, **kwds)
Definition: refiners.py:69

tracking.harvest.refiners.Refiner.__get__
def __get__(self, harvesting_module, cls=None)
Definition: refiners.py:42

tracking.harvest.refiners.Refiner.__call__
def __call__(self, harvesting_module, crops=None, *args, **kwds)
Definition: refiners.py:55

tracking.harvest.refiners.SaveClassificationAnalysisRefiner
Definition: refiners.py:549

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.truth_name
truth_name
cached truth-values-collection name for this truth-classification analysis
Definition: refiners.py:581

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.cut
cut
cached threshold of estimates for this truth-classification analysis
Definition: refiners.py:584

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.contact
contact
cached contact person for this truth-classification analysis
Definition: refiners.py:577

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.upper_bound
upper_bound
cached upper bound of estimates for this truth-classification analysis
Definition: refiners.py:591

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.outlier_z_score
outlier_z_score
cached Z-score (for outlier detection) of estimates for this truth-classification analysis
Definition: refiners.py:593

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.allow_discrete
allow_discrete
cached discrete-value flag of estimates for this truth-classification analysis
Definition: refiners.py:595

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.unit
unit
cached measurement unit of estimates for this truth-classification analysis
Definition: refiners.py:597

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.default_truth_name
string default_truth_name
default name for the truth-classification analysis truth-values collection
Definition: refiners.py:556

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.estimate_name
estimate_name
cached estimates-collection name for this truth-classification analysis
Definition: refiners.py:579

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.default_estimate_name
string default_estimate_name
default name for the truth-classification analysis estimates collection
Definition: refiners.py:558

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.cut_direction
cut_direction
cached cut direction (> or <) of estimates for this truth-classification analysis
Definition: refiners.py:586

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.__init__
def __init__(self, part_name=None, contact=None, estimate_name=None, truth_name=None, cut_direction=None, cut=None, lower_bound=None, upper_bound=None, outlier_z_score=None, allow_discrete=False, unit=None)
Definition: refiners.py:571

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.part_name
part_name
cached part name for this truth-classification analysis
Definition: refiners.py:575

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.default_contact
string default_contact
default contact person for this truth-classification analysis
Definition: refiners.py:553

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:605

tracking.harvest.refiners.SaveClassificationAnalysisRefiner.lower_bound
lower_bound
cached lower bound of estimates for this truth-classification analysis
Definition: refiners.py:589

tracking.harvest.refiners.SaveFiguresOfMeritRefiner
Definition: refiners.py:74

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.title
title
cached title of the figure of merit
Definition: refiners.py:113

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.description
description
cached description of the figure of merit
Definition: refiners.py:116

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.contact
contact
cached contact person of the figure of merit
Definition: refiners.py:120

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.__init__
def __init__(self, name=None, title=None, contact=None, description=None, check=None, key=None, aggregation=None)
Definition: refiners.py:105

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_description
string default_description
default description for this refiner
Definition: refiners.py:83

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.mean
def mean(xs)
return the mean of the parts, ignoring NaNs
Definition: refiners.py:91

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_key
string default_key
default key name for this refiner
Definition: refiners.py:87

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_aggregation
def default_aggregation
default aggregation is the mean of the parts
Definition: refiners.py:95

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.aggregation
aggregation
cached copy of the crops-aggregation method
Definition: refiners.py:125

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_check
string default_check
default user-check action for this refiner
Definition: refiners.py:85

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_title
string default_title
default title for this refiner
Definition: refiners.py:79

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.key
key
cached copy of the figures-of-merit key
Definition: refiners.py:123

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.name
name
cached name of the figure of merit
Definition: refiners.py:111

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_contact
string default_contact
default contact person for this refiner
Definition: refiners.py:81

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.default_name
string default_name
default name for this refiner
Definition: refiners.py:77

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:133

tracking.harvest.refiners.SaveFiguresOfMeritRefiner.check
check
cached user-check action of the figure of merit
Definition: refiners.py:118

tracking.harvest.refiners.SaveHistogramsRefiner
Definition: refiners.py:180

tracking.harvest.refiners.SaveHistogramsRefiner.title
title
cached user-defined title for this histogram
Definition: refiners.py:214

tracking.harvest.refiners.SaveHistogramsRefiner.description
description
cached user-defined description for this histogram
Definition: refiners.py:217

tracking.harvest.refiners.SaveHistogramsRefiner.contact
contact
cached user-defined contact person for this histogram
Definition: refiners.py:221

tracking.harvest.refiners.SaveHistogramsRefiner.fit
fit
cached fit for this histogram
Definition: refiners.py:238

tracking.harvest.refiners.SaveHistogramsRefiner.upper_bound
upper_bound
cached upper bound for this histogram
Definition: refiners.py:226

tracking.harvest.refiners.SaveHistogramsRefiner.outlier_z_score
outlier_z_score
cached Z-score (for outlier detection) for this histogram
Definition: refiners.py:231

tracking.harvest.refiners.SaveHistogramsRefiner.allow_discrete
allow_discrete
cached flag to allow discrete values for this histogram
Definition: refiners.py:233

tracking.harvest.refiners.SaveHistogramsRefiner.default_description
string default_description
default description for this histogram
Definition: refiners.py:189

tracking.harvest.refiners.SaveHistogramsRefiner.__init__
def __init__(self, name=None, title=None, contact=None, description=None, check=None, lower_bound=None, upper_bound=None, bins=None, outlier_z_score=None, allow_discrete=False, stackby="", fit=None, fit_z_score=None)
Definition: refiners.py:206

tracking.harvest.refiners.SaveHistogramsRefiner.fit_z_score
fit_z_score
cached fit Z-score (for outlier detection) for this histogram
Definition: refiners.py:240

tracking.harvest.refiners.SaveHistogramsRefiner.stackby
stackby
cached stacking selection for this histogram
Definition: refiners.py:235

tracking.harvest.refiners.SaveHistogramsRefiner.default_check
string default_check
default user-check action for this histogram
Definition: refiners.py:191

tracking.harvest.refiners.SaveHistogramsRefiner.default_title
string default_title
default title for this histogram
Definition: refiners.py:185

tracking.harvest.refiners.SaveHistogramsRefiner.name
name
cached user-defined name for this histogram
Definition: refiners.py:212

tracking.harvest.refiners.SaveHistogramsRefiner.default_contact
string default_contact
default contact person for this histogram
Definition: refiners.py:187

tracking.harvest.refiners.SaveHistogramsRefiner.default_name
string default_name
default name for this histogram
Definition: refiners.py:183

tracking.harvest.refiners.SaveHistogramsRefiner.bins
bins
cached number of bins for this histogram
Definition: refiners.py:228

tracking.harvest.refiners.SaveHistogramsRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:248

tracking.harvest.refiners.SaveHistogramsRefiner.lower_bound
lower_bound
cached lower bound for this histogram
Definition: refiners.py:224

tracking.harvest.refiners.SaveHistogramsRefiner.check
check
cached user-defined user-check action for this histogram
Definition: refiners.py:219

tracking.harvest.refiners.SaveProfilesRefiner
Definition: refiners.py:515

tracking.harvest.refiners.SavePullAnalysisRefiner
Definition: refiners.py:657

tracking.harvest.refiners.SavePullAnalysisRefiner.variance_name
variance_name
cached name for the pull analysis variances collection
Definition: refiners.py:712

tracking.harvest.refiners.SavePullAnalysisRefiner.truth_name
truth_name
cached name for the pull analysis truth-values collection
Definition: refiners.py:708

tracking.harvest.refiners.SavePullAnalysisRefiner.default_variance_name
string default_variance_name
default name for the pull analysis variances collection
Definition: refiners.py:672

tracking.harvest.refiners.SavePullAnalysisRefiner.quantity_name
quantity_name
cached name of the quantity for the pull analysis
Definition: refiners.py:715

tracking.harvest.refiners.SavePullAnalysisRefiner.contact
contact
cached contact person for this pull analysis
Definition: refiners.py:695

tracking.harvest.refiners.SavePullAnalysisRefiner.outlier_z_score
outlier_z_score
cached Z-score (for outlier detection) for the pull analysis
Definition: refiners.py:723

tracking.harvest.refiners.SavePullAnalysisRefiner.part_names
part_names
cached array of part names for this pull analysis
Definition: refiners.py:700

tracking.harvest.refiners.SavePullAnalysisRefiner.unit
unit
cached measurement unit for the pull analysis
Definition: refiners.py:717

tracking.harvest.refiners.SavePullAnalysisRefiner.aux_names
aux_names
cached auxiliary names for the pull analysis
Definition: refiners.py:720

tracking.harvest.refiners.SavePullAnalysisRefiner.default_truth_name
string default_truth_name
default name for the pull analysis truth-values collection
Definition: refiners.py:668

tracking.harvest.refiners.SavePullAnalysisRefiner.estimate_name
estimate_name
cached name for the pull analysis estimates collection
Definition: refiners.py:710

tracking.harvest.refiners.SavePullAnalysisRefiner.default_estimate_name
string default_estimate_name
default name for the pull analysis estimates collection
Definition: refiners.py:670

tracking.harvest.refiners.SavePullAnalysisRefiner.title_postfix
title_postfix
cached suffix for the title of this pull analysis
Definition: refiners.py:697

tracking.harvest.refiners.SavePullAnalysisRefiner.__init__
def __init__(self, name=None, contact=None, title_postfix=None, part_name=None, part_names=None, truth_name=None, estimate_name=None, variance_name=None, quantity_name=None, aux_names=None, unit=None, outlier_z_score=None, absolute=False, which_plots=None)
Definition: refiners.py:688

tracking.harvest.refiners.SavePullAnalysisRefiner.name
name
cached name for this pull analysis
Definition: refiners.py:693

tracking.harvest.refiners.SavePullAnalysisRefiner.default_contact
string default_contact
default contact person for this pull analysis
Definition: refiners.py:663

tracking.harvest.refiners.SavePullAnalysisRefiner.default_name
string default_name
default name for this pull analysis
Definition: refiners.py:661

tracking.harvest.refiners.SavePullAnalysisRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:735

tracking.harvest.refiners.SavePullAnalysisRefiner.default_title_postfix
string default_title_postfix
default suffix for the title of this pull analysis
Definition: refiners.py:665

tracking.harvest.refiners.SavePullAnalysisRefiner.which_plots
which_plots
cached list of plots produced by the pull analysis
Definition: refiners.py:727

tracking.harvest.refiners.SavePullAnalysisRefiner.absolute
absolute
cached absolute-value-comparison flag for the pull analysis
Definition: refiners.py:725

tracking.harvest.refiners.SaveScatterRefiner
Definition: refiners.py:532

tracking.harvest.refiners.SaveTreeRefiner
Definition: refiners.py:817

tracking.harvest.refiners.SaveTreeRefiner.title
title
cached title for this TTree
Definition: refiners.py:834

tracking.harvest.refiners.SaveTreeRefiner.__init__
def __init__(self, name=None, title=None)
Definition: refiners.py:827

tracking.harvest.refiners.SaveTreeRefiner.add_branch
def add_branch(self, output_ttree, part_name, parts)
Definition: refiners.py:867

tracking.harvest.refiners.SaveTreeRefiner.default_title
string default_title
default title for this TTree
Definition: refiners.py:823

tracking.harvest.refiners.SaveTreeRefiner.name
name
cached name for this TTree
Definition: refiners.py:832

tracking.harvest.refiners.SaveTreeRefiner.default_name
string default_name
default name for this TTree
Definition: refiners.py:821

tracking.harvest.refiners.SaveTreeRefiner.refine
def refine(self, harvesting_module, crops, tdirectory=None, groupby_part_name=None, groupby_value=None, **kwds)
Definition: refiners.py:842

tracking.harvest.refiners.SelectRefiner
Definition: refiners.py:917

tracking.harvest.refiners.SelectRefiner.__init__
def __init__(self, wrapped_refiner, select=None, exclude=None)
Definition: refiners.py:920

tracking.harvest.refiners.SelectRefiner.wrapped_refiner
wrapped_refiner
cached value of the wrapped refiner
Definition: refiners.py:927

tracking.harvest.refiners.SelectRefiner.refine
def refine(self, harvesting_module, crops, *args, **kwds)
Definition: refiners.py:933

tracking.harvest.refiners.SelectRefiner.exclude
exclude
cached value of the exclusion flag
Definition: refiners.py:931

tracking.harvest.refiners.SelectRefiner.select
select
cached value of the selector
Definition: refiners.py:929

tracking.validation.classification.ClassificationAnalysis
Definition: classification.py:26

tracking.validation.fom.ValidationFiguresOfMerit
Definition: fom.py:20

tracking.validation.plot.ValidationPlot
Definition: plot.py:160

tracking.validation.pull.PullAnalysis
Definition: pull.py:27

Belle2::filter
std::map< ExpRun, std::pair< double, double > > filter(const std::map< ExpRun, std::pair< double, double >> &runs, double cut, std::map< ExpRun, std::pair< double, double >> &runsRemoved)
Filter events to remove runs shorter than cut; the removed runs are stored in runsRemoved.
Definition: Splitter.cc:38

tracking.root_utils
Definition: root_utils.py:1

tracking.validation.classification
Definition: classification.py:1

tracking.validation.fom
Definition: fom.py:1

tracking.validation.plot
Definition: plot.py:1

tracking.validation.pull
Definition: pull.py:1

tracking.validation.tolerate_missing_key_formatter
Definition: tolerate_missing_key_formatter.py:1