Belle II Software  light-2205-abys
BestCandidateSelectionModule.cc
1 /**************************************************************************
2  * basf2 (Belle II Analysis Software Framework) *
3  * Author: The Belle II Collaboration *
4  * *
5  * See git log for contributors and copyright holders. *
6  * This file is licensed under LGPL-3.0, see LICENSE.md. *
7  **************************************************************************/
8 
9 #include <analysis/modules/BestCandidateSelection/BestCandidateSelectionModule.h>
10 
11 #include <analysis/utility/ValueIndexPairSorting.h>
12 
13 #include <analysis/VariableManager/Utility.h>
14 
15 #include <framework/logging/Logger.h>
16 #include <framework/utilities/MakeROOTCompatible.h>
17 
18 using namespace std;
19 using namespace Belle2;
20 
21 
22 REG_MODULE(BestCandidateSelection);
23 
24 
25 BestCandidateSelectionModule::BestCandidateSelectionModule():
26  m_variable(nullptr)
27 {
28  //the "undefined order" bit is not strictly true in the current implementation, but details (with anti-particle lists) are tricky
29  setDescription(R"DOC(Sort particles by the value of a given ``variable``
30 in the input list and optionally remove particles after the nth position.
31 
32 Per default particles are sorted in descending order but it can be switched to
33 an ascending order by setting ``selectLowest=True``. The convenience functions
34 `modularAnalysis.rankByHighest` and `modularAnalysis.rankByLowest` set this
35 parameter automatically based on their names.
36 
37 Particles will receive an extra-info field containing their rank as an integer
38 starting at 1 (best). The name of this extra-info field defaults to
39 ``${variable}_rank`` but can be chosen freely using the ``outputVariable``
40 parameter.
41 
42 The ranking also takes antiparticles into account, so there will only be one
43 B+- candidate with ``rank=1``. The remaining list is sorted from best to worst
44 candidate (each charge, e.g. B+/B-, separately). The sorting is guaranteed
45 to be stable between particle and anti particle list: particles with the same
46 value for ``variable`` will keep their relative order. That is, a particle "A"
47 which was before another particle "B" in the same list and has the same value
48 for ``variable`` will also stay before "B" after sorting.
49 
50 If ``allowMultiRank=False`` (the default) candidates with same value of
51 ``variable`` will have different ranks. If ``allowMultiRank=True`` they will
52 share the same rank.
53 
54 IF ``numBest>0`` only candidates with this rank or better will remain in the
55 output list. If ``allowMultiRank=True`` that means that there can be more than
56 ``numBest`` candidates in the output list if they share ranks.
57 )DOC");
58 
60 
61  addParam("particleList", m_inputListName, "Name of the ParticleList to rank for best candidate");
62  addParam("variable", m_variableName, "Variable which defines the candidate ranking (see ``selectLowest`` for ordering)");
63  addParam("selectLowest", m_selectLowest, "If true, candidate with lower values of ``variable`` are better, otherwise higher is better", false);
64  addParam("allowMultiRank", m_allowMultiRank, "If true, candidates with identical values get identical rank", false);
65  addParam("numBest", m_numBest, "Keep only particles with this rank or better. If ``allowMultiRank=False`` this is "
66  "identical to the maximum amount of candidates left in the list. Otherwise there may be more candidates if "
67  "some share the same rank (0: keep all)", 0);
68  addParam("cut", m_cutParameter, "Only candidates passing the cut will be ranked. The others will have rank -1.", std::string(""));
69  addParam("outputVariable", m_outputVariableName,
70  "Name for created variable, which contains the rank for the particle. If not provided, the standard name ``${variable}_rank`` is used.");
71 
72 }
73 
75 
77 {
78  m_particles.isRequired();
79  m_inputList.isRequired(m_inputListName);
80 
82  if (!m_variable) {
83  B2ERROR("Variable '" << m_variableName << "' is not available in Variable::Manager!");
84  }
85  if (!(m_variable->variabletype == Variable::Manager::VariableDataType::c_double or m_variable->variabletype == Variable::Manager::VariableDataType::c_int)) {
86  B2ERROR("Variable '" << m_variableName << "' has wrong data type! It must be either double or integer.");
87  }
88  if (m_numBest < 0) {
89  B2ERROR("value of numBest must be >= 0!");
90  }
92 
93  // parse the name that the rank will be stored under
94  if (m_outputVariableName.empty()) {
95  std::string root_compatible_VariableName = MakeROOTCompatible::makeROOTCompatible(m_variableName);
96  m_outputVariableName = root_compatible_VariableName + "_rank";
97  }
98 }
99 
101 {
102  // input list
103  if (!m_inputList) {
104  B2WARNING("Input list " << m_inputList.getName() << " was not created?");
105  return;
106  }
107 
108  // create list of particle index and the corresponding value of variable
109  typedef std::pair<double, unsigned int> ValueIndexPair;
110  std::vector<ValueIndexPair> valueToIndex;
111  const unsigned int numParticles = m_inputList->getListSize();
112  valueToIndex.reserve(numParticles);
113  for (const Particle& p : *m_inputList) {
114  double value = 0;
115  auto var_result = m_variable->function(&p);
116  if (std::holds_alternative<double>(var_result)) {
117  value = std::get<double>(var_result);
118  } else if (std::holds_alternative<int>(var_result)) {
119  value = std::get<int>(var_result);
120  }
121  valueToIndex.emplace_back(value, p.getArrayIndex());
122  }
123 
124  // use stable sort to make sure we keep the relative order of elements with
125  // same value as it was before
126  if (m_selectLowest) {
127  std::stable_sort(valueToIndex.begin(), valueToIndex.end(), ValueIndexPairSorting::lowerPair<ValueIndexPair>);
128  } else {
129  std::stable_sort(valueToIndex.begin(), valueToIndex.end(), ValueIndexPairSorting::higherPair<ValueIndexPair>);
130  }
131 
132  // assign ranks and (optionally) remove everything but best candidates
133  m_inputList->clear();
134  int rank{1};
135  double previous_val{0};
136  bool first_candidate{true};
137  for (const auto& candidate : valueToIndex) {
138  Particle* p = m_particles[candidate.second];
139  if (!m_cut->check(p)) {
140  p->addExtraInfo(m_outputVariableName, -1);
141  m_inputList->addParticle(p);
142  continue;
143  }
144  if (first_candidate) {
145  first_candidate = false;
146  } else {
147  if (!m_allowMultiRank || (candidate.first != previous_val)) ++rank;
148  }
149 
150  if (!p->hasExtraInfo(m_outputVariableName))
151  p->addExtraInfo(m_outputVariableName, rank);
152  m_inputList->addParticle(p);
153 
154  previous_val = candidate.first;
155 
156  if (m_numBest != 0 and rank >= m_numBest)
157  break;
158  }
159 }
bool m_allowMultiRank
Give the same rank to candidates with the same value.
virtual void initialize() override
Initialize the module (set up datastore)
virtual void event() override
Process an event.
std::string m_variableName
Variable which defines the candidate ranking.
StoreArray< Particle > m_particles
StoreArray of Particle objects.
bool m_selectLowest
Select the candidate with the lowest value (instead of highest).
virtual ~BestCandidateSelectionModule() override
Destructor.
std::unique_ptr< Variable::Cut > m_cut
cut object which performs the cuts
StoreObjPtr< ParticleList > m_inputList
input particle list
const Variable::Manager::Var * m_variable
Variable which defines the candidate ranking.
std::string m_cutParameter
Selection for candidates to be ranked.
int m_numBest
Number of best candidates to keep.
std::string m_outputVariableName
Name of generated Ranking-Variable, if specified by user.
std::string m_inputListName
name of input particle list.
static std::unique_ptr< GeneralCut > compile(const std::string &cut)
Creates an instance of a cut and returns a unique_ptr to it, if you need a copy-able object instead y...
Definition: GeneralCut.h:84
static std::string makeROOTCompatible(std::string str)
Remove special characters that ROOT dislikes in branch names, e.g.
void setDescription(const std::string &description)
Sets the description of the module.
Definition: Module.cc:214
void setPropertyFlags(unsigned int propertyFlags)
Sets the flags for the module properties.
Definition: Module.cc:208
@ c_ParallelProcessingCertified
This module can be run in parallel processing mode safely (All I/O must be done through the data stor...
Definition: Module.h:80
Class to store reconstructed particles.
Definition: Particle.h:74
const Var * getVariable(std::string name)
Get the variable belonging to the given key.
Definition: Manager.cc:57
static Manager & Instance()
get singleton instance.
Definition: Manager.cc:25
void addParam(const std::string &name, T &paramVariable, const std::string &description, const T &defaultValue)
Adds a new parameter to the module.
Definition: Module.h:560
#define REG_MODULE(moduleName)
Register the given module (without 'Module' suffix) with the framework.
Definition: Module.h:650
Abstract base class for different kinds of events.
Definition: ClusterUtils.h:23
VariableDataType variabletype
data type of variable
Definition: Manager.h:133
FunctionPtr function
Pointer to function.
Definition: Manager.h:147