Belle II Software  light-2212-foldex
BestCandidateSelectionModule.cc
1 /**************************************************************************
2  * basf2 (Belle II Analysis Software Framework) *
3  * Author: The Belle II Collaboration *
4  * *
5  * See git log for contributors and copyright holders. *
6  * This file is licensed under LGPL-3.0, see LICENSE.md. *
7  **************************************************************************/
8 
9 #include <analysis/modules/BestCandidateSelection/BestCandidateSelectionModule.h>
10 
11 #include <analysis/utility/ValueIndexPairSorting.h>
12 
13 #include <analysis/VariableManager/Utility.h>
14 
15 #include <analysis/DecayDescriptor/DecayDescriptor.h>
16 
17 #include <framework/logging/Logger.h>
18 #include <framework/utilities/MakeROOTCompatible.h>
19 
20 using namespace std;
21 using namespace Belle2;
22 
23 
// Register this module with the framework; the name is given without the 'Module' suffix.
24 REG_MODULE(BestCandidateSelection);
25 
26 
27 BestCandidateSelectionModule::BestCandidateSelectionModule():
28  m_variable(nullptr)
29 {
30  //the "undefined order" bit is not strictly true in the current implementation, but details (with anti-particle lists) are tricky
31  setDescription(R"DOC(Sort particles by the value of a given ``variable``
32 in the input list and optionally remove particles after the nth position.
33 
34 Per default particles are sorted in descending order but it can be switched to
35 an ascending order by setting ``selectLowest=True``. The convenience functions
36 `modularAnalysis.rankByHighest` and `modularAnalysis.rankByLowest` set this
37 parameter automatically based on their names.
38 
39 Particles will receive an extra-info field containing their rank as an integer
40 starting at 1 (best). The name of this extra-info field defaults to
41 ``${variable}_rank`` but can be chosen freely using the ``outputVariable``
42 parameter.
43 
44 The ranking also takes antiparticles into account, so there will only be one
45 B+- candidate with ``rank=1``. The remaining list is sorted from best to worst
46 candidate (each charge, e.g. B+/B-, separately). The sorting is guaranteed
47 to be stable between particle and anti particle list: particles with the same
48 value for ``variable`` will keep their relative order. That is, a particle "A"
49 which was before another particle "B" in the same list and has the same value
50 for ``variable`` will also stay before "B" after sorting.
51 
52 If ``allowMultiRank=False`` (the default) candidates with same value of
53 ``variable`` will have different ranks. If ``allowMultiRank=True`` they will
54 share the same rank.
55 
56 IF ``numBest>0`` only candidates with this rank or better will remain in the
57 output list. If ``allowMultiRank=True`` that means that there can be more than
58 ``numBest`` candidates in the output list if they share ranks.
59 )DOC");
60 
62 
63  addParam("particleList", m_inputListName, "Name of the ParticleList to rank for best candidate");
64  addParam("variable", m_variableName, "Variable which defines the candidate ranking (see ``selectLowest`` for ordering)");
65  addParam("selectLowest", m_selectLowest, "If true, candidate with lower values of ``variable`` are better, otherwise higher is better", false);
66  addParam("allowMultiRank", m_allowMultiRank, "If true, candidates with identical values get identical rank", false);
67  addParam("numBest", m_numBest, "Keep only particles with this rank or better. If ``allowMultiRank=False`` this is "
68  "identical to the maximum amount of candidates left in the list. Otherwise there may be more candidates if "
69  "some share the same rank (0: keep all)", 0);
70  addParam("cut", m_cutParameter, "Only candidates passing the cut will be ranked. The others will have rank -1.", std::string(""));
71  addParam("outputVariable", m_outputVariableName,
72  "Name for created variable, which contains the rank for the particle. If not provided, the standard name ``${variable}_rank`` is used.");
73 
74 }
75 
77 
79 {
80  m_particles.isRequired();
81  m_inputList.isRequired(m_inputListName);
82 
84  if (!m_variable) {
85  B2ERROR("Variable '" << m_variableName << "' is not available in Variable::Manager!");
86  }
87  if (!(m_variable->variabletype == Variable::Manager::VariableDataType::c_double or m_variable->variabletype == Variable::Manager::VariableDataType::c_int)) {
88  B2ERROR("Variable '" << m_variableName << "' has wrong data type! It must be either double or integer.");
89  }
90  if (m_numBest < 0) {
91  B2ERROR("value of numBest must be >= 0!");
92  } else if (m_numBest != 0) {
93  DecayDescriptor decaydescriptor;
94  decaydescriptor.init(m_inputListName);
95 
96  const DecayDescriptorParticle* ddpart = decaydescriptor.getMother();
97  const int pdgCode = ddpart->getPDGCode();
98  const string listLabel = ddpart->getLabel();
99 
100  // For final state particles we protect the label "all".
101  if (Const::finalStateParticlesSet.contains(Const::ParticleType(abs(pdgCode))) and listLabel == "all") {
102  B2FATAL("You are trying to apply a best-candidate-selection on the list " << m_inputListName <<
103  " but the label 'all' is protected for lists of final-state particles." <<
104  " It could introduce *very* dangerous bugs.");
105  } else if (listLabel == "MC" or listLabel == "V0") {
106  // the labels MC and V0 are also protected
107  B2FATAL("You are trying to apply a best-candidate-selection on the list " << m_inputListName <<
108  " but the label " << listLabel << " is protected and can not be reduced.");
109  }
110 
111  }
112 
114 
115  // parse the name that the rank will be stored under
116  if (m_outputVariableName.empty()) {
117  std::string root_compatible_VariableName = MakeROOTCompatible::makeROOTCompatible(m_variableName);
118  m_outputVariableName = root_compatible_VariableName + "_rank";
119  }
120 }
121 
123 {
124  // input list
125  if (!m_inputList) {
126  B2WARNING("Input list " << m_inputList.getName() << " was not created?");
127  return;
128  }
129 
130  if (m_numBest == 0 and m_inputList->getIsReserved())
131  m_inputList->setEditable(true);
132 
133  // create list of particle index and the corresponding value of variable
134  typedef std::pair<double, unsigned int> ValueIndexPair;
135  std::vector<ValueIndexPair> valueToIndex;
136  const unsigned int numParticles = m_inputList->getListSize();
137  valueToIndex.reserve(numParticles);
138  for (const Particle& p : *m_inputList) {
139  double value = 0;
140  auto var_result = m_variable->function(&p);
141  if (std::holds_alternative<double>(var_result)) {
142  value = std::get<double>(var_result);
143  } else if (std::holds_alternative<int>(var_result)) {
144  value = std::get<int>(var_result);
145  }
146  valueToIndex.emplace_back(value, p.getArrayIndex());
147  }
148 
149  // use stable sort to make sure we keep the relative order of elements with
150  // same value as it was before
151  if (m_selectLowest) {
152  std::stable_sort(valueToIndex.begin(), valueToIndex.end(), ValueIndexPairSorting::lowerPair<ValueIndexPair>);
153  } else {
154  std::stable_sort(valueToIndex.begin(), valueToIndex.end(), ValueIndexPairSorting::higherPair<ValueIndexPair>);
155  }
156 
157  // assign ranks and (optionally) remove everything but best candidates
158  m_inputList->clear();
159  int rank{1};
160  double previous_val{0};
161  bool first_candidate{true};
162  for (const auto& candidate : valueToIndex) {
163  Particle* p = m_particles[candidate.second];
164  if (!m_cut->check(p)) {
165  p->addExtraInfo(m_outputVariableName, -1);
166  m_inputList->addParticle(p);
167  continue;
168  }
169  if (first_candidate) {
170  first_candidate = false;
171  } else {
172  // If allowMultiRank, only increase rank when value changes
173  if (!m_allowMultiRank || (candidate.first != previous_val)) ++rank;
174  }
175 
176  if ((m_numBest != 0) and (rank > m_numBest)) // Only keep particles with same rank or below
177  break;
178 
179  if (!p->hasExtraInfo(m_outputVariableName))
180  p->addExtraInfo(m_outputVariableName, rank);
181  m_inputList->addParticle(p);
182  previous_val = candidate.first;
183 
184 
185  }
186 
187  if (m_numBest == 0 and m_inputList->getIsReserved())
188  m_inputList->setEditable(false);
189 }
bool m_allowMultiRank
Give the same rank to candidates with the same value.
virtual void initialize() override
Initialize the module (set up datastore)
virtual void event() override
Process an event.
std::string m_variableName
Variable which defines the candidate ranking.
StoreArray< Particle > m_particles
StoreArray of Particle objects.
bool m_selectLowest
Select the candidate with the lowest value (instead of highest).
virtual ~BestCandidateSelectionModule() override
Destructor.
std::unique_ptr< Variable::Cut > m_cut
cut object which performs the cuts
StoreObjPtr< ParticleList > m_inputList
input particle list
const Variable::Manager::Var * m_variable
Variable which defines the candidate ranking.
std::string m_cutParameter
Selection for candidates to be ranked.
int m_numBest
Number of best candidates to keep.
std::string m_outputVariableName
Name of generated Ranking-Variable, if specified by user.
std::string m_inputListName
name of input particle list.
The ParticleType class for identifying different particle types.
Definition: Const.h:399
static const ParticleSet finalStateParticlesSet
set of final-state particles that can be created by the ParticleLoader
Definition: Const.h:648
Represents a particle in the DecayDescriptor.
int getPDGCode() const
Return PDG code.
std::string getLabel() const
The label of this particle, "default" returned, when no label set.
The DecayDescriptor stores information about a decay tree or parts of a decay tree.
bool init(const std::string &str)
Initialise the DecayDescriptor from given string.
const DecayDescriptorParticle * getMother() const
return mother.
static std::unique_ptr< GeneralCut > compile(const std::string &cut)
Creates an instance of a cut and returns a unique_ptr to it, if you need a copy-able object instead y...
Definition: GeneralCut.h:84
static std::string makeROOTCompatible(std::string str)
Remove special characters that ROOT dislikes in branch names, e.g.
void setDescription(const std::string &description)
Sets the description of the module.
Definition: Module.cc:214
void setPropertyFlags(unsigned int propertyFlags)
Sets the flags for the module properties.
Definition: Module.cc:208
@ c_ParallelProcessingCertified
This module can be run in parallel processing mode safely (All I/O must be done through the data stor...
Definition: Module.h:80
Class to store reconstructed particles.
Definition: Particle.h:74
const Var * getVariable(std::string name)
Get the variable belonging to the given key.
Definition: Manager.cc:57
static Manager & Instance()
get singleton instance.
Definition: Manager.cc:25
void addParam(const std::string &name, T &paramVariable, const std::string &description, const T &defaultValue)
Adds a new parameter to the module.
Definition: Module.h:560
#define REG_MODULE(moduleName)
Register the given module (without 'Module' suffix) with the framework.
Definition: Module.h:650
Abstract base class for different kinds of events.
Definition: ClusterUtils.h:23
VariableDataType variabletype
data type of variable
Definition: Manager.h:133
FunctionPtr function
Pointer to function.
Definition: Manager.h:147