16 The classes defined here are used to uniquely define a FEI training.
18 - The global configuration like database prefix, cache mode, monitoring, ... (FeiConfiguration)
19 - The reconstructed Particles (Particle)
20 - The reconstructed Channels of each particle (DecayChannel)
21 - The MVA configuration for each channel (MVAConfiguration)
22 - The Cut definitions of each channel (PreCutConfiguration)
23 - The Cut definitions of each particle (PostCutConfiguration)
36FeiConfiguration = collections.namedtuple(
'FeiConfiguration',
37 'prefix, cache, monitor, legacy, externTeacher, training, monitoring_path')
38FeiConfiguration.__new__.__defaults__ = (
'FEI_TEST',
None,
True,
None,
'basf2_mva_teacher',
False,
'')
39FeiConfiguration.__doc__ =
"Fei Global Configuration class"
40FeiConfiguration.prefix.__doc__ =
"The database prefix used for all weight files"
41FeiConfiguration.cache.__doc__ =
"The stage which is passed as input, it is assumed that all previous stages"\
42 " do not have to be reconstructed again. Can be either a number or"\
43 " a filename containing a pickled number or"\
44 " None in this case the environment variable FEI_STAGE is used."
45FeiConfiguration.monitor.__doc__ = (
46 "Determines the level of monitoring histograms to create. "
47 "Set to False to disable monitoring. "
48 "Set to 'simple' to enable lightweight histograms. "
49 "Any other value will enable full monitoring histograms."
51FeiConfiguration.legacy.__doc__ =
"Pass the summary file of a legacy FEI training,"\
52 " and the algorithm will be able to apply this training."
53FeiConfiguration.externTeacher.__doc__ =
"Teacher command e.g. basf2_mva_teacher, b2mva-kekcc-cluster-teacher"
54FeiConfiguration.training.__doc__ =
"If you train the FEI set this to True, otherwise to False"
55FeiConfiguration.monitoring_path.__doc__ =
"Path where monitoring histograms are stored."
58MVAConfiguration = collections.namedtuple(
'MVAConfiguration',
'method, config, variables, target, sPlotVariable, spectators')
59MVAConfiguration.__new__.__defaults__ = (
'FastBDT',
60 '--nTrees 400 --nCutLevels 10 --nLevels 3 --shrinkage 0.1 --randRatio 0.5',
61 None,
'isSignal',
None, {})
62MVAConfiguration.__doc__ =
"Multivariate analysis configuration class."
63MVAConfiguration.method.__doc__ =
"Method used by MVAInterface."
64MVAConfiguration.config.__doc__ =
"Method specific configuration string passed to basf2_mva_teacher"
65MVAConfiguration.variables.__doc__ =
"List of variables from the VariableManager."\
66 " {} is expanded to one variable per daughter particle."
67MVAConfiguration.target.__doc__ =
"Target variable from the VariableManager."
68MVAConfiguration.sPlotVariable.__doc__ =
"Discriminating variable used by sPlot to do data-driven training."
69MVAConfiguration.spectators.__doc__ =
"Dictionary of spectator variables with their ranges from the VariableManager."
72PreCutConfiguration = collections.namedtuple(
73 'PreCutConfiguration',
'userCut, vertexCut, noBackgroundSampling,'
74 'bestCandidateVariable, bestCandidateCut, bestCandidateMode, noSignalSampling, bkgSamplingFactor')
75PreCutConfiguration.__new__.__defaults__ = (
'', -2,
False,
None, 0,
'lowest',
False, 1.0)
76PreCutConfiguration.__doc__ =
"PreCut configuration class. These cuts is employed before training the mva classifier."
77PreCutConfiguration.userCut.__doc__ =
"The user cut is passed directly to the ParticleCombiner."\
78 " Particles which do not pass this cut are immediately discarded."
79PreCutConfiguration.vertexCut.__doc__ =
"The vertex cut is passed as confidence level to the VertexFitter."
80PreCutConfiguration.noBackgroundSampling.__doc__ =
"For very pure channels, the background sampling factor is too high" \
81 " and the MVA can't be trained. This disables background sampling."
82PreCutConfiguration.bestCandidateVariable.__doc__ =
"Variable from the VariableManager which is used to rank all candidates."
83PreCutConfiguration.bestCandidateCut.__doc__ =
"Number of best-candidates to keep after the best-candidate ranking."
84PreCutConfiguration.bestCandidateMode.__doc__ =
"Either lowest or highest."
85PreCutConfiguration.noSignalSampling.__doc__ =
"For channels with unknown br. frac., the signal sampling factor can be" \
86 " overestimated and you loose signal samples in the training." \
87 " This disables signal sampling."
88PreCutConfiguration.bkgSamplingFactor.__doc__ =
"Add additional multiplicative bkg. sampling factor, less than 1.0 to reduce."
90PostCutConfiguration = collections.namedtuple(
'PostCutConfiguration',
'value, bestCandidateCut')
91PostCutConfiguration.__new__.__defaults__ = (0.0, 0)
92PostCutConfiguration.__doc__ =
"PostCut configuration class. This cut is employed after the training of the mva classifier."
93PostCutConfiguration.value.__doc__ =
"Absolute value used to cut on the SignalProbability of each candidate."
94PostCutConfiguration.bestCandidateCut.__doc__ =
"Number of best-candidates to keep, ranked by SignalProbability."
96DecayChannel = collections.namedtuple(
98 'name, label, decayString, daughters, mvaConfig, preCutConfig, decayModeID, pi0veto')
99DecayChannel.__new__.__defaults__ = (
None,
None,
None,
None,
None,
None,
None,
False)
100DecayChannel.__doc__ =
"Decay channel of a Particle."
101DecayChannel.name.__doc__ =
"str:Name of the channel e.g. :code:`D0:generic_0`"
102DecayChannel.label.__doc__ =
"Label used to identify the decay channel e.g. for weight files independent of decayModeID"
103DecayChannel.decayString.__doc__ =
"DecayDescriptor of the channel e.g. D0 -> K+ pi-"
104DecayChannel.daughters.__doc__ =
"List of daughter particles of the decay channel e.g. [K+, pi-]"
105DecayChannel.mvaConfig.__doc__ =
"MVAConfiguration object which is used for this channel."
106DecayChannel.preCutConfig.__doc__ =
"PreCutConfiguration object which is used for this channel."
107DecayChannel.decayModeID.__doc__ =
"DecayModeID of this channel. Unique ID for each channel of this particle."
108DecayChannel.pi0veto.__doc__ =
"If true, additional pi0veto variables are added to the MVAs, useful only for decays with gammas."
110MonitoringVariableBinning = {
'mcErrors': (
'mcErrors', 513, -0.5, 512.5),
111 'mcParticleStatus': (
'mcParticleStatus', 257, -0.5, 256.5),
112 'dM': (
'dM', 100, -1.0, 1.0),
113 'dQ': (
'dQ', 100, -1.0, 1.0),
114 'abs(dM)': (
'abs(dM)', 100, 0.0, 1.0),
115 'abs(dQ)': (
'abs(dQ)', 100, 0.0, 1.0),
116 'pionID': (
'pionID', 100, 0.0, 1.0),
117 'kaonID': (
'kaonID', 100, 0.0, 1.0),
118 'protonID': (
'protonID', 100, 0.0, 1.0),
119 'electronID': (
'electronID', 100, 0.0, 1.0),
120 'muonID': (
'muonID', 100, 0.0, 1.0),
121 'isSignal': (
'isSignal', 2, -0.5, 1.5),
122 'isSignalAcceptMissingNeutrino': (
'isSignalAcceptMissingNeutrino', 2, -0.5, 1.5),
123 'isPrimarySignal': (
'isPrimarySignal', 2, -0.5, 1.5),
124 'chiProb': (
'chiProb', 100, 0.0, 1.0),
125 'Mbc': (
'Mbc', 100, 5.1, 5.4),
126 'cosThetaBetweenParticleAndNominalB': (
'cosThetaBetweenParticleAndNominalB', 100, -10.0, 10.0),
127 'extraInfo(SignalProbability)': (
'extraInfo(SignalProbability)', 100, 0.0, 1.0),
128 'extraInfo(decayModeID)': (
'extraInfo(decayModeID)', 101, -0.5, 100.5),
129 'extraInfo(uniqueSignal)': (
'extraInfo(uniqueSignal)', 2, -0.5, 1.5),
130 'extraInfo(preCut_rank)': (
'extraInfo(preCut_rank)', 41, -0.5, 40.5),
131 'extraInfo(postCut_rank)': (
'extraInfo(postCut_rank)', 41, -0.5, 40.5),
132 'daughterProductOf(extraInfo(SignalProbability))':
133 (
'daughterProductOf(extraInfo(SignalProbability))', 100, 0.0, 1.0),
134 'pValueCombinationOfDaughters(extraInfo(SignalProbability))':
135 (
'pValueCombinationOfDaughters(extraInfo(SignalProbability))', 100, 0.0, 1.0),
139def variables2binnings(variables):
141 Convert given variables into a tuples which can be given to VariableToHistogram
143 return [MonitoringVariableBinning[v]
if v
in MonitoringVariableBinning
else (v, 100, -10.0, 10.0)
for v
in variables]
146def variables2binnings_2d(variables):
148 Convert given variables into a tuples which can be given to VariableToHistogram
151 for v1, v2
in variables:
152 b1 = MonitoringVariableBinning[v1]
if v1
in MonitoringVariableBinning
else (v1, 100, -10.0, 10.0)
153 b2 = MonitoringVariableBinning[v2]
if v2
in MonitoringVariableBinning
else (v2, 100, -10.0, 10.0)
154 result.append(b1 + b2)
158def removeJPsiSlash(string: str) -> str:
160 Remove the / in the J/psi particle name
162 return string.replace(
'/',
'')
168 The Particle class is the only class the end-user gets into contact with.
169 The user creates an instance of this class for every particle he wants to reconstruct with the FEI algorithm,
170 and provides MVAConfiguration, PreCutConfiguration and PostCutConfiguration. These can be overwritten per channel.
173 def __init__(self, identifier: str,
174 mvaConfig: MVAConfiguration,
175 preCutConfig: PreCutConfiguration = PreCutConfiguration(),
176 postCutConfig: PostCutConfiguration = PostCutConfiguration()):
178 Creates a Particle without any decay channels. To add decay channels use addChannel method.
179 @param identifier is the pdg name of the particle as a string
180 with an optional additional user label separated by ':'
181 @param mvaConfig multivariate analysis configuration
182 @param preCutConfig intermediate pre cut configuration
183 @param postCutConfig post cut configuration
186 self.identifier = identifier +
':generic' if len(identifier.split(
':')) < 2
else identifier
187 v = self.identifier.split(
':')
193 self.mvaConfig = mvaConfig
197 self.preCutConfig = preCutConfig
199 self.postCutConfig = postCutConfig
203 Compares to Particle objects.
204 They are equal if their identifier, name, label, all channels, preCutConfig and postCutConfig is equal
205 @param a another Particle object
207 return (self.identifier == a.identifier
and self.name == a.name
and self.label == a.label
and
208 self.channels == a.channels
and self.preCutConfig == a.preCutConfig
and self.postCutConfig == a.postCutConfig)
212 Creates a string representation of a Particle object.
214 return str((self.identifier, self.channels, self.preCutConfig, self.postCutConfig, self.mvaConfig))
218 Creates a hash of a Particle object.
219 This is necessary to use this as a key in a dictionary
221 return hash((self.identifier, self.channels, self.preCutConfig, self.postCutConfig, self.mvaConfig))
225 """ Property returning list of unique daughter particles of all channels """
226 return list(frozenset([daughter
for channel
in self.channels
for daughter
in channel.daughters]))
229 daughters: typing.Sequence[str],
230 mvaConfig: MVAConfiguration =
None,
231 preCutConfig: PreCutConfiguration =
None,
232 pi0veto: bool =
False):
234 Appends a new decay channel to the Particle object.
235 @param daughters is a list of pdg particle names e.g. ['pi+','K-']
236 @param mvaConfig multivariate analysis configuration
237 @param preCutConfig pre cut configuration object
238 @param pi0veto if true, additional pi0veto variables are added to the MVA configuration
241 daughters = [d +
':generic' if ':' not in d
else d
for d
in daughters]
243 mvaConfig = copy.deepcopy(self.mvaConfig
if mvaConfig
is None else mvaConfig)
245 preCutConfig = copy.deepcopy(self.preCutConfig
if preCutConfig
is None else preCutConfig)
247 if mvaConfig
is not None and mvaConfig.target != self.mvaConfig.target:
249 f
'Particle {self.identifier} has common target {self.mvaConfig.target}, while channel '
250 f
'{" ".join(daughters)} has {mvaConfig.target}. Each particle must have exactly one target!')
254 for v
in mvaConfig.variables:
255 if v.count(
'{') == 0:
258 matches = re.findall(
r'\{\s*\d*\s*\.\.\s*\d*\s*\}', v)
259 if len(matches) == 0
and v.count(
'{}') == 0:
261 elif v.count(
'{}') > 0
and len(matches) > 0:
262 basf2.B2FATAL(f
'Variable {v} contains both '+
'{}'+f
' and {matches}. Only one is allowed!')
263 elif len(matches) > 0:
266 for match
in matches:
267 tempRange = match[1:-1].split(
'..')
268 if tempRange[0] ==
'':
271 tempRange[0] = int(tempRange[0])
272 if tempRange[0] >= len(daughters):
273 basf2.B2INFO(f
'Variable {v} contains index {tempRange[0]} which is more than daughters, skipping!')
276 if tempRange[1] ==
'':
277 tempRange[1] = len(daughters)
279 tempRange[1] = int(tempRange[1])
280 if tempRange[1] > len(daughters):
281 basf2.B2INFO(f
'Variable {v} contains index {tempRange[1]} which is more than daughters, skipping!')
284 ranges.append(tempRange)
288 mvaVars += [v.replace(matches[0], str(c))
for c
in range(ranges[0][0], ranges[0][1])]
290 for match
in matches:
291 v = v.replace(match,
'{}')
292 mvaVars += [v.format(*c)
for c
in itertools.product(*[range(r[0], r[1])
for r
in ranges])]
293 elif v.count(
'{}') <= len(daughters):
294 mvaVars += [v.format(*c)
for c
in itertools.combinations(list(range(0, len(daughters))), v.count(
'{}'))]
295 elif v.count(
'{}') > len(daughters):
296 basf2.B2INFO(f
'Variable {v} contains more brackets than daughters, which is why it will be ignored!')
299 basf2.B2FATAL(f
'Something went wrong with variable {v}!')
300 mvaConfig = mvaConfig._replace(variables=mvaVars)
302 decayModeID = len(self.channels)
303 self.channels.append(DecayChannel(name=self.identifier +
'_' + str(decayModeID),
304 label=removeJPsiSlash(self.identifier +
' ==> ' +
' '.join(daughters)),
305 decayString=self.identifier +
'_' + str(decayModeID) +
' -> ' +
' '.join(daughters),
308 preCutConfig=preCutConfig,
309 decayModeID=decayModeID,