9 #include <framework/database/Configuration.h>
10 #include <framework/logging/Logger.h>
11 #include <framework/dataobjects/FileMetaData.h>
12 #include <framework/database/Downloader.h>
13 #include <framework/database/Database.h>
14 #include <framework/utilities/Utils.h>
15 #include <boost/python.hpp>
16 #include <framework/core/PyObjConvUtils.h>
17 #include <framework/core/PyObjROOTUtils.h>
18 #include <boost/algorithm/string.hpp>
25 #define CURRENT_DEFAULT_TAG "release-08-01-07"
27 namespace py = boost::python;
35 std::vector<std::string> extractStringList(
const py::object& obj)
37 std::vector<std::string> result;
39 py::object str(py::handle<>(PyObject_Str(item.ptr())));
40 py::extract<std::string> extract(str);
41 result.emplace_back(extract());
49 namespace Belle2::Conditions {
54 boost::python::list tmp;
55 for (
const auto& e : std::get<0>(
m_value)) { tmp.append(e); }
56 m_value.emplace<boost::python::list>(std::move(tmp));
65 std::vector<std::string> tmp = extractStringList(std::get<1>(
m_value));
66 m_value.emplace<std::vector<std::string>>(std::move(tmp));
74 [&element](std::vector<std::string>& list) {list.emplace_back(element);},
75 [&element](boost::python::list & list) {list.append(element);}
82 [&element](std::vector<std::string>& list) {list.emplace(list.begin(), element);},
83 [&element](boost::python::list & list) {list.insert(0, element);}
89 ensurePy().slice(boost::python::_, boost::python::_) = source;
130 fillFromEnv(list,
"BELLE2_CONDB_GLOBALTAG", CURRENT_DEFAULT_TAG);
131 return py::tuple(list);
142 if (inputMetadata.empty())
return;
144 std::optional<std::string> inputGlobaltags;
145 for (
const auto& metadata : inputMetadata) {
146 if (!inputGlobaltags) {
147 inputGlobaltags = metadata.getDatabaseGlobalTag();
149 if (inputGlobaltags != metadata.getDatabaseGlobalTag()) {
150 B2WARNING(
"Input files metadata contain incompatible globaltag settings, globaltag replay not possible");
157 if (inputGlobaltags and inputGlobaltags->empty()) {
158 B2WARNING(
"Input files metadata all have empty globaltag setting, globaltag replay not possible");
177 std::optional<std::string> relMin, dateMin;
179 for (
const auto& metadata : inputMetadata) {
181 std::string rel = metadata.getRelease().substr(0, 10);
182 if (std::regex_match(rel, std::regex(
"release-[0-9][0-9]"))) {
183 if (!relMin) relMin = rel;
184 relMin = min(*relMin, rel);
188 std::string date = metadata.getDate().substr(0, 10);
189 if (std::regex_match(date, std::regex(
"[0-9][0-9][0-9][0-9]-[0-9][0-9]-[0-9][0-9]"))) {
190 if (!dateMin) dateMin = date;
191 dateMin = min(*dateMin, date);
196 if ((relMin && relMin <
"release-04") ||
197 (!relMin && (!dateMin || dateMin <
"2019-12-31"))) {
198 B2DEBUG(30,
"Enabling legacy IP information globaltag in tag replay");
203 if ((relMin && relMin <
"release-08") ||
204 (!relMin && (!dateMin || dateMin <
"2023-08-31"))) {
205 B2DEBUG(30,
"Enabling legacy CollsionAxisCMS globaltag in tag replay");
222 B2INFO(
"Global tag override is in effect: input globaltags and default globaltag will be ignored");
233 for (
const auto& tag : baseList) baseListPy.append(tag);
234 arguments[
"base_tags"] = baseListPy;
240 arguments[
"metadata"] = py::object();
243 py::list metaDataList;
245 arguments[
"metadata"] = metaDataList;
248 py::object retval = (*m_callback)(*py::tuple(), **arguments);
251 if (retval != py::object()) {
252 return extractStringList(retval);
257 if (baseList.empty()) {
259 B2FATAL(R
"(No baseline globaltags available.
260 The input files you selected don't have compatible globaltags or an empty
261 globaltag setting. As such globaltag configuration cannot be determined
264 If you really sure that it is a good idea to process these files together
265 you have to manually override the list of globaltags:
267 >>> basf2.conditions.override_globaltags()
270 B2FATAL(R
"(No default globaltags available.
271 There is no default globaltag available for processing. This usually means
272 you set the environment variable BELLE2_CONDB_GLOBALTAG to an empty value.
274 As this is unlikely to work for even the most basic functionality this is not
275 directly supported anymore. If you really want to disable any access to the
276 conditions database please configure this explicitly
278 >>> basf2.conditions.metadata_providers = []
279 >>> basf2.conditions.override_globaltags([])
285 for (
const auto& tag : baseList) { finalList.emplace_back(tag); }
291 boost::python::dict expertSettings(
const boost::python::tuple& args, boost::python::dict kwargs)
293 if (py::len(args) != 1) {
295 PyErr_SetString(PyExc_TypeError, (
"expert_settings() takes one positional argument but " +
296 std::to_string(len(args)) +
" were given").c_str());
297 py::throw_error_already_set();
299 Configuration&
self = py::extract<Configuration&>(args[0]);
306 auto checkValue = [&kwargs, &result](
const std::string & name,
auto setter,
auto getter) {
307 using value_type = decltype(getter());
308 if (kwargs.has_key(name)) {
310 py::object
object = kwargs[name];
313 }
catch (std::runtime_error&) {
314 std::stringstream error;
316 PyErr_SetString(PyExc_TypeError, error.str().c_str());
317 py::throw_error_already_set();
321 py::delitem(kwargs, py::object(name));
328 checkValue(
"save_payloads",
329 [&
self](
const std::string & path) {
self.setNewPayloadLocation(path);},
330 [&
self]() {
return self.getNewPayloadLocation();});
331 checkValue(
"download_cache_location",
332 [&
self](
const std::string & path) {
self.setDownloadCacheDirectory(path);},
333 [&
self]() {
return self.getDownloadCacheDirectory();});
334 checkValue(
"download_lock_timeout",
335 [&
self](
size_t timeout) {
self.setDownloadLockTimeout(timeout);},
336 [&
self]() {
return self.getDownloadLockTimeout();});
337 checkValue(
"usable_globaltag_states",
338 [&
self](
const auto & states) {
self.setUsableTagStates(states); },
339 [&
self]() {
return self.getUsableTagStates(); });
340 checkValue(
"connection_timeout",
341 [&downloader](
unsigned int timeout) {downloader.setConnectionTimeout(timeout);},
342 [&downloader]() {
return downloader.getConnectionTimeout();});
343 checkValue(
"stalled_timeout",
344 [&downloader](
unsigned int timeout) {downloader.setStalledTimeout(timeout);},
345 [&downloader]() {
return downloader.getStalledTimeout();});
346 checkValue(
"max_retries",
347 [&downloader](
unsigned int retries) {downloader.setMaxRetries(retries);},
348 [&downloader]() {
return downloader.getMaxRetries();});
349 checkValue(
"backoff_factor",
350 [&downloader](
unsigned int factor) { downloader.setBackoffFactor(factor);},
351 [&downloader]() {
return downloader.getBackoffFactor();});
353 if (py::len(kwargs) > 0) {
354 std::string message =
"Unrecognized keyword arguments: ";
355 auto keys = kwargs.keys();
356 for (
int i = 0; i < len(keys); ++i) {
357 if (i > 0) message +=
", ";
358 message += py::extract<std::string>(keys[i]);
360 PyErr_SetString(PyExc_TypeError, message.c_str());
361 py::throw_error_already_set();
376 py::docstring_options options(
true,
false,
false);
380 py::object expert = raw_function(expertSettings);
381 py::class_<Configuration>(
"ConditionsConfiguration", R
"DOC(
382 This class contains all configurations for the conditions database service
384 * which globaltags to use
385 * where to look for payload information
386 * where to find the actual payload files
387 * which temporary testing payloads to use
389 But for most users the only thing they should need to care about is to set the
390 list of additional `globaltags` to use.
393 Indicator whether or not the override of globaltags is enabled. If true then
394 globaltags present in input files will be ignored and only the ones given in
395 `globaltags` will be considered.
399 Reset the conditions database configuration to its original state.
402 A tuple containing the default globaltags to be used if events are generated without an input file.
405 List of globaltags to be used. These globaltags will be the ones with highest
406 priority but by default the globaltags used to create the input files or the
407 default globaltag will also be used.
409 The priority of the globaltags in this list is highest first. So the first in
410 the list will be checked first and all other globaltags will only be checked for
411 payloads not found so far.
414 By default this list contains the globaltags to be used **in addition** to
415 the ones from the input file or the default one if no input file is present.
416 If this is not desirable you need to call `override_globaltags()` to disable
417 any addition or modification of this list.
421 Append a globaltag to the end of the `globaltags` list. That means it will be
422 the lowest priority of all tags in the list.
426 Add a globaltag to the beginning of the `globaltags` list. That means it will be
427 the highest priority of all tags in the list.
429 .def("override_globaltags", overrideGTFlag)
430 .def(
"override_globaltags", overrideGTList, py::args(
"globaltags"), R
"DOC(override_globaltags(list=None)
432 Enable globaltag override. This disables all modification of the globaltag list at the beginning of processing:
434 * the default globaltag or the input file globaltags will be ignored.
435 * any callback set with `set_globaltag_callback` will be ignored.
436 * the list of `globaltags` will be used exactly as it is.
439 list (list(str) or None) if given this list will replace the current content of `globaltags`
442 it's still possible to modify `globaltags` after this call.
446 Disable global tag replay and revert to the old behavior that the default
447 globaltag will be used if no other globaltags are specified.
449 This is a shortcut to just calling
451 >>> conditions.override_globaltags()
452 >>> conditions.globaltags += list(conditions.default_globaltags)
457 Append a text file containing local test payloads to the end of the list of
458 `testing_payloads`. This will mean they will have lower priority than payloads
459 in previously defined text files but still higher priority than globaltags.
462 filename (str): file containing a local definition of payloads and their
463 intervals of validity for testing
466 This functionality is strictly for testing purposes. Using local payloads
467 leads to results which cannot be reproduced by anyone else and thus cannot
472 Insert a text file containing local test payloads in the beginning of the list
473 of `testing_payloads`. This will mean they will have higher priority than payloads in
474 previously defined text files as well as higher priority than globaltags.
477 filename (str): file containing a local definition of payloads and their
478 intervals of validity for testing
481 This functionality is strictly for testing purposes. Using local payloads
482 leads to results which cannot be reproduced by anyone else and thus cannot
486 List of text files to look for local testing payloads. Each entry should be a
487 text file containing local payloads and their intervals of validity to be used
490 Payloads found in these files and valid for the current run will have a higher
491 priority than any of the `globaltags`. If a valid payload is present in multiple
492 files the first one in the list will have higher priority.
495 This functionality is strictly for testing purposes. Using local payloads
496 leads to results which cannot be reproduced by anyone else and thus cannot
500 List of metadata providers to use when looking for payload metadata. There are currently two supported providers:
502 1. Central metadata provider to look for payloads in the central conditions database.
503 This provider is used for any entry in this list which starts with ``http(s)://``.
504 The URL should point to the top level of the REST api endpoints on the server
506 2. Local metadata provider to look for payloads in a local SQLite snapshot taken
507 from the central server. This provider will be assumed for any entry in this
508 list not starting with a protocol specifier or if the protocol is given as ``file://``
510 This list should rarely need to be changed. The only exception is for users who
511 want to be able to use the software without internet connection after they
512 downloaded a snapshot of the necessary globaltags with ``b2conditionsdb download``
513 to point to this location.
516 URL of the default central metadata provider to look for payloads in the
520 List of payload locations to search for payloads which have been found by any of
521 the configured `metadata_providers`. This can be a local directory or a
522 ``http(s)://`` url pointing to the payload directory on a server.
524 For remote locations starting with ``http(s)://`` we assume that the layout of
525 the payloads on the server is the same as on the main payload server:
526 The combination of given location and the relative url in the payload metadata
527 field ``payloadUrl`` should point to the correct payload on the server.
529 For local directories, two layouts are supported and will be auto detected:
532 All payloads are in the same directory without any substructure with the name
533 ``dbstore_{name}_rev_{revision}.root``
535 All payloads are stored in subdirectories in the form ``AB/{name}_r{revision}.root``
536 where ``A`` and ``B`` are the first two characters of the md5 checksum of the
540 Given ``payload_locations = ["payload_dir/", "http://server.com/payloads"]``
541 the framework would look for a payload with name ``BeamParameters`` in revision
542 ``45`` (and checksum ``a34ce5...``) in the following places
545 1. ``payload_dir/a3/BeamParameters_r45.root``
546 2. ``payload_dir/dbstore_BeamParameters_rev_45.root``
547 3. ``http://server.com/payloads/dbstore/BeamParameters/dbstore_BeamParameters_rev_45.root``
548 given the usual pattern of the ``payloadUrl`` metadata. But this could be
549 changed on the central servers so mirrors should not depend on this convention
550 but copy the actual structure of the central server.
552 If the payload cannot be found in any of the given locations the framework will
553 always attempt to download it directly from the central server and put it in a
554 local cache directory.
556 .def("expert_settings", expert, R
"DOC(expert_settings(**kwargs)
558 Set some additional settings for the conditions database.
560 You can supply any combination of keyword-only arguments defined below. The
561 function will return a dictionary containing all current settings.
563 >>> conditions.expert_settings(connection_timeout=5, max_retries=1)
564 {'save_payloads': 'localdb/database.txt',
565 'download_cache_location': '',
566 'download_lock_timeout': 120,
567 'usable_globaltag_states': {'PUBLISHED', 'RUNNING', 'TESTING', 'VALIDATED'},
568 'connection_timeout': 5,
569 'stalled_timeout': 60,
574 Modification of these parameters should not be needed, in rare
575 circumstances this could be used to optimize access for many jobs at once
576 but should only be set by experts.
579 save_payloads (str): Where to store new payloads created during processing.
580 This should be a filename to contain the payload information and the payload
581 files will be placed in the same directory as the file.
582 download_cache_location (str): Where to store payloads which have been downloaded
583 from the central server. This could be a user defined directory, otherwise
584 empty string defaults to ``$TMPDIR/basf2-conditions`` where ``$TMPDIR`` is the
585 temporary directories defined in the system. Newly downloaded payloads will
586 be stored in this directory in a hashed structure, see `payload_locations`
587 download_lock_timeout (int): How many seconds to wait for a write lock when
588 concurrently downloading the same payload between different processes.
589 If locking fails the payload will be downloaded to a temporary file
590 separately for each process.
591 usable_globaltag_states (set(str)): Names of globaltag states accepted for
592 processing. This can be changed to make sure that only fully published
593 globaltags are used or to enable running on an open tag. It is not possible
594 to allow usage of 'INVALID' tags, those will always be rejected.
595 connection_timeout (int): timeout in seconds before connection should be
596 aborted. 0 sets the timeout to the default (300s)
597 stalled_timeout (int): timeout in seconds before a download should be
598 aborted if the speed stays below 10 KB/s, 0 disables this timeout
599 max_retries (int): maximum amount of retries if the server responded with
600 an HTTP response of 500 or more. 0 disables retrying
601 backoff_factor (int): backoff factor for retries in seconds. Retries are
602 performed using something similar to binary backoff: For retry :math:`n`
603 and a ``backoff_factor`` :math:`f` we wait for a random time chosen
604 uniformely from the interval :math:`[1, (2^{n} - 1) \times f]` in
609 Set a callback function to be called just before processing.
611 This callback can be used to further customize the globaltags to be used during
612 processing. It will be called after the input files have been opened and checked
613 with three keyword arguments:
616 The globaltags determined from either the input files or, if no input files
617 are present, the default globaltags
620 The globaltags provided by the user
623 If there are not input files (e.g. generating events) this argument is None.
624 Otherwise it is a list of all the ``FileMetaData`` instances from all input files.
625 This list can be empty if there is no metadata associated with the input files.
627 From this information the callback function should then compose the final list
628 of globaltags to be used for processing and return this list. If ``None`` is
629 returned the default behavior is applied as if there were no callback function.
630 If anything else is returned the processing is aborted.
632 If no callback function is specified the default behavior is equivalent to ::
634 def callback(base_tags, user_tags, metadata):
636 basf2.B2FATAL("No baseline globaltags available. Please use override")
638 return user_tags + base_tags
640 If `override_enabled` is ``True`` then the callback function will not be called.
643 If a callback is set it is responsible to select the correct list of globaltags
644 and also make sure that all files are compatible. No further checks will be
645 done by the framework but any list of globaltags which is returned will be used
648 If the list of ``base_tags`` is empty that usually means that the input files
649 had different globaltag settings but it is the responsibility of the callback
650 to then verify if the list of globaltags is usable or not.
652 If the callback function determines that no working set of globaltags can be
653 determined then it should abort processing using a FATAL error or an exception
bool m_overrideEnabled
is the globaltag override enabled?
static Configuration & getInstance()
Get a reference to the instance which will be used when the Database is initialized.
CppOrPyList m_globalTags
the list with all user globaltags
void prependGlobalTag(const std::string &globalTag)
preprend a globaltag
boost::python::tuple getDefaultGlobalTagsPy() const
Get the tuple of default globaltags as python version.
void appendGlobalTag(const std::string &globalTag)
Append a globaltag.
Configuration()
Initialize default values.
void ensureEditable() const
Check whether the configuration object can be edited or if the database has been initialized already.
void setGlobaltagCallbackPy(const boost::python::object &obj)
Set a callback function from python which will be called when processing starts and should return the...
std::vector< std::string > getBaseTags() const
Get the base globaltags to be used in addition to user globaltags.
void disableGlobalTagReplay()
Disable global tag replay.
boost::python::list getGlobalTagsPy()
Get the list of user globaltags as python version.
void setMetadataProvidersPy(const boost::python::list &list)
Set the list of metadata providers in python.
boost::python::list getTestingPayloadLocationsPy()
Get the list of text files containing test payloads in python.
static void fillFromEnv(T &target, const std::string &envName, const std::string &defaultValue)
Fill a target object from a list of environment variables.
std::vector< FileMetaData > m_inputMetadata
the file metadata of all input files if globaltag replay is requested by input module
std::vector< std::string > getFinalListOfTags()
Get the final list of globaltags to be used for processing.
void setPayloadLocationsPy(const boost::python::list &list)
Set the list of payload locations in python.
CppOrPyList m_metadataProviders
the list with all the metadata providers
void setInputMetadata(const std::vector< FileMetaData > &inputMetadata)
To be called by input modules with the list of all input FileMetaData.
boost::python::list getMetadataProvidersPy()
Get the list of metadata providers in python.
void overrideGlobalTags()
Enable globaltag override: If this is called once than overrideEnabled() will return true and getFina...
void setTestingPayloadLocationsPy(const boost::python::list &list)
Set the list of text files containing test payloads in python.
std::optional< std::vector< std::string > > m_inputGlobaltags
the list of globaltags from all the input files to be used in addition to the user globaltags
void prependTestingPayloadLocation(const std::string &filename)
Prepend a local text file with testing payloads to the list.
boost::python::list getPayloadLocationsPy()
Get the list og payload locations in python.
static void exposePythonAPI()
expose this class to python
std::string m_defaultMetadataProviderUrl
default URL where to look for the metadata provider
std::string getDefaultMetadataProviderUrl()
Get the default URL where to look for the metadata provider.
CppOrPyList m_payloadLocations
the list with all the payload locations
void overrideGlobalTagsPy(const boost::python::list &globalTags)
Enable globaltag override and set the list of user globaltags in one go.
void reset()
Reset to default values.
void setGlobalTagsPy(const boost::python::list &globalTags)
Set the list of globaltags from python.
bool overrideEnabled() const
Check if override is enabled by previous calls to overrideGlobalTags()
std::optional< boost::python::object > m_callback
the callback function to determine the final final list of globaltags
std::vector< std::string > getDefaultGlobalTags() const
Get the std::vector of default globaltags.
void appendTestingPayloadLocation(const std::string &filename)
Add a local text file with testing payloads.
bool m_databaseInitialized
bool indicating whether the database has been initialized, in which case any changes to the configura...
boost::python::list & ensurePy()
Return the python list version.
void prepend(const std::string &element)
Prepend an element to whatever representation we currently have.
void shallowCopy(const boost::python::object &source)
shallow copy all elements of the source object into the python representation.
void append(const std::string &element)
Append an element to whatever representation we currently have.
std::vector< std::string > & ensureCpp()
Return the C++ vector version.
std::variant< std::vector< std::string >, boost::python::list > m_value
Store either a std::vector or a python list of strings.
static Downloader & getDefaultInstance()
Return the default instance.
static std::string get(const std::string &name, const std::string &fallback="")
Get the value of an environment variable or the given fallback value if the variable is not set.
static bool isSet(const std::string &name)
Check if a value is set in the database.
static Database & Instance()
Instance of a singleton Database.
static std::vector< std::string > getOrCreateList(const std::string &name, const std::string &fallback, const std::string &separators=" \t\n\r")
Get a list of values from an environment variable or the given fallback string if the variable is not...
boost::python::object createROOTObjectPyCopy(const T &instance)
Create a python wrapped copy from a class instance which has a ROOT dictionary.
static void reset(bool keepConfig=false)
Reset the database instance.
boost::python::object convertToPythonObject(const Scalar &value)
------------— From C++ TO Python Converter ---------------------—
Scalar convertPythonObject(const boost::python::object &pyObject, Scalar)
Convert from Python to given type.
bool iteratePythonObject(const boost::python::object &pyObject, Functor function)
Helper function to loop over a python object that implements the iterator concept and call a functor ...
VisitOverload(Ts...) -> VisitOverload< Ts... >
Function for the C++17 std::visit overload pattern to allow simple use of variants.
static std::string name()
type name.