diff --git a/doc/templates.md b/doc/templates.md index 7229c71d3..643d5ea55 100644 --- a/doc/templates.md +++ b/doc/templates.md @@ -26,18 +26,19 @@ Note that some of the information below will only apply to either of these gener Currently PODIO loads templates that are placed in [`/python/templates`](/python/templates). They are broadly split along the classes that are generated for each datatype or component from the EDM definition: -| template file(s) | content | generated file(s) | -|---------------------------------|---------------------------------------------------------------------------------------------------------|---------------------------------------------------------------------------------------| -| `Component.h.jinja2` | Definition for each component | `[/].h` | -| `Data.h.jinja2` | POD struct of each datatype (living in the POD layer) | `[/]Data.h` | -| `Obj.{h,cc}.jinja2` | `Obj` class for each datatype (living in the object layer) and managing resources | `[/]Obj.h`, `src/Obj.cc` | -| `[Mutable]Object.{h,cc}.jinja2` | The user facing interfaces for each datatype (living in the user layer) | `[/][Mutable].h`, `src/[Mutable].cc` | -| `Collection.{h,cc}.jinja2` | The user facing collection interface (living in the user layer) | `[/]Collection.h`, `src/Collection.cc` | -| `CollectionData.{h,cc}.jinja2` | The classes managing the collection storage (not user facing!) | `[/]CollectionData.h`, `src/CollectionData.cc` | -| `selection.xml.jinja2` | The `selection.xml` file that is necessary for generating a root dictionary for the generated datamodel | `src/selection.xml` | -| `SIOBlock.{h,cc}.jinja2` | The SIO blocks that are necessary for the SIO backend | `[/]SIOBlock.h`, `src/SIOBlock.cc` | -| `MutableStruct.jl.jinja2` | The mutable struct definitions of components and datatypes for julia |`[/]Struct.jl`, `[/]Struct.jl` | -| `ParentModule.jl.jinja2` | The constructor and collection definitions of components and datatypes in the data model are contained within a single module named after the package-name |`[/].jl` | +| template file(s) | content | generated file(s) | +|---------------------------------|------------------------------------------------------------------------------------------------------------------------------------------------------------|---------------------------------------------------------------------------------------| +| `Component.h.jinja2` | Definition for each component | `[/].h` | +| `Data.h.jinja2` | POD struct of each datatype (living in the POD layer) | `[/]Data.h` | +| `Obj.{h,cc}.jinja2` | `Obj` class for each datatype (living in the object layer) and managing resources | `[/]Obj.h`, `src/Obj.cc` | +| `[Mutable]Object.{h,cc}.jinja2` | The user facing interfaces for each datatype (living in the user layer) | `[/][Mutable].h`, `src/[Mutable].cc` | +| `Collection.{h,cc}.jinja2` | The user facing collection interface (living in the user layer) | `[/]Collection.h`, `src/Collection.cc` | +| `CollectionData.{h,cc}.jinja2` | The classes managing the collection storage (not user facing!) | `[/]CollectionData.h`, `src/CollectionData.cc` | +| `datamodel.h.jinja2` | The *full datamodel header* that includes everything of a generated EDM (via including all generated `Collections`). | `[]/.h` | +| `selection.xml.jinja2` | The `selection.xml` file that is necessary for generating a root dictionary for the generated datamodel | `src/selection.xml` | +| `SIOBlock.{h,cc}.jinja2` | The SIO blocks that are necessary for the SIO backend | `[/]SIOBlock.h`, `src/SIOBlock.cc` | +| `MutableStruct.jl.jinja2` | The mutable struct definitions of components and datatypes for julia | `[/]Struct.jl`, `[/]Struct.jl` | +| `ParentModule.jl.jinja2` | The constructor and collection definitions of components and datatypes in the data model are contained within a single module named after the package-name | `[/].jl` | The presence of a `[]` subdirectory for the header files is controlled by the `includeSubfolder` option in the yaml definition file. diff --git a/include/podio/CollectionBranches.h b/include/podio/CollectionBranches.h deleted file mode 100644 index 3ab3e8129..000000000 --- a/include/podio/CollectionBranches.h +++ /dev/null @@ -1,23 +0,0 @@ -#ifndef PODIO_COLLECTIONBRANCHES_H -#define PODIO_COLLECTIONBRANCHES_H - -#include "TBranch.h" - -#include -#include - -namespace podio::root_utils { -/// Small helper struct to collect all branches that are necessary to read or -/// write a collection. Needed to cache the branch pointers and avoid having to -/// get them from a TTree/TChain for every event. -struct CollectionBranches { - TBranch* data{nullptr}; - std::vector refs{}; - std::vector vecs{}; - std::vector refNames{}; ///< The names of the relation branches - std::vector vecNames{}; ///< The names of the vector member branches -}; - -} // namespace podio::root_utils - -#endif diff --git a/include/podio/GenericParameters.h b/include/podio/GenericParameters.h index 55119a2e8..60adf8825 100644 --- a/include/podio/GenericParameters.h +++ b/include/podio/GenericParameters.h @@ -6,6 +6,7 @@ #include #include +#include #include #include #include @@ -105,6 +106,10 @@ class GenericParameters { template > std::vector getKeys() const; + /// Get all the available values for a given type + template > + std::vector> getValues() const; + /// erase all elements void clear() { _intMap.clear(); @@ -243,5 +248,19 @@ std::vector GenericParameters::getKeys() const { return keys; } +template +std::vector> GenericParameters::getValues() const { + std::vector> values; + auto& mtx = getMutex(); + const auto& map = getMap(); + { + // Lock to avoid concurrent changes to the map while we get the stored + // values + std::lock_guard lock{mtx}; + values.reserve(map.size()); + std::transform(map.begin(), map.end(), std::back_inserter(values), [](const auto& pair) { return pair.second; }); + } + return values; +} } // namespace podio #endif diff --git a/include/podio/RNTupleReader.h b/include/podio/RNTupleReader.h index 1cffa149f..057b9fcef 100644 --- a/include/podio/RNTupleReader.h +++ b/include/podio/RNTupleReader.h @@ -1,8 +1,6 @@ #ifndef PODIO_RNTUPLEREADER_H #define PODIO_RNTUPLEREADER_H -#include "podio/CollectionBranches.h" -#include "podio/ICollectionProvider.h" #include "podio/ROOTFrameData.h" #include "podio/SchemaEvolution.h" #include "podio/podioVersion.h" diff --git a/include/podio/RNTupleWriter.h b/include/podio/RNTupleWriter.h index ed0f3012c..d8a53ba43 100644 --- a/include/podio/RNTupleWriter.h +++ b/include/podio/RNTupleWriter.h @@ -1,11 +1,11 @@ #ifndef PODIO_RNTUPLEWRITER_H #define PODIO_RNTUPLEWRITER_H -#include "podio/CollectionBase.h" #include "podio/Frame.h" #include "podio/GenericParameters.h" #include "podio/SchemaEvolution.h" #include "podio/utilities/DatamodelRegistryIOHelpers.h" +#include "podio/utilities/RootHelpers.h" #include "TFile.h" #include @@ -102,42 +102,42 @@ class RNTupleWriter { checkConsistency(const std::vector& collsToWrite, const std::string& category) const; private: - template - void fillParams(GenericParameters& params, ROOT::Experimental::REntry* entry); + std::unique_ptr + createModels(const std::vector& collections); + + /// Helper struct to group all the necessary information for one category. + struct CategoryInfo { + std::unique_ptr writer{nullptr}; ///< The RNTupleWriter for this category + + // The following are assumed to run in parallel! + std::vector ids{}; ///< The ids of all collections + std::vector names{}; ///< The names of all collections + std::vector types{}; ///< The types of all collections + std::vector subsetCollections{}; ///< The flags identifying the subcollections + std::vector schemaVersions{}; ///< The schema versions of all collections + + // Storage for the keys & values of all the parameters of this category + // (resp. at least the current entry) + root_utils::ParamStorage intParams{}; + root_utils::ParamStorage floatParams{}; + root_utils::ParamStorage doubleParams{}; + root_utils::ParamStorage stringParams{}; + }; + CategoryInfo& getCategoryInfo(const std::string& category); - using StoreCollection = std::pair; - std::unique_ptr createModels(const std::vector& collections); + template + void fillParams(const GenericParameters& params, CategoryInfo& catInfo, ROOT::Experimental::REntry* entry); - std::unique_ptr m_metadata{}; - std::unique_ptr m_metadataWriter{}; + template + root_utils::ParamStorage& getParamStorage(CategoryInfo& catInfo); std::unique_ptr m_file{}; DatamodelDefinitionCollector m_datamodelCollector{}; - struct CollectionInfo { - std::vector id{}; - std::vector name{}; - std::vector type{}; - std::vector isSubsetCollection{}; - std::vector schemaVersion{}; - std::unique_ptr writer{nullptr}; - }; - CollectionInfo& getCategoryInfo(const std::string& category); - - std::unordered_map m_categories{}; + std::unordered_map m_categories{}; bool m_finished{false}; - - std::vector m_intkeys{}, m_floatkeys{}, m_doublekeys{}, m_stringkeys{}; - - std::vector> m_intvalues{}; - std::vector> m_floatvalues{}; - std::vector> m_doublevalues{}; - std::vector> m_stringvalues{}; - - template - std::pair&, std::vector>&> getKeyValueVectors(); }; } // namespace podio diff --git a/include/podio/ROOTFrameData.h b/include/podio/ROOTFrameData.h index d58dd43e4..502ff24ef 100644 --- a/include/podio/ROOTFrameData.h +++ b/include/podio/ROOTFrameData.h @@ -25,37 +25,15 @@ class ROOTFrameData { ROOTFrameData(const ROOTFrameData&) = delete; ROOTFrameData& operator=(const ROOTFrameData&) = delete; - ROOTFrameData(BufferMap&& buffers, CollIDPtr&& idTable, podio::GenericParameters&& params) : - m_buffers(std::move(buffers)), m_idTable(std::move(idTable)), m_parameters(std::move(params)) { - } + ROOTFrameData(BufferMap&& buffers, CollIDPtr&& idTable, podio::GenericParameters&& params); - std::optional getCollectionBuffers(const std::string& name) { - const auto bufferHandle = m_buffers.extract(name); - if (bufferHandle.empty()) { - return std::nullopt; - } + std::optional getCollectionBuffers(const std::string& name); - return {bufferHandle.mapped()}; - } + podio::CollectionIDTable getIDTable() const; - podio::CollectionIDTable getIDTable() const { - // Construct a copy of the internal table - return {m_idTable->ids(), m_idTable->names()}; - } + std::unique_ptr getParameters(); - std::unique_ptr getParameters() { - return std::make_unique(std::move(m_parameters)); - } - - std::vector getAvailableCollections() const { - std::vector collections; - collections.reserve(m_buffers.size()); - for (const auto& [name, _] : m_buffers) { - collections.push_back(name); - } - - return collections; - } + std::vector getAvailableCollections() const; private: // TODO: switch to something more elegant once the basic functionality and @@ -66,13 +44,6 @@ class ROOTFrameData { podio::GenericParameters m_parameters{}; }; -// Interim workaround for https://github.com/AIDASoft/podio#500 -inline ROOTFrameData::~ROOTFrameData() { - for (auto& [_, buffer] : m_buffers) { - buffer.deleteBuffers(buffer); - } -} - } // namespace podio #endif // PODIO_ROOTFRAMEDATA_H diff --git a/include/podio/ROOTLegacyReader.h b/include/podio/ROOTLegacyReader.h index c379eea1c..9383ca51b 100644 --- a/include/podio/ROOTLegacyReader.h +++ b/include/podio/ROOTLegacyReader.h @@ -1,13 +1,12 @@ #ifndef PODIO_ROOTLEGACYREADER_H #define PODIO_ROOTLEGACYREADER_H -#include "podio/CollectionBranches.h" #include "podio/ROOTFrameData.h" #include "podio/podioVersion.h" +#include "podio/utilities/RootHelpers.h" #include "TChain.h" -#include #include #include #include @@ -114,7 +113,7 @@ class ROOTLegacyReader { private: std::pair getLocalTreeAndEntry(const std::string& treename); - void createCollectionBranches(const std::vector>& collInfo); + void createCollectionBranches(const std::vector& collInfo); podio::GenericParameters readEventMetaData(); diff --git a/include/podio/ROOTReader.h b/include/podio/ROOTReader.h index b14a08d17..bb6a1efdd 100644 --- a/include/podio/ROOTReader.h +++ b/include/podio/ROOTReader.h @@ -1,14 +1,13 @@ #ifndef PODIO_ROOTREADER_H #define PODIO_ROOTREADER_H -#include "podio/CollectionBranches.h" #include "podio/ROOTFrameData.h" #include "podio/podioVersion.h" #include "podio/utilities/DatamodelRegistryIOHelpers.h" +#include "podio/utilities/RootHelpers.h" #include "TChain.h" -#include #include #include #include diff --git a/include/podio/ROOTWriter.h b/include/podio/ROOTWriter.h index 06aa61a46..318f0f21f 100644 --- a/include/podio/ROOTWriter.h +++ b/include/podio/ROOTWriter.h @@ -1,9 +1,9 @@ #ifndef PODIO_ROOTWRITER_H #define PODIO_ROOTWRITER_H -#include "podio/CollectionBranches.h" #include "podio/CollectionIDTable.h" #include "podio/utilities/DatamodelRegistryIOHelpers.h" +#include "podio/utilities/RootHelpers.h" #include "TFile.h" @@ -100,31 +100,25 @@ class ROOTWriter { checkConsistency(const std::vector& collsToWrite, const std::string& category) const; private: - using StoreCollection = std::pair; - - // collectionID, collectionType, subsetCollection - // @note same as in rootUtils.h private header! - using CollectionInfoT = std::tuple; - /// Helper struct to group together all necessary state to write / process a /// given category. Created during the first writing of a category struct CategoryInfo { - TTree* tree{nullptr}; ///< The TTree to which this category is written - std::vector branches{}; ///< The branches for this category - std::vector collInfo{}; ///< Collection info for this category - podio::CollectionIDTable idTable{}; ///< The collection id table for this category - std::vector collsToWrite{}; ///< The collections to write for this category + TTree* tree{nullptr}; ///< The TTree to which this category is written + std::vector branches{}; ///< The branches for this category + std::vector collInfo{}; ///< Collection info for this category + podio::CollectionIDTable idTable{}; ///< The collection id table for this category + std::vector collsToWrite{}; ///< The collections to write for this category }; /// Initialize the branches for this category - void initBranches(CategoryInfo& catInfo, const std::vector& collections, + void initBranches(CategoryInfo& catInfo, const std::vector& collections, /*const*/ podio::GenericParameters& parameters); /// Get the (potentially uninitialized category information for this category) CategoryInfo& getCategoryInfo(const std::string& category); static void resetBranches(std::vector& branches, - const std::vector& collections, + const std::vector& collections, /*const*/ podio::GenericParameters* parameters); std::unique_ptr m_file{nullptr}; ///< The storage file diff --git a/include/podio/Reader.h b/include/podio/Reader.h index e644a8238..ebce75a3e 100644 --- a/include/podio/Reader.h +++ b/include/podio/Reader.h @@ -7,25 +7,30 @@ namespace podio { class Reader { -public: +private: struct ReaderConcept { virtual ~ReaderConcept() = default; virtual podio::Frame readNextFrame(const std::string& name) = 0; virtual podio::Frame readFrame(const std::string& name, size_t index) = 0; - virtual size_t getEntries(const std::string& name) = 0; + virtual size_t getEntries(const std::string& name) const = 0; virtual podio::version::Version currentFileVersion() const = 0; virtual std::vector getAvailableCategories() const = 0; virtual const std::string_view getDatamodelDefinition(const std::string& name) const = 0; virtual std::vector getAvailableDatamodels() const = 0; }; +private: template - struct ReaderModel final : public ReaderConcept { + struct ReaderModel final : ReaderConcept { ReaderModel(std::unique_ptr reader) : m_reader(std::move(reader)) { } ReaderModel(const ReaderModel&) = delete; ReaderModel& operator=(const ReaderModel&) = delete; + ReaderModel(ReaderModel&&) = default; + ReaderModel& operator=(ReaderModel&&) = default; + + ~ReaderModel() = default; podio::Frame readNextFrame(const std::string& name) override { auto maybeFrame = m_reader->readNextEntry(name); @@ -43,7 +48,7 @@ class Reader { throw std::runtime_error("Failed reading category " + name + " at frame " + std::to_string(index) + " (reading beyond bounds?)"); } - size_t getEntries(const std::string& name) override { + size_t getEntries(const std::string& name) const override { return m_reader->getEntries(name); } podio::version::Version currentFileVersion() const override { @@ -67,9 +72,18 @@ class Reader { std::unique_ptr m_self{nullptr}; +public: template Reader(std::unique_ptr); + Reader(const Reader&) = delete; + Reader& operator=(const Reader&) = delete; + + Reader(Reader&&) = default; + Reader& operator=(Reader&&) = default; + + ~Reader() = default; + podio::Frame readNextFrame(const std::string& name) { return m_self->readNextFrame(name); } @@ -82,10 +96,10 @@ class Reader { podio::Frame readEvent(size_t index) { return readFrame(podio::Category::Event, index); } - size_t getEntries(const std::string& name) { + size_t getEntries(const std::string& name) const { return m_self->getEntries(name); } - size_t getEvents() { + size_t getEvents() const { return getEntries(podio::Category::Event); } podio::version::Version currentFileVersion() const { diff --git a/include/podio/Writer.h b/include/podio/Writer.h index 74c02025d..ca5b5d4c6 100644 --- a/include/podio/Writer.h +++ b/include/podio/Writer.h @@ -2,25 +2,22 @@ #define PODIO_WRITER_H #include "podio/Frame.h" -#include "podio/podioVersion.h" namespace podio { class Writer { -public: +private: struct WriterConcept { virtual ~WriterConcept() = default; - virtual void writeFrame(const podio::Frame& frame, const std::string& category) = 0; virtual void writeFrame(const podio::Frame& frame, const std::string& category, const std::vector& collections) = 0; - virtual void writeEvent(const podio::Frame& frame) = 0; - virtual void writeEvent(const podio::Frame& frame, const std::vector& collections) = 0; virtual void finish() = 0; }; +private: template - struct WriterModel final : public WriterConcept { + struct WriterModel final : WriterConcept { WriterModel(std::unique_ptr writer) : m_writer(std::move(writer)) { } WriterModel(const WriterModel&) = delete; @@ -30,19 +27,10 @@ class Writer { ~WriterModel() = default; - void writeFrame(const podio::Frame& frame, const std::string& category) override { - return m_writer->writeFrame(frame, category); - } void writeFrame(const podio::Frame& frame, const std::string& category, const std::vector& collections) override { return m_writer->writeFrame(frame, category, collections); } - void writeEvent(const podio::Frame& frame) override { - return writeFrame(frame, podio::Category::Event); - } - void writeEvent(const podio::Frame& frame, const std::vector& collections) override { - return writeFrame(frame, podio::Category::Event, collections); - } void finish() override { return m_writer->finish(); } @@ -51,6 +39,7 @@ class Writer { std::unique_ptr m_self{nullptr}; +public: template Writer(std::unique_ptr reader) : m_self(std::make_unique>(std::move(reader))) { } @@ -63,16 +52,16 @@ class Writer { ~Writer() = default; void writeFrame(const podio::Frame& frame, const std::string& category) { - return m_self->writeFrame(frame, category); + return m_self->writeFrame(frame, category, frame.getAvailableCollections()); } void writeFrame(const podio::Frame& frame, const std::string& category, const std::vector& collections) { return m_self->writeFrame(frame, category, collections); } void writeEvent(const podio::Frame& frame) { - return writeFrame(frame, podio::Category::Event); + writeFrame(frame, podio::Category::Event, frame.getAvailableCollections()); } void writeEvent(const podio::Frame& frame, const std::vector& collections) { - return writeFrame(frame, podio::Category::Event, collections); + writeFrame(frame, podio::Category::Event, collections); } void finish() { return m_self->finish(); diff --git a/include/podio/utilities/RootHelpers.h b/include/podio/utilities/RootHelpers.h new file mode 100644 index 000000000..55b97a74c --- /dev/null +++ b/include/podio/utilities/RootHelpers.h @@ -0,0 +1,44 @@ +#ifndef PODIO_UTILITIES_ROOTHELPERS_H +#define PODIO_UTILITIES_ROOTHELPERS_H + +#include "TBranch.h" + +#include +#include +#include + +namespace podio { +class CollectionBase; + +namespace root_utils { + + // A collection of additional information that describes the collection: the + // collectionID, the collection (data) type, whether it is a subset + // collection, and its schema version + using CollectionWriteInfoT = std::tuple; + // for backwards compatibility + using CollectionInfoWithoutSchemaT = std::tuple; + + /// A collection name and a base pointer grouped together for writing + using StoreCollection = std::tuple; + + /// Small helper struct to collect all branches that are necessary to read or + /// write a collection. Needed to cache the branch pointers and avoid having to + /// get them from a TTree/TChain for every event. + struct CollectionBranches { + TBranch* data{nullptr}; + std::vector refs{}; + std::vector vecs{}; + std::vector refNames{}; ///< The names of the relation branches + std::vector vecNames{}; ///< The names of the vector member branches + }; + + /// Pair of keys and values for one type of the ones that can be stored in + /// GenericParameters + template + using ParamStorage = std::tuple, std::vector>>; + +} // namespace root_utils +} // namespace podio + +#endif // PODIO_UTILITIES_ROOTHELPERS_H diff --git a/python/podio_gen/cpp_generator.py b/python/podio_gen/cpp_generator.py index 079594944..21ec9d97e 100644 --- a/python/podio_gen/cpp_generator.py +++ b/python/podio_gen/cpp_generator.py @@ -88,6 +88,7 @@ def post_process(self, _): if "ROOT" in self.io_handlers: self._prepare_iorules() self._create_selection_xml() + self._write_all_collections_header() self._write_cmake_lists_file() def do_process_component(self, name, component): @@ -485,6 +486,22 @@ def _write_list(name, target_folder, files, comment): self.any_changes, ) + def _write_all_collections_header(self): + """Write a header file that includes all collection headers""" + + collection_files = (x.split("::")[-1] + "Collection.h" for x in self.datamodel.datatypes) + self._write_file( + os.path.join(self.install_dir, self.package_name, f"{self.package_name}.h"), + self._eval_template( + "datamodel.h.jinja2", + { + "includes": collection_files, + "incfolder": self.incfolder, + "package_name": self.package_name, + }, + ), + ) + def _write_edm_def_file(self): """Write the edm definition to a compile time string""" model_encoder = DataModelJSONEncoder() diff --git a/python/podio_schema_evolution.py b/python/podio_schema_evolution.py index 12d500c66..1a9a7f828 100755 --- a/python/podio_schema_evolution.py +++ b/python/podio_schema_evolution.py @@ -31,7 +31,7 @@ class AddedComponent(SchemaChange): def __init__(self, component, name): self.component = component self.name = name - super().__init__(f"'{self.component.name}' has been added") + super().__init__(f"'{self.name}' has been added") class DroppedComponent(SchemaChange): diff --git a/python/templates/CMakeLists.txt b/python/templates/CMakeLists.txt index 503097189..014b4e0bd 100644 --- a/python/templates/CMakeLists.txt +++ b/python/templates/CMakeLists.txt @@ -1,6 +1,7 @@ set(PODIO_TEMPLATES ${CMAKE_CURRENT_LIST_DIR}/Collection.cc.jinja2 ${CMAKE_CURRENT_LIST_DIR}/Collection.h.jinja2 + ${CMAKE_CURRENT_LIST_DIR}/datamodel.h.jinja2 ${CMAKE_CURRENT_LIST_DIR}/CollectionData.cc.jinja2 ${CMAKE_CURRENT_LIST_DIR}/CollectionData.h.jinja2 ${CMAKE_CURRENT_LIST_DIR}/Component.h.jinja2 diff --git a/python/templates/datamodel.h.jinja2 b/python/templates/datamodel.h.jinja2 new file mode 100644 index 000000000..cf7ee7aea --- /dev/null +++ b/python/templates/datamodel.h.jinja2 @@ -0,0 +1,10 @@ +// AUTOMATICALLY GENERATED FILE - DO NOT EDIT + +#ifndef {{ package_name.upper() }}_{{ package_name }}_H +#define {{ package_name.upper() }}_{{ package_name }}_H + +{% for name in includes %} +#include "{{ incfolder }}{{ name }}" +{% endfor %} + +#endif // {{ package_name.upper() }}_{{ package_name }}_H diff --git a/src/CMakeLists.txt b/src/CMakeLists.txt index f129467d8..561e2a9b9 100644 --- a/src/CMakeLists.txt +++ b/src/CMakeLists.txt @@ -80,6 +80,7 @@ SET(root_sources ROOTWriter.cc ROOTReader.cc ROOTLegacyReader.cc + ROOTFrameData.cc ) if(ENABLE_RNTUPLE) list(APPEND root_sources @@ -92,6 +93,8 @@ SET(root_headers ${PROJECT_SOURCE_DIR}/include/podio/ROOTReader.h ${PROJECT_SOURCE_DIR}/include/podio/ROOTLegacyReader.h ${PROJECT_SOURCE_DIR}/include/podio/ROOTWriter.h + ${PROJECT_SOURCE_DIR}/include/podio/ROOTFrameData.h + ${PROJECT_SOURCE_DIR}/include/podio/utilities/RootHelpers.h ) if(ENABLE_RNTUPLE) list(APPEND root_headers @@ -146,7 +149,11 @@ set(io_headers ${PROJECT_SOURCE_DIR}/include/podio/Reader.h ) -PODIO_ADD_LIB_AND_DICT(podioIO "${io_headers}" "${io_sources}" io_selection.xml) +add_library(podioIO SHARED ${io_sources}) +add_library(podio::podioIO ALIAS podioIO) +target_include_directories(podioIO PUBLIC + $ + $) target_link_libraries(podioIO PUBLIC podio::podio podio::podioRootIO) if(ENABLE_SIO) target_link_libraries(podioIO PUBLIC podio::podioSioIO) @@ -170,8 +177,6 @@ install(FILES ${CMAKE_CURRENT_BINARY_DIR}/libpodioDict_rdict.pcm ${CMAKE_CURRENT_BINARY_DIR}/podioRootIODictDict.rootmap ${CMAKE_CURRENT_BINARY_DIR}/libpodioRootIODict_rdict.pcm - ${CMAKE_CURRENT_BINARY_DIR}/podioIODictDict.rootmap - ${CMAKE_CURRENT_BINARY_DIR}/libpodioIODict_rdict.pcm DESTINATION "${CMAKE_INSTALL_LIBDIR}") if (ENABLE_SIO) diff --git a/src/RNTupleWriter.cc b/src/RNTupleWriter.cc index 38231cc18..decdac8e4 100644 --- a/src/RNTupleWriter.cc +++ b/src/RNTupleWriter.cc @@ -17,7 +17,6 @@ namespace podio { RNTupleWriter::RNTupleWriter(const std::string& filename) : - m_metadata(ROOT::Experimental::RNTupleModel::Create()), m_file(new TFile(filename.c_str(), "RECREATE", "data file")) { } @@ -28,40 +27,33 @@ RNTupleWriter::~RNTupleWriter() { } template -std::pair&, std::vector>&> RNTupleWriter::getKeyValueVectors() { +root_utils::ParamStorage& RNTupleWriter::getParamStorage(CategoryInfo& catInfo) { if constexpr (std::is_same_v) { - return {m_intkeys, m_intvalues}; + return catInfo.intParams; } else if constexpr (std::is_same_v) { - return {m_floatkeys, m_floatvalues}; + return catInfo.floatParams; } else if constexpr (std::is_same_v) { - return {m_doublekeys, m_doublevalues}; + return catInfo.doubleParams; } else if constexpr (std::is_same_v) { - return {m_stringkeys, m_stringvalues}; + return catInfo.stringParams; } else { throw std::runtime_error("Unknown type"); } } template -void RNTupleWriter::fillParams(GenericParameters& params, ROOT::Experimental::REntry* entry) { - auto [key, value] = getKeyValueVectors(); +void RNTupleWriter::fillParams(const GenericParameters& params, CategoryInfo& catInfo, + ROOT::Experimental::REntry* entry) { + auto& [keys, values] = getParamStorage(catInfo); + keys = params.getKeys(); + values = params.getValues(); #if ROOT_VERSION_CODE >= ROOT_VERSION(6, 31, 0) - entry->BindRawPtr(root_utils::getGPKeyName(), &key); - entry->BindRawPtr(root_utils::getGPValueName(), &value); + entry->BindRawPtr(root_utils::getGPKeyName(), &keys); + entry->BindRawPtr(root_utils::getGPValueName(), &values); #else - entry->CaptureValueUnsafe(root_utils::getGPKeyName(), &key); - entry->CaptureValueUnsafe(root_utils::getGPValueName(), &value); + entry->CaptureValueUnsafe(root_utils::getGPKeyName(), &keys); + entry->CaptureValueUnsafe(root_utils::getGPValueName(), &values); #endif - - key.clear(); - key.reserve(params.getMap().size()); - value.clear(); - value.reserve(params.getMap().size()); - - for (auto& [kk, vv] : params.getMap()) { - key.emplace_back(kk); - value.emplace_back(vv); - } } void RNTupleWriter::writeFrame(const podio::Frame& frame, const std::string& category) { @@ -77,14 +69,14 @@ void RNTupleWriter::writeFrame(const podio::Frame& frame, const std::string& cat const bool new_category = (catInfo.writer == nullptr); if (new_category) { // This is the minimal information that we need for now - catInfo.name = root_utils::sortAlphabeticaly(collsToWrite); + catInfo.names = root_utils::sortAlphabeticaly(collsToWrite); } - std::vector collections; - collections.reserve(catInfo.name.size()); + std::vector collections; + collections.reserve(catInfo.names.size()); // Only loop over the collections that were requested in the first Frame of // this category - for (const auto& name : catInfo.name) { + for (const auto& name : catInfo.names) { auto* coll = frame.getCollectionForWrite(name); if (!coll) { // Make sure all collections that we want to write are actually available @@ -101,15 +93,15 @@ void RNTupleWriter::writeFrame(const podio::Frame& frame, const std::string& cat catInfo.writer = ROOT::Experimental::RNTupleWriter::Append(std::move(model), category, *m_file.get(), {}); for (const auto& [name, coll] : collections) { - catInfo.id.emplace_back(coll->getID()); - catInfo.type.emplace_back(coll->getTypeName()); - catInfo.isSubsetCollection.emplace_back(coll->isSubsetCollection()); - catInfo.schemaVersion.emplace_back(coll->getSchemaVersion()); + catInfo.ids.emplace_back(coll->getID()); + catInfo.types.emplace_back(coll->getTypeName()); + catInfo.subsetCollections.emplace_back(coll->isSubsetCollection()); + catInfo.schemaVersions.emplace_back(coll->getSchemaVersion()); } } else { - if (!root_utils::checkConsistentColls(catInfo.name, collsToWrite)) { + if (!root_utils::checkConsistentColls(catInfo.names, collsToWrite)) { throw std::runtime_error("Trying to write category '" + category + "' with inconsistent collection content. " + - root_utils::getInconsistentCollsMsg(catInfo.name, collsToWrite)); + root_utils::getInconsistentCollsMsg(catInfo.names, collsToWrite)); } } @@ -178,17 +170,17 @@ void RNTupleWriter::writeFrame(const podio::Frame& frame, const std::string& cat // &const_cast(frame.getParameters())); } - auto params = frame.getParameters(); - fillParams(params, entry.get()); - fillParams(params, entry.get()); - fillParams(params, entry.get()); - fillParams(params, entry.get()); + const auto& params = frame.getParameters(); + fillParams(params, catInfo, entry.get()); + fillParams(params, catInfo, entry.get()); + fillParams(params, catInfo, entry.get()); + fillParams(params, catInfo, entry.get()); m_categories[category].writer->Fill(*entry); } std::unique_ptr -RNTupleWriter::createModels(const std::vector& collections) { +RNTupleWriter::createModels(const std::vector& collections) { auto model = ROOT::Experimental::RNTupleModel::CreateBare(); #if ROOT_VERSION_CODE >= ROOT_VERSION(6, 31, 0) @@ -260,49 +252,49 @@ RNTupleWriter::createModels(const std::vector& collections) { return model; } -RNTupleWriter::CollectionInfo& RNTupleWriter::getCategoryInfo(const std::string& category) { +RNTupleWriter::CategoryInfo& RNTupleWriter::getCategoryInfo(const std::string& category) { if (auto it = m_categories.find(category); it != m_categories.end()) { return it->second; } - auto [it, _] = m_categories.try_emplace(category, CollectionInfo{}); + auto [it, _] = m_categories.try_emplace(category, CategoryInfo{}); return it->second; } void RNTupleWriter::finish() { + auto metadata = ROOT::Experimental::RNTupleModel::Create(); auto podioVersion = podio::version::build_version; - auto versionField = m_metadata->MakeField>(root_utils::versionBranchName); + auto versionField = metadata->MakeField>(root_utils::versionBranchName); *versionField = {podioVersion.major, podioVersion.minor, podioVersion.patch}; auto edmDefinitions = m_datamodelCollector.getDatamodelDefinitionsToWrite(); - auto edmField = - m_metadata->MakeField>>(root_utils::edmDefBranchName); + auto edmField = metadata->MakeField>>(root_utils::edmDefBranchName); *edmField = std::move(edmDefinitions); - auto availableCategoriesField = m_metadata->MakeField>(root_utils::availableCategories); + auto availableCategoriesField = metadata->MakeField>(root_utils::availableCategories); for (auto& [c, _] : m_categories) { availableCategoriesField->push_back(c); } for (auto& [category, collInfo] : m_categories) { - auto idField = m_metadata->MakeField>({root_utils::idTableName(category)}); - *idField = collInfo.id; - auto collectionNameField = m_metadata->MakeField>({root_utils::collectionName(category)}); - *collectionNameField = collInfo.name; - auto collectionTypeField = m_metadata->MakeField>({root_utils::collInfoName(category)}); - *collectionTypeField = collInfo.type; - auto subsetCollectionField = m_metadata->MakeField>({root_utils::subsetCollection(category)}); - *subsetCollectionField = collInfo.isSubsetCollection; - auto schemaVersionField = m_metadata->MakeField>({"schemaVersion_" + category}); - *schemaVersionField = collInfo.schemaVersion; + auto idField = metadata->MakeField>({root_utils::idTableName(category)}); + *idField = collInfo.ids; + auto collectionNameField = metadata->MakeField>({root_utils::collectionName(category)}); + *collectionNameField = collInfo.names; + auto collectionTypeField = metadata->MakeField>({root_utils::collInfoName(category)}); + *collectionTypeField = collInfo.types; + auto subsetCollectionField = metadata->MakeField>({root_utils::subsetCollection(category)}); + *subsetCollectionField = collInfo.subsetCollections; + auto schemaVersionField = metadata->MakeField>({"schemaVersion_" + category}); + *schemaVersionField = collInfo.schemaVersions; } - m_metadata->Freeze(); - m_metadataWriter = - ROOT::Experimental::RNTupleWriter::Append(std::move(m_metadata), root_utils::metaTreeName, *m_file, {}); + metadata->Freeze(); + auto metadataWriter = + ROOT::Experimental::RNTupleWriter::Append(std::move(metadata), root_utils::metaTreeName, *m_file, {}); - m_metadataWriter->Fill(); + metadataWriter->Fill(); m_file->Write(); @@ -311,7 +303,6 @@ void RNTupleWriter::finish() { for (auto& [_, catInfo] : m_categories) { catInfo.writer.reset(); } - m_metadataWriter.reset(); m_finished = true; } @@ -319,7 +310,7 @@ void RNTupleWriter::finish() { std::tuple, std::vector> RNTupleWriter::checkConsistency(const std::vector& collsToWrite, const std::string& category) const { if (const auto it = m_categories.find(category); it != m_categories.end()) { - return root_utils::getInconsistentColls(it->second.name, collsToWrite); + return root_utils::getInconsistentColls(it->second.names, collsToWrite); } return {std::vector{}, collsToWrite}; diff --git a/src/ROOTFrameData.cc b/src/ROOTFrameData.cc new file mode 100644 index 000000000..2fde64154 --- /dev/null +++ b/src/ROOTFrameData.cc @@ -0,0 +1,44 @@ +#include "podio/ROOTFrameData.h" + +namespace podio { + +ROOTFrameData::ROOTFrameData(BufferMap&& buffers, CollIDPtr&& idTable, podio::GenericParameters&& params) : + m_buffers(std::move(buffers)), m_idTable(std::move(idTable)), m_parameters(std::move(params)) { +} + +// Interim workaround for https://github.com/AIDASoft/podio#500 +ROOTFrameData::~ROOTFrameData() { + for (auto& [_, buffer] : m_buffers) { + buffer.deleteBuffers(buffer); + } +} + +std::optional ROOTFrameData::getCollectionBuffers(const std::string& name) { + const auto bufferHandle = m_buffers.extract(name); + if (bufferHandle.empty()) { + return std::nullopt; + } + + return {bufferHandle.mapped()}; +} + +podio::CollectionIDTable ROOTFrameData::getIDTable() const { + // Construct a copy of the internal table + return {m_idTable->ids(), m_idTable->names()}; +} + +std::unique_ptr ROOTFrameData::getParameters() { + return std::make_unique(std::move(m_parameters)); +} + +std::vector ROOTFrameData::getAvailableCollections() const { + std::vector collections; + collections.reserve(m_buffers.size()); + for (const auto& [name, _] : m_buffers) { + collections.push_back(name); + } + + return collections; +} + +} // namespace podio diff --git a/src/ROOTLegacyReader.cc b/src/ROOTLegacyReader.cc index c5815e4e3..83f160615 100644 --- a/src/ROOTLegacyReader.cc +++ b/src/ROOTLegacyReader.cc @@ -138,7 +138,7 @@ void ROOTLegacyReader::openFiles(const std::vector& filenames) { // Check if the CollectionTypeInfo branch is there and assume that the file // has been written with with podio pre #197 (<0.13.1) if that is not the case if (auto* collInfoBranch = root_utils::getBranch(metadatatree, "CollectionTypeInfo")) { - auto collectionInfo = new std::vector; + auto collectionInfo = new std::vector; if (m_fileVersion < podio::version::Version{0, 16, 4}) { auto oldCollInfo = new std::vector(); @@ -171,7 +171,7 @@ unsigned ROOTLegacyReader::getEntries(const std::string& name) const { return m_chain->GetEntries(); } -void ROOTLegacyReader::createCollectionBranches(const std::vector& collInfo) { +void ROOTLegacyReader::createCollectionBranches(const std::vector& collInfo) { size_t collectionIndex{0}; for (const auto& [collID, collType, isSubsetColl, collSchemaVersion] : collInfo) { diff --git a/src/ROOTReader.cc b/src/ROOTReader.cc index 928000c7a..fab05d112 100644 --- a/src/ROOTReader.cc +++ b/src/ROOTReader.cc @@ -21,11 +21,11 @@ namespace podio { std::tuple, std::vector>> createCollectionBranches(TChain* chain, const podio::CollectionIDTable& idTable, - const std::vector& collInfo); + const std::vector& collInfo); std::tuple, std::vector>> createCollectionBranchesIndexBased(TChain* chain, const podio::CollectionIDTable& idTable, - const std::vector& collInfo); + const std::vector& collInfo); GenericParameters ROOTReader::readEntryParameters(ROOTReader::CategoryInfo& catInfo, bool reloadBranches, unsigned int localEntry) { @@ -137,7 +137,7 @@ void ROOTReader::initCategory(CategoryInfo& catInfo, const std::string& category auto* collInfoBranch = root_utils::getBranch(m_metaChain.get(), root_utils::collInfoName(category)); - auto collInfo = new std::vector(); + auto collInfo = new std::vector(); if (m_fileVersion < podio::version::Version{0, 16, 4}) { auto oldCollInfo = new std::vector(); collInfoBranch->SetAddress(&oldCollInfo); @@ -253,7 +253,7 @@ std::vector ROOTReader::getAvailableCategories() const { std::tuple, std::vector>> createCollectionBranchesIndexBased(TChain* chain, const podio::CollectionIDTable& idTable, - const std::vector& collInfo) { + const std::vector& collInfo) { size_t collectionIndex{0}; std::vector collBranches; @@ -305,7 +305,7 @@ createCollectionBranchesIndexBased(TChain* chain, const podio::CollectionIDTable std::tuple, std::vector>> createCollectionBranches(TChain* chain, const podio::CollectionIDTable& idTable, - const std::vector& collInfo) { + const std::vector& collInfo) { size_t collectionIndex{0}; std::vector collBranches; diff --git a/src/ROOTWriter.cc b/src/ROOTWriter.cc index b38bc145b..9e46bf942 100644 --- a/src/ROOTWriter.cc +++ b/src/ROOTWriter.cc @@ -37,7 +37,7 @@ void ROOTWriter::writeFrame(const podio::Frame& frame, const std::string& catego catInfo.tree->SetDirectory(m_file.get()); } - std::vector collections; + std::vector collections; collections.reserve(catInfo.collsToWrite.size()); for (const auto& name : catInfo.collsToWrite) { auto* coll = frame.getCollectionForWrite(name); @@ -76,7 +76,7 @@ ROOTWriter::CategoryInfo& ROOTWriter::getCategoryInfo(const std::string& categor return it->second; } -void ROOTWriter::initBranches(CategoryInfo& catInfo, const std::vector& collections, +void ROOTWriter::initBranches(CategoryInfo& catInfo, const std::vector& collections, /*const*/ podio::GenericParameters& parameters) { catInfo.branches.reserve(collections.size() + 1); // collections + parameters @@ -118,7 +118,7 @@ void ROOTWriter::initBranches(CategoryInfo& catInfo, const std::vectorgetTypeName(), + catInfo.collInfo.emplace_back(catInfo.idTable.collectionID(name).value(), std::string(coll->getTypeName()), coll->isSubsetCollection(), coll->getSchemaVersion()); } @@ -129,12 +129,12 @@ void ROOTWriter::initBranches(CategoryInfo& catInfo, const std::vector& branches, - const std::vector& collections, + const std::vector& collections, /*const*/ podio::GenericParameters* parameters) { size_t iColl = 0; - for (auto& coll : collections) { + for (auto& [_, coll] : collections) { const auto& collBranches = branches[iColl]; - root_utils::setCollectionAddresses(coll.second->getBuffers(), collBranches); + root_utils::setCollectionAddresses(coll->getBuffers(), collBranches); iColl++; } diff --git a/src/io_selection.xml b/src/io_selection.xml deleted file mode 100644 index ffeeb5eef..000000000 --- a/src/io_selection.xml +++ /dev/null @@ -1,6 +0,0 @@ - - - - - - diff --git a/src/rootUtils.h b/src/rootUtils.h index 5fb7aa7d3..c9e7c1238 100644 --- a/src/rootUtils.h +++ b/src/rootUtils.h @@ -1,14 +1,10 @@ #ifndef PODIO_ROOT_UTILS_H // NOLINT(llvm-header-guard): internal headers confuse clang-tidy #define PODIO_ROOT_UTILS_H // NOLINT(llvm-header-guard): internal headers confuse clang-tidy -#include "podio/CollectionBase.h" -#include "podio/CollectionBranches.h" -#include "podio/CollectionBuffers.h" #include "podio/CollectionIDTable.h" +#include "podio/utilities/RootHelpers.h" #include "TBranch.h" -#include "TChain.h" -#include "TClass.h" #include "TTree.h" #include @@ -203,13 +199,6 @@ inline void setCollectionAddresses(const BufferT& collBuffers, const CollectionB } } -// A collection of additional information that describes the collection: the -// collectionID, the collection (data) type, whether it is a subset -// collection, and its schema version -using CollectionInfoT = std::tuple; -// for backwards compatibility -using CollectionInfoWithoutSchemaT = std::tuple; - inline void readBranchesData(const CollectionBranches& branches, Long64_t entry) { // Read all data if (branches.data) { @@ -233,7 +222,7 @@ inline void readBranchesData(const CollectionBranches& branches, Long64_t entry) * collections */ inline auto reconstructCollectionInfo(TTree* eventTree, podio::CollectionIDTable const& idTable) { - std::vector collInfo; + std::vector collInfo; for (size_t iColl = 0; iColl < idTable.names().size(); ++iColl) { const auto collID = idTable.ids()[iColl]; diff --git a/tests/schema_evolution/CMakeLists.txt b/tests/schema_evolution/CMakeLists.txt index a86963d82..c6eabb388 100644 --- a/tests/schema_evolution/CMakeLists.txt +++ b/tests/schema_evolution/CMakeLists.txt @@ -33,4 +33,20 @@ function(PODIO_CREATE_READ_NEW_DATA_TEST sourcefile additional_libs) ) endfunction() +add_test( + NAME schema-evolution-script + COMMAND ${PROJECT_SOURCE_DIR}/python/podio_schema_evolution.py + ${CMAKE_CURRENT_SOURCE_DIR}/datalayout_new.yaml + ${PROJECT_SOURCE_DIR}/tests/datalayout.yaml +) + +add_test( + NAME schema-evolution-script-with-evol + COMMAND + ${PROJECT_SOURCE_DIR}/python/podio_schema_evolution.py + --evo ${CMAKE_CURRENT_SOURCE_DIR}/schema_evolution.yaml + ${CMAKE_CURRENT_SOURCE_DIR}/datalayout_new.yaml + ${PROJECT_SOURCE_DIR}/tests/datalayout.yaml +) + add_subdirectory(root_io) diff --git a/tests/schema_evolution/datalayout_new.yaml b/tests/schema_evolution/datalayout_new.yaml index e9938fd1c..8c08df933 100644 --- a/tests/schema_evolution/datalayout_new.yaml +++ b/tests/schema_evolution/datalayout_new.yaml @@ -33,6 +33,11 @@ components : - int x - int y_new + ex2::NamespaceStructLong: + Members: + - int64_t x + - int64_t y_new + ex2::NamespaceInNamespaceStruct: Members: - ex2::NamespaceStruct data @@ -191,7 +196,7 @@ datatypes : Members: - std::int16_t i16Val{42} // some int16 value - std::array floats {3.14f, 1.23f} // some float values - - ex2::NamespaceStruct s{10, 11} // one that we happen to know works + - ex2::NamespaceStructLong s{10, 11} // one that we happen to know works - double d{9.876e5} // double val - CompWithInit comp // To make sure that the default initializer of the component does what it should