fastmachinelearning · y19y19 · Apr 2, 2024 · Apr 2, 2024 · Apr 10, 2024 · Apr 29, 2024
diff --git a/Configuration/ProcessModifiers/python/allSonicTriton_cff.py b/Configuration/ProcessModifiers/python/allSonicTriton_cff.py
@@ -5,6 +5,8 @@
 from Configuration.ProcessModifiers.particleNetPTSonicTriton_cff import particleNetPTSonicTriton
 from Configuration.ProcessModifiers.deepMETSonicTriton_cff import deepMETSonicTriton
 from Configuration.ProcessModifiers.deepTauSonicTriton_cff import deepTauSonicTriton
+from Configuration.ProcessModifiers.particleTransformerAK4SonicTriton_cff import particleTransformerAK4SonicTriton
 
 # collect all SonicTriton-related process modifiers here
-allSonicTriton = cms.ModifierChain(enableSonicTriton,deepMETSonicTriton,particleNetSonicTriton,deepTauSonicTriton)
+allSonicTriton = cms.ModifierChain(enableSonicTriton,deepMETSonicTriton,particleNetSonicTriton,particleNetPTSonicTriton,deepTauSonicTriton,particleTransformerAK4SonicTriton)
+
diff --git a/Configuration/ProcessModifiers/python/particleTransformerAK4SonicTriton_cff.py b/Configuration/ProcessModifiers/python/particleTransformerAK4SonicTriton_cff.py
@@ -0,0 +1,3 @@
+import FWCore.ParameterSet.Config as cms
+
+particleTransformerAK4SonicTriton = cms.Modifier()  # process modifier that switches ParticleTransformerAK4 jet tagging to its SonicTriton producer
diff --git a/RecoBTag/ONNXRuntime/plugins/ParticleTransformerAK4SonicJetTagsProducer.cc b/RecoBTag/ONNXRuntime/plugins/ParticleTransformerAK4SonicJetTagsProducer.cc
@@ -0,0 +1,306 @@
+#include "FWCore/Framework/interface/Frameworkfwd.h"
+
+#include "FWCore/Framework/interface/Event.h"
+#include "FWCore/Framework/interface/MakerMacros.h"
+
+#include "FWCore/Framework/interface/makeRefToBaseProdFrom.h"
+
+#include "FWCore/ParameterSet/interface/ParameterSet.h"
+#include "FWCore/Utilities/interface/StreamID.h"
+
+#include "DataFormats/BTauReco/interface/JetTag.h"
+
+#include "DataFormats/BTauReco/interface/ParticleTransformerAK4TagInfo.h"
+#include "DataFormats/BTauReco/interface/ParticleTransformerAK4Features.h"
+
+#include "HeterogeneousCore/SonicTriton/interface/TritonEDProducer.h"
+
+#include "HeterogeneousCore/SonicTriton/interface/TritonData.h"
+
+// Triton (SONIC) client module for the ParticleTransformer AK4 jet tagger.
+// acquire() packs the per-jet tag-info features into the request tensors and
+// produce() converts the reply into one JetTagCollection per flavour label.
+class ParticleTransformerAK4SonicJetTagsProducer : public TritonEDProducer<> {
+public:
+  explicit ParticleTransformerAK4SonicJetTagsProducer(const edm::ParameterSet&);
+  ~ParticleTransformerAK4SonicJetTagsProducer() override;
+
+  static void fillDescriptions(edm::ConfigurationDescriptions&);
+
+  // fills the inputs sent to the inference server
+  void acquire(edm::Event const &iEvent, edm::EventSetup const &iSetup, Input &iInput) override;
+  // reads the outputs returned by the inference server and puts the products into the event
+  void produce(edm::Event &iEvent, edm::EventSetup const &iSetup, Output const &iOutput) override;
+
+private:
+  using TagInfoCollection = std::vector<reco::ParticleTransformerAK4TagInfo>;
+  using JetTagCollection = reco::JetTagCollection;
+
+  // configuration (the declaration order below is also the initialisation order)
+  const edm::EDGetTokenT<TagInfoCollection> src_;
+  std::vector<std::string> flav_names_;    // one output product per entry
+  std::vector<std::string> input_names_;   // input tensor names, indexed by InputIndexes
+  std::vector<std::string> output_names_;  // output tensor names as configured
+
+  // position of each feature group inside input_names_
+  enum InputIndexes {
+    kChargedCandidates = 0,
+    kNeutralCandidates,
+    kVertices,
+    kChargedCandidates4Vec,
+    kNeutralCandidates4Vec,
+    kVertices4Vec
+  };
+
+  // number of values pushed per constituent for each feature group
+  static constexpr unsigned int n_features_cpf_ = 16;
+  static constexpr unsigned int n_pairwise_features_cpf_ = 4;
+  static constexpr unsigned int n_features_npf_ = 8;
+  static constexpr unsigned int n_pairwise_features_npf_ = 4;
+  static constexpr unsigned int n_features_sv_ = 14;
+  static constexpr unsigned int n_pairwise_features_sv_ = 4;
+
+  bool skippedInference_ = false;  // set by acquire() when no request is sent for the event
+  bool padding_ = true;            // zero-pad every jet up to the per-event maximum length
+};
+
+// Reads the module configuration and declares one JetTagCollection product
+// per configured flavour name.
+ParticleTransformerAK4SonicJetTagsProducer::ParticleTransformerAK4SonicJetTagsProducer(const edm::ParameterSet& iConfig)
+    : TritonEDProducer<>(iConfig),
+      src_(consumes<TagInfoCollection>(iConfig.getParameter<edm::InputTag>("src"))),
+      flav_names_(iConfig.getParameter<std::vector<std::string>>("flav_names")),
+      input_names_(iConfig.getParameter<std::vector<std::string>>("input_names")),
+      output_names_(iConfig.getParameter<std::vector<std::string>>("output_names")) {
+  // the flavour name doubles as the product instance label
+  for (std::size_t iflav = 0; iflav < flav_names_.size(); ++iflav) {
+    produces<JetTagCollection>(flav_names_[iflav]);
+  }
+}
+
+// Nothing to release explicitly: the compiler-generated destructor is sufficient.
+ParticleTransformerAK4SonicJetTagsProducer::~ParticleTransformerAK4SonicJetTagsProducer() = default;
+
+// Declares the configuration parameters of this module (Triton client
+// parameters plus source, tensor names and flavour names) and registers them
+// under the label "pfParticleTransformerAK4SonicJetTags".
+void ParticleTransformerAK4SonicJetTagsProducer::fillDescriptions(edm::ConfigurationDescriptions& descriptions) {
+  using StringList = std::vector<std::string>;
+
+  // default values of the string-list parameters
+  const StringList default_inputs{"input_1", "input_2", "input_3", "input_4", "input_5", "input_6"};
+  const StringList default_outputs{"softmax"};
+  const StringList default_flavours{"probb", "probbb", "problepb", "probc", "probuds", "probg"};
+
+  edm::ParameterSetDescription desc;
+  TritonClient::fillPSetDescription(desc);
+  desc.add<edm::InputTag>("src", edm::InputTag("pfParticleTransformerAK4TagInfos"));
+  desc.add<StringList>("input_names", default_inputs);
+  desc.add<StringList>("output_names", default_outputs);
+  desc.add<StringList>("flav_names", default_flavours);
+
+  descriptions.add("pfParticleTransformerAK4SonicJetTags", desc);
+}
+
+// Builds the inference request for one event.
+//
+// The batch size is the number of jets (tag infos). For every configured input
+// tensor the per-jet features are written row by row; all jets of the event are
+// padded with zeros to the same number of rows (the per-event maximum, capped at
+// 25 charged candidates, 25 neutral candidates and 5 secondary vertices). A
+// group that is empty for every jet still gets one row of zeros. If the event
+// has no jets, or no jet has any constituent at all, no request is sent:
+// the batch size is set to 0 and, in the latter case, skippedInference_ is
+// raised so that produce() falls back to default scores.
+//
+// iSetup is not used.
+void ParticleTransformerAK4SonicJetTagsProducer::acquire(edm::Event const &iEvent, edm::EventSetup const &iSetup, Input &iInput) {
+  // maximum number of constituents of each kind that are sent per jet
+  constexpr unsigned int n_cpf_accept = 25;
+  constexpr unsigned int n_npf_accept = 25;
+  constexpr unsigned int n_sv_accept = 5;
+
+  edm::Handle<TagInfoCollection> tag_infos;
+  iEvent.getByToken(src_, tag_infos);
+  client_->setBatchSize(tag_infos->size());
+  skippedInference_ = false;
+  if (tag_infos->empty())
+    return;
+
+  // Find the max n_cpf, n_npf and n_vtx among all the jets in the event.
+  unsigned int max_n_cpf = 0;
+  unsigned int max_n_npf = 0;
+  unsigned int max_n_vtx = 0;
+  for (const auto &taginfo : *tag_infos) {
+    const auto &features = taginfo.features();
+    max_n_cpf = std::max(max_n_cpf, static_cast<unsigned int>(features.c_pf_features.size()));
+    max_n_npf = std::max(max_n_npf, static_cast<unsigned int>(features.n_pf_features.size()));
+    max_n_vtx = std::max(max_n_vtx, static_cast<unsigned int>(features.sv_features.size()));
+  }
+
+  // If all jets have zero n_cpf, n_npf and n_vtx, the inference is skipped.
+  if (max_n_cpf == 0 && max_n_npf == 0 && max_n_vtx == 0) {
+    client_->setBatchSize(0);
+    skippedInference_ = true;
+    return;
+  }
+
+  // All the jets in the same event are filled up to the same n_cpf, n_npf and n_vtx before being sent to the server.
+  max_n_cpf = std::min(max_n_cpf, n_cpf_accept);
+  max_n_npf = std::min(max_n_npf, n_npf_accept);
+  max_n_vtx = std::min(max_n_vtx, n_sv_accept);
+
+  // Per-constituent writers: the order of the push_back calls defines the feature order inside a row.
+  const auto push_cpf = [](auto &vdata, const auto &cpf) {
+    vdata.push_back(cpf.btagPf_trackEtaRel);
+    vdata.push_back(cpf.btagPf_trackPtRel);
+    vdata.push_back(cpf.btagPf_trackPPar);
+    vdata.push_back(cpf.btagPf_trackDeltaR);
+    vdata.push_back(cpf.btagPf_trackPParRatio);
+    vdata.push_back(cpf.btagPf_trackSip2dVal);
+    vdata.push_back(cpf.btagPf_trackSip2dSig);
+    vdata.push_back(cpf.btagPf_trackSip3dVal);
+    vdata.push_back(cpf.btagPf_trackSip3dSig);
+    vdata.push_back(cpf.btagPf_trackJetDistVal);
+    vdata.push_back(cpf.ptrel);
+    vdata.push_back(cpf.drminsv);
+    vdata.push_back(cpf.vtx_ass);
+    vdata.push_back(cpf.puppiw);
+    vdata.push_back(cpf.chi2);
+    vdata.push_back(cpf.quality);
+  };
+  const auto push_npf = [](auto &vdata, const auto &npf) {
+    vdata.push_back(npf.ptrel);
+    vdata.push_back(npf.etarel);
+    vdata.push_back(npf.phirel);
+    vdata.push_back(npf.deltaR);
+    vdata.push_back(npf.isGamma);
+    vdata.push_back(npf.hadFrac);
+    vdata.push_back(npf.drminsv);
+    vdata.push_back(npf.puppiw);
+  };
+  const auto push_sv = [](auto &vdata, const auto &sv) {
+    vdata.push_back(sv.pt);
+    vdata.push_back(sv.deltaR);
+    vdata.push_back(sv.mass);
+    vdata.push_back(sv.etarel);
+    vdata.push_back(sv.phirel);
+    vdata.push_back(sv.ntracks);
+    vdata.push_back(sv.chi2);
+    vdata.push_back(sv.normchi2);
+    vdata.push_back(sv.dxy);
+    vdata.push_back(sv.dxysig);
+    vdata.push_back(sv.d3d);
+    vdata.push_back(sv.d3dsig);
+    vdata.push_back(sv.costhetasvpv);
+    vdata.push_back(sv.enratio);
+  };
+  // the pairwise (4-vector) inputs use the same members for all three constituent kinds
+  const auto push_p4 = [](auto &vdata, const auto &constituent) {
+    vdata.push_back(constituent.px);
+    vdata.push_back(constituent.py);
+    vdata.push_back(constituent.pz);
+    vdata.push_back(constituent.e);
+  };
+
+  // Writes at most n_accept constituents of one jet into vdata, then pads with zeros:
+  // up to n_target rows when padding is enabled, and with a single row when the
+  // group is empty for the whole event (n_target == 0).
+  const auto fill_rows = [this](auto &vdata,
+                                const auto &constituents,
+                                unsigned int n_accept,
+                                unsigned int n_target,
+                                unsigned int n_features,
+                                const auto &push_one) {
+    const unsigned int n_filled = std::min(static_cast<unsigned int>(constituents.size()), n_accept);
+    for (unsigned int count = 0; count < n_filled; ++count) {
+      push_one(vdata, constituents.at(count));
+    }
+    if (padding_ && n_filled < n_target)
+      vdata.insert(vdata.end(), (n_target - n_filled) * n_features, 0);  // Add 0 to unfilled part as padding value
+    if (n_target == 0)
+      vdata.insert(vdata.end(), n_features, 0);  // Add at least 1 row of 0, otherwise the model has trouble getting output
+  };
+
+  for (unsigned igroup = 0; igroup < input_names_.size(); ++igroup) {
+    const auto &group_name = input_names_[igroup];
+    auto &input = iInput.at(group_name);
+
+    // number of rows of this tensor: at least one, even if the group is empty
+    unsigned int target = 0;
+    switch (igroup) {
+      case kChargedCandidates:
+      case kChargedCandidates4Vec:
+        target = std::max(1u, max_n_cpf);
+        break;
+      case kNeutralCandidates:
+      case kNeutralCandidates4Vec:
+        target = std::max(1u, max_n_npf);
+        break;
+      case kVertices:
+      case kVertices4Vec:
+        target = std::max(1u, max_n_vtx);
+        break;
+      default:
+        break;
+    }
+
+    input.setShape(0, target);
+    auto tdata = input.allocate<float>(true);
+    for (unsigned jet_n = 0; jet_n < tag_infos->size(); ++jet_n) {
+      const auto &features = (*tag_infos)[jet_n].features();
+      auto &vdata = (*tdata)[jet_n];
+      switch (igroup) {
+        case kChargedCandidates:
+          fill_rows(vdata, features.c_pf_features, n_cpf_accept, max_n_cpf, n_features_cpf_, push_cpf);
+          break;
+        case kNeutralCandidates:
+          fill_rows(vdata, features.n_pf_features, n_npf_accept, max_n_npf, n_features_npf_, push_npf);
+          break;
+        case kVertices:
+          fill_rows(vdata, features.sv_features, n_sv_accept, max_n_vtx, n_features_sv_, push_sv);
+          break;
+        case kChargedCandidates4Vec:
+          fill_rows(vdata, features.c_pf_features, n_cpf_accept, max_n_cpf, n_pairwise_features_cpf_, push_p4);
+          break;
+        case kNeutralCandidates4Vec:
+          fill_rows(vdata, features.n_pf_features, n_npf_accept, max_n_npf, n_pairwise_features_npf_, push_p4);
+          break;
+        case kVertices4Vec:
+          fill_rows(vdata, features.sv_features, n_sv_accept, max_n_vtx, n_pairwise_features_sv_, push_p4);
+          break;
+        default:
+          break;
+      }
+    }
+    input.toServer(tdata);
+  }
+}
+
+// Stores one JetTagCollection per flavour name in the event.
+// A jet gets the scores returned by the server when inference ran and its
+// features are filled; otherwise every flavour score of that jet is -1.
+// With no jets in the event, empty collections are stored.
+void ParticleTransformerAK4SonicJetTagsProducer::produce(edm::Event& iEvent, const edm::EventSetup& iSetup, Output const &iOutput) {
+  edm::Handle<TagInfoCollection> tag_infos;
+  iEvent.getByToken(src_, tag_infos);
+
+  const std::size_t n_flav = flav_names_.size();
+  const bool has_jets = !tag_infos->empty();
+
+  // book the output collections, keyed on the jet collection of the first tag info when there is one
+  std::vector<std::unique_ptr<JetTagCollection>> output_tags;
+  if (has_jets) {
+    auto jet_ref = tag_infos->begin()->jet();
+    auto ref2prod = edm::makeRefToBaseProdFrom(jet_ref, iEvent);
+    for (std::size_t flav_n = 0; flav_n < n_flav; ++flav_n) {
+      output_tags.emplace_back(std::make_unique<JetTagCollection>(ref2prod));
+    }
+  } else {
+    for (std::size_t flav_n = 0; flav_n < n_flav; ++flav_n) {
+      output_tags.emplace_back(std::make_unique<JetTagCollection>());
+    }
+  }
+
+  // gives one jet the default score for every flavour
+  const auto fill_default = [&output_tags, n_flav](const auto &jet_ref) {
+    for (std::size_t flav_n = 0; flav_n < n_flav; ++flav_n) {
+      (*(output_tags[flav_n]))[jet_ref] = -1.0;
+    }
+  };
+
+  if (has_jets && skippedInference_) {
+    // no request was sent for this event: nothing to read back
+    for (unsigned jet_n = 0; jet_n < tag_infos->size(); ++jet_n) {
+      fill_default(tag_infos->at(jet_n).jet());
+    }
+  } else if (has_jets) {
+    // only the first output of the response is read
+    const auto &output1 = iOutput.begin()->second;
+    const auto &outputs_from_server = output1.fromServer<float>();
+
+    for (unsigned jet_n = 0; jet_n < tag_infos->size(); ++jet_n) {
+      const auto &taginfo = (*tag_infos)[jet_n];
+      const auto &jet_ref = tag_infos->at(jet_n).jet();
+
+      if (!taginfo.features().is_filled) {
+        fill_default(jet_ref);
+        continue;
+      }
+      for (std::size_t flav_n = 0; flav_n < n_flav; ++flav_n) {
+        (*(output_tags[flav_n]))[jet_ref] = outputs_from_server[jet_n][flav_n];
+      }
+    }
+  }
+
+  // put into the event
+  for (std::size_t flav_n = 0; flav_n < n_flav; ++flav_n) {
+    iEvent.put(std::move(output_tags[flav_n]), flav_names_[flav_n]);
+  }
+}
+
+//define this as a plug-in
+DEFINE_FWK_MODULE(ParticleTransformerAK4SonicJetTagsProducer);
diff --git a/RecoBTag/ONNXRuntime/python/pfParticleTransformerAK4_cff.py b/RecoBTag/ONNXRuntime/python/pfParticleTransformerAK4_cff.py
@@ -4,8 +4,26 @@
 
 from RecoBTag.ONNXRuntime.pfParticleTransformerAK4JetTags_cfi import pfParticleTransformerAK4JetTags
 from RecoBTag.ONNXRuntime.pfParticleTransformerAK4DiscriminatorsJetTags_cfi import pfParticleTransformerAK4DiscriminatorsJetTags
+from RecoBTag.ONNXRuntime.pfParticleTransformerAK4SonicJetTags_cfi import pfParticleTransformerAK4SonicJetTags as _pfParticleTransformerAK4SonicJetTags
 from CommonTools.PileupAlgos.Puppi_cff import puppi
 from CommonTools.RecoAlgos.primaryVertexAssociation_cfi import primaryVertexAssociation
+from Configuration.ProcessModifiers.particleTransformerAK4SonicTriton_cff import particleTransformerAK4SonicTriton
+
+
+particleTransformerAK4SonicTriton.toReplaceWith(pfParticleTransformerAK4JetTags, _pfParticleTransformerAK4SonicJetTags.clone(  # with this modifier active, the Sonic producer replaces pfParticleTransformerAK4JetTags
+    Client = cms.PSet(
+        timeout = cms.untracked.uint32(300),
+        mode = cms.string("Async"),
+        modelName = cms.string("particletransformer_AK4"), # TODO: double-check this model name
+        modelConfigPath = cms.FileInPath("RecoBTag/Combined/data/models/particletransformer_AK4/config.pbtxt"), # NOTE: these SONIC model files are not currently in CMSSW, so the models/ directory has to be copied to this location privately
+        modelVersion = cms.string(""),
+        verbose = cms.untracked.bool(False),
+        allowedTries = cms.untracked.uint32(0),
+        useSharedMemory = cms.untracked.bool(True),
+        compression = cms.untracked.string(""),
+    ),
+    flav_names = pfParticleTransformerAK4JetTags.flav_names,  # keep the flavour labels of the module being replaced
+))
 
 # declare all the discriminators
 # probs
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,3 @@
		import FWCore.ParameterSet.Config as cms

		particleTransformerAK4SonicTriton = cms.Modifier()