Skip to content

Commit

Permalink
Merge pull request #43941 from riga/aot_interface_14_1_X
Browse files Browse the repository at this point in the history
Add TF AOT interface.
  • Loading branch information
cmsbuild authored Mar 14, 2024
2 parents 5669353 + 1e5643c commit 16ae21f
Show file tree
Hide file tree
Showing 19 changed files with 1,672 additions and 2 deletions.
2 changes: 1 addition & 1 deletion PhysicsTools/TensorFlow/test/createconstantgraph.py
Original file line number Diff line number Diff line change
Expand Up @@ -47,4 +47,4 @@
# write it
graph_path = os.path.join(datadir, "constantgraph.pb")
outputs = ["output"]
cmsml.tensorflow.save_graph(graph_path, sess, output_names=outputs, variables_to_constants=True)
cmsml.tensorflow.save_frozen_graph(graph_path, sess, output_names=outputs, variables_to_constants=True)
2 changes: 1 addition & 1 deletion PhysicsTools/TensorFlow/test/readconstantgraph.py
Original file line number Diff line number Diff line change
Expand Up @@ -24,5 +24,5 @@

# read and evaluate the graph
graph_path = os.path.join(datadir, "constantgraph.pb")
graph, sess = cmsml.tensorflow.load_graph(graph_path, create_session=True)
graph, sess = cmsml.tensorflow.load_frozen_graph(graph_path, create_session=True)
print(sess.run("output:0", feed_dict={"scale:0": 1.0, "input:0": [range(10)]})[0][0])
7 changes: 7 additions & 0 deletions PhysicsTools/TensorFlowAOT/BuildFile.xml
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
<!-- Build rules for the PhysicsTools/TensorFlowAOT package. -->
<!-- Runtime support for models AOT-compiled with TensorFlow's XLA (tfcompile). -->
<use name="tensorflow-xla-runtime"/>
<!-- cms::Exception used by the interface headers -->
<use name="FWCore/Utilities"/>

<export>
<!-- NOTE(review): name="1" appears to export the library under the package's default
     name per scram convention - confirm against the build documentation -->
<lib name="1"/>
</export>
78 changes: 78 additions & 0 deletions PhysicsTools/TensorFlowAOT/interface/Batching.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,78 @@
#ifndef PHYSICSTOOLS_TENSORFLOWAOT_BATCHING_H
#define PHYSICSTOOLS_TENSORFLOWAOT_BATCHING_H

/*
* AOT batching rules and strategies.
*
* Author: Marcel Rieger, Bogdan Wiederspan
*/

#include <cstddef>
#include <vector>
#include <map>
#include <ostream>

namespace tfaot {

// rule defining how a certain batch size should be composed of various smaller sizes plus an
// optional padding that is applied to the last size
// (e.g. a batch size of 5 could be composed of the sizes {2, 4} with a last padding of 1, so the
// final element of the second, padded evaluation is a dummy)
class BatchRule {
public:
// constructor; defined out of line - presumably validates that sizes and lastPadding compose
// batchSize, confirm in the implementation
explicit BatchRule(size_t batchSize, const std::vector<size_t>& sizes, size_t lastPadding = 0);

// destructor
~BatchRule() = default;

// getter for the target batch size this rule composes
size_t getBatchSize() const { return batchSize_; }

// getter for the smaller sizes the batch size is composed of
const std::vector<size_t>& getSizes() const { return sizes_; }

// getter for the padding applied to the last size
size_t getLastPadding() const { return lastPadding_; }

// returns the number of available sizes
size_t nSizes() const { return sizes_.size(); }

// getter for the registered size at index i (unchecked access, i must be < nSizes())
size_t getSize(size_t i) const { return sizes_[i]; }

private:
size_t batchSize_;           // composed batch size
std::vector<size_t> sizes_;  // smaller sizes composing batchSize_
size_t lastPadding_;         // padding applied to the last entry of sizes_
};

// stream operator printing a human-readable representation of the rule (defined out of line)
std::ostream& operator<<(std::ostream& out, const BatchRule& rule);

// the batch strategy is a collection of batch rules registered to certain batch sizes
class BatchStrategy {
public:
// constructor, starting with no registered rules
explicit BatchStrategy() = default;

// destructor
~BatchStrategy() = default;

// registers a new rule for a batch size, replacing a previously registered one for the same size
void setRule(const BatchRule& rule) { rules_.insert_or_assign(rule.getBatchSize(), rule); }

// returns whether a rule was already registered for a certain batch size
bool hasRule(size_t batchSize) const { return rules_.find(batchSize) != rules_.end(); }

// returns a rule registered previously for a certain batch size
// (defined out of line; presumably throws when no rule exists - confirm in the implementation)
const BatchRule& getRule(size_t batchSize) const;

// registers a new rule for a certain batch size according to a certain algorithm, choosing from
// the given available (compiled) batch sizes (defined out of line)
void setDefaultRule(size_t batchSize, const std::vector<size_t>& availableBatchSizes);

private:
// mapping from batch size to the rule that composes it
std::map<size_t, BatchRule> rules_;
};

} // namespace tfaot

#endif // PHYSICSTOOLS_TENSORFLOWAOT_BATCHING_H
168 changes: 168 additions & 0 deletions PhysicsTools/TensorFlowAOT/interface/Model.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,168 @@
#ifndef PHYSICSTOOLS_TENSORFLOWAOT_MODEL_H
#define PHYSICSTOOLS_TENSORFLOWAOT_MODEL_H

/*
* AOT model interface.
*
* Author: Marcel Rieger, Bogdan Wiederspan
*/

#include <algorithm>
#include <cstddef>
#include <memory>
#include <string>
#include <tuple>
#include <vector>

#include "FWCore/Utilities/interface/Exception.h"

#include "PhysicsTools/TensorFlowAOT/interface/Util.h"
#include "PhysicsTools/TensorFlowAOT/interface/Batching.h"

namespace tfaot {

// model interface receiving the AOT wrapper type as a template argument
template <class W>
class Model {
public:
  // constructor, instantiating the compiled wrapper
  explicit Model() : wrapper_(std::make_unique<W>()) {}

  // destructor; defaulted since the unique_ptr releases the wrapper by itself
  // (the previous explicit wrapper_.reset() was redundant)
  ~Model() = default;

  // getter for the name
  const std::string& name() const { return wrapper_->name(); }

  // setter for the batch strategy
  void setBatchStrategy(const BatchStrategy& strategy) { batchStrategy_ = strategy; }

  // getter for the batch strategy
  const BatchStrategy& getBatchStrategy() const { return batchStrategy_; }

  // adds a new batch rule to the strategy
  void setBatchRule(size_t batchSize, const std::vector<size_t>& sizes, size_t lastPadding = 0) {
    batchStrategy_.setRule(BatchRule(batchSize, sizes, lastPadding));
  }

  // evaluates the model for multiple inputs and outputs of different types
  template <typename... Outputs, typename... Inputs>
  std::tuple<Outputs...> run(size_t batchSize, Inputs&&... inputs);

private:
  std::unique_ptr<W> wrapper_;
  BatchStrategy batchStrategy_;

  // ensures that a batch rule exists for a certain batch size, and if not, registers a new one
  // based on the default algorithm
  const BatchRule& ensureRule(size_t batchSize);

  // reserves memory in a nested (batched) vector to accommodate the result output at an index
  template <typename T>
  void reserveOutput(size_t batchSize, size_t resultIndex, std::vector<std::vector<T>>& data) const;

  // injects data of a specific batch element into the argument data at an index
  template <typename T>
  void injectBatchInput(size_t batchSize, size_t batchIndex, size_t argIndex, const std::vector<T>& batchData);

  // extracts result data at an index into a specific batch
  template <typename T>
  void extractBatchOutput(size_t batchSize, size_t batchIndex, size_t resultIndex, std::vector<T>& batchData) const;
};

// lazily provides the batch rule for a batch size, registering a default one on first use
template <class W>
const BatchRule& Model<W>::ensureRule(size_t batchSize) {
  const bool known = batchStrategy_.hasRule(batchSize);
  if (!known) {
    // no rule yet for this batch size, derive one from the sizes the wrapper was compiled for
    batchStrategy_.setDefaultRule(batchSize, wrapper_->batchSizes());
  }
  return batchStrategy_.getRule(batchSize);
}

// allocates one inner vector per batch element, each sized to the per-element result count
template <class W>
template <typename T>
void Model<W>::reserveOutput(size_t batchSize, size_t resultIndex, std::vector<std::vector<T>>& data) const {
  const size_t nValues = wrapper_->resultCountNoBatch(resultIndex);
  data.resize(batchSize, std::vector<T>(nValues));
}

// copies the values of one batch element into its slot of the wrapper's argument buffer
template <class W>
template <typename T>
void Model<W>::injectBatchInput(size_t batchSize,
                                size_t batchIndex,
                                size_t argIndex,
                                const std::vector<T>& batchData) {
  // number of values a single batch element contributes to this argument
  const size_t nValues = wrapper_->argCountNoBatch(argIndex);
  if (batchData.size() != nValues) {
    throw cms::Exception("InputMismatch")
        << "model '" << name() << "' received " << batchData.size() << " elements for argument " << argIndex
        << ", but " << nValues << " are expected";
  }
  // destination within the argument buffer, offset by the batch element's position
  T* dst = wrapper_->template argData<T>(batchSize, argIndex) + batchIndex * nValues;
  std::copy(batchData.cbegin(), batchData.cend(), dst);
}

// copies one batch element's values out of the wrapper's result buffer into batchData
template <class W>
template <typename T>
void Model<W>::extractBatchOutput(size_t batchSize,
                                  size_t batchIndex,
                                  size_t resultIndex,
                                  std::vector<T>& batchData) const {
  // number of values a single batch element occupies in this result
  const size_t nValues = wrapper_->resultCountNoBatch(resultIndex);
  // source within the result buffer, offset by the batch element's position
  const T* src = wrapper_->template resultData<T>(batchSize, resultIndex) + batchIndex * nValues;
  batchData.assign(src, src + nValues);
}

// evaluates the model for an arbitrary batch size by decomposing it into the (smaller) batch
// sizes of the compiled wrapper according to the registered batch rule, stitching inputs and
// outputs back together across the partial evaluations
template <class W>
template <typename... Outputs, typename... Inputs>
std::tuple<Outputs...> Model<W>::run(size_t batchSize, Inputs&&... inputs) {
  // check the number of inputs against the number of model arguments
  constexpr size_t nInputs = sizeof...(Inputs);
  if (nInputs != wrapper_->nArgs()) {
    throw cms::Exception("InputMismatch")
        << "model '" << name() << "' received " << nInputs << " inputs, but " << wrapper_->nArgs() << " are expected";
  }

  // check the number of outputs against the number of model results
  constexpr size_t nOutputs = sizeof...(Outputs);
  if (nOutputs != wrapper_->nResults()) {
    throw cms::Exception("OutputMismatch") << "requested " << nOutputs << " from model '" << name() << "', but "
                                           << wrapper_->nResults() << " are provided";
  }

  // each input must provide exactly one entry per batch element, as the loops below index the
  // inputs up to batchSize - 1 (previously unchecked, an undersized input read out of bounds)
  ([&] {
    if (inputs.size() != batchSize) {
      throw cms::Exception("InputMismatch") << "model '" << name() << "' received an input with " << inputs.size()
                                            << " batch elements, but " << batchSize << " are expected";
    }
  }(),
   ...);

  // get the corresponding batch rule, registering a default one if missing
  const BatchRule& rule = ensureRule(batchSize);

  // create a callback that invokes lambdas over all outputs with compile-time indices
  auto forEachOutput = createIndexLooper<sizeof...(Outputs)>();

  // reserve output arrays (one inner vector per batch element)
  std::tuple<Outputs...> outputs;
  forEachOutput([&](auto resultIndex) { reserveOutput(batchSize, resultIndex, std::get<resultIndex>(outputs)); });

  // loop over particular batch sizes, copy input, evaluate and compose the output
  size_t batchOffset = 0;
  size_t nSizes = rule.nSizes();
  for (size_t i = 0; i < nSizes; i++) {
    // get actual model batch size and optional padding (only the last size may be padded)
    size_t bs = rule.getSize(i);
    size_t padding = (i == nSizes - 1) ? rule.getLastPadding() : 0;

    // fill inputs separately per batch element; padded elements are left untouched and their
    // corresponding outputs are never read back
    for (size_t batchIndex = 0; batchIndex < bs - padding; batchIndex++) {
      size_t argIndex = 0;
      ([&] { injectBatchInput(bs, batchIndex, argIndex++, inputs[batchOffset + batchIndex]); }(), ...);
    }

    // model evaluation
    wrapper_->run(bs);

    // fill outputs separately per batch element
    for (size_t batchIndex = 0; batchIndex < bs - padding; batchIndex++) {
      forEachOutput([&](auto resultIndex) {
        extractBatchOutput(bs, batchIndex, resultIndex, std::get<resultIndex>(outputs)[batchOffset + batchIndex]);
      });
    }

    batchOffset += bs;
  }

  return outputs;
}

} // namespace tfaot

#endif // PHYSICSTOOLS_TENSORFLOWAOT_MODEL_H
41 changes: 41 additions & 0 deletions PhysicsTools/TensorFlowAOT/interface/Util.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,41 @@
#ifndef PHYSICSTOOLS_TENSORFLOWAOT_UTIL_H
#define PHYSICSTOOLS_TENSORFLOWAOT_UTIL_H

/*
* AOT utils and type definitions.
*
* Author: Marcel Rieger, Bogdan Wiederspan
*/

#include <type_traits>
#include <utility>
#include <vector>

#include "tensorflow/compiler/tf2xla/xla_compiled_cpu_function.h"
#include "tensorflow/core/platform/types.h"

namespace tfaot {

// type aliases (modernized from typedef to using declarations)
// allocation mode enum of TF's compiled XLA function (see XlaCompiledCpuFunction)
using AllocMode = tensorflow::XlaCompiledCpuFunction::AllocMode;
// nested vectors representing batched per-element input / output data for each supported type
using BoolArrays = std::vector<std::vector<bool>>;
using Int32Arrays = std::vector<std::vector<int32_t>>;
using Int64Arrays = std::vector<std::vector<int64_t>>;
using FloatArrays = std::vector<std::vector<float>>;
using DoubleArrays = std::vector<std::vector<double>>;

// builds a callable that, given a function, invokes it once per index of the sequence, passing
// each index as a std::integral_constant (usable as a compile-time constant by the callee)
template <size_t... Is>
auto createIndexLooper(std::index_sequence<Is...>) {
  return [](auto&& func) {
    // fold over the comma operator to call func for every index
    (func(std::integral_constant<size_t, Is>{}), ...);
  };
}

// convenience overload covering the contiguous index range [0, N)
template <size_t N>
auto createIndexLooper() {
  return createIndexLooper(std::make_index_sequence<N>{});
}

} // namespace tfaot

#endif // PHYSICSTOOLS_TENSORFLOWAOT_UTIL_H
Loading

0 comments on commit 16ae21f

Please sign in to comment.