ReduceLayer && OneDNN (#266)

Semyon1104 · web-flow · commit 5e23309bd3e6 · 2026-02-11T19:37:35.000+01:00
diff --git a/app/Graph/build.cpp b/app/Graph/build.cpp
@@ -760,8 +760,8 @@ ParseResult parse_json_model(RuntimeOptions options,
             keepdims = attributes["keepdims"].get<int64_t>();
           }
         }
-        auto reduce_layer = std::make_shared<it_lab_ai::ReduceLayer>(
-            it_lab_ai::ReduceLayer::Operation::kMean, keepdims, axes);
+        auto reduce_layer = LayerFactory::createReduceLayer(
+            it_lab_ai::ReduceLayer::Operation::kMean, keepdims, axes, options);
         layer = reduce_layer;
       } else if (layer_type == "ReduceSum") {
         int64_t keepdims = 0;
@@ -787,8 +787,8 @@ ParseResult parse_json_model(RuntimeOptions options,
             }
           }
         }
-        auto reduce_layer = std::make_shared<it_lab_ai::ReduceLayer>(
-            it_lab_ai::ReduceLayer::Operation::kSum, keepdims, axes);
+        auto reduce_layer = LayerFactory::createReduceLayer(
+            it_lab_ai::ReduceLayer::Operation::kSum, keepdims, axes, options);
         layer = reduce_layer;
       } else if (layer_type == "Constant") {
         if (layer_data.contains("attributes")) {
diff --git a/app/Graph/build.hpp b/app/Graph/build.hpp
@@ -35,6 +35,7 @@
 #include "layers_oneDNN/ConvLayer.hpp"
 #include "layers_oneDNN/EWLayer.hpp"
 #include "layers_oneDNN/PoolingLayer.hpp"
+#include "layers_oneDNN/ReduceLayer.hpp"
 
 extern std::unordered_map<std::string, std::string> model_paths;
 
@@ -101,6 +102,15 @@ class LayerFactory {
                                                 bias, group, useLegacyImpl);
   }
 
+  static std::shared_ptr<Layer> createReduceLayer(  // Factory: picks the reduce-layer class from options.backend.
+      ReduceLayer::Operation op, int64_t keepdims,  // op/keepdims/axes are forwarded unchanged to the chosen constructor.
+      const std::vector<int64_t>& axes, const RuntimeOptions& options) {
+    if (options.backend == Backend::kOneDnn) {  // Only the kOneDnn backend selects the oneDNN class.
+      return std::make_shared<ReduceLayerOneDnn>(op, keepdims, axes);
+    }
+    return std::make_shared<ReduceLayer>(op, keepdims, axes);  // Every other backend value gets the plain ReduceLayer.
+  }
+
   static std::shared_ptr<Layer> createPoolingLayer(
       const std::string& PoolType, const Shape& shape,
       const RuntimeOptions& options, const Shape& strides = {2, 2},
diff --git a/include/layers/Shape.hpp b/include/layers/Shape.hpp
@@ -57,6 +57,7 @@ class Shape {
     }
     return true;
   }
+  void push_back(size_t value) { dims_.push_back(value); }  // Forwards to dims_.push_back; dims_ is declared outside this hunk (presumably the dimension list — confirm).
 
   bool operator!=(const Shape& other) const { return !(*this == other); }
   friend std::ostream& operator<<(std::ostream& os, const Shape& shape);
diff --git a/include/layers_oneDNN/ReduceLayer.hpp b/include/layers_oneDNN/ReduceLayer.hpp
@@ -0,0 +1,83 @@
+#pragma once
+#include <cstdint>
+#include <dnnl.hpp>
+#include <memory>
+#include <vector>
+
+#include "layers/Layer.hpp"
+#include "layers/ReduceLayer.hpp"
+#include "layers/Tensor.hpp"
+
+namespace it_lab_ai {
+
+class ReduceLayerOneDnn : public Layer {  // Layer subclass holding a reduce operation, keepdims value, axes and oneDNN handles.
+ public:
+  ReduceLayerOneDnn(ReduceLayer::Operation op, int64_t keepdims,  // Stores op, keepdims and axes as given.
+                    const std::vector<int64_t>& axes)
+      : Layer(kReduce), op_(op), keepdims_(keepdims), axes_(axes) {}  // The Layer base is constructed with kReduce.
+
+  explicit ReduceLayerOneDnn(int64_t keepdims = 0,  // Overload without an operation argument.
+                             const std::vector<int64_t>& axes = {})
+      : ReduceLayerOneDnn(ReduceLayer::Operation::kSum, keepdims, axes) {}  // Delegates with Operation::kSum.
+
+  void run(const std::vector<Tensor>& input,  // Overrides Layer::run; defined out of line (not in this header).
+           std::vector<Tensor>& output) override;
+
+  void set_axes(const std::vector<int64_t>& axes) {  // Replaces the stored axes.
+    axes_ = axes;
+    initialized_ = false;  // Presumably makes the next run() rebuild oneDNN state — confirm in the .cpp.
+  }
+
+  void set_keepdims(int64_t keepdims) {  // Replaces the stored keepdims value.
+    keepdims_ = keepdims;
+    initialized_ = false;  // Same flag reset as in set_axes().
+  }
+
+  void set_operation(ReduceLayer::Operation op) {  // Replaces the stored operation.
+    op_ = op;
+    initialized_ = false;  // Same flag reset as in set_axes().
+  }
+
+#ifdef ENABLE_STATISTIC_WEIGHTS
+  Tensor get_weights() override { return Tensor(); }  // Returns a default-constructed Tensor.
+#endif
+
+ private:
+  ReduceLayer::Operation op_;  // Set by the constructor or set_operation().
+  int64_t keepdims_;  // Set by the constructor or set_keepdims().
+  std::vector<int64_t> axes_;  // Set by the constructor or set_axes().
+  std::vector<int64_t> normalized_axes_;  // Presumably axes_ after normalize_axes(); written in the .cpp — confirm.
+  std::vector<int64_t> last_axes_;  // last_* members: presumably describe the previous initialization — confirm.
+
+  bool initialized_ = false;  // Starts false; every setter above resets it to false.
+  Shape last_input_shape_;
+  Type last_type_;  // NOTE(review): no default initializer, unlike initialized_; confirm it is written before it is read.
+
+  std::unique_ptr<dnnl::engine> engine_;  // The three unique_ptr members start null; no assignment is visible in this header.
+  std::unique_ptr<dnnl::stream> stream_;
+  std::unique_ptr<dnnl::reduction> reduction_prim_;
+
+  dnnl::memory::desc src_md_;  // Default-constructed descriptors; filled outside this header.
+  dnnl::memory::desc dst_md_;
+  Shape output_shape_;
+
+  void initialize_onednn(const Tensor& input);  // Helpers below are declarations only; bodies are not in this header.
+  static void validate_input(const std::vector<Tensor>& input);
+  [[nodiscard]] static dnnl::memory::data_type get_dnnl_data_type(Type type);
+  [[nodiscard]] static dnnl::algorithm get_dnnl_algorithm(
+      ReduceLayer::Operation op);
+  [[nodiscard]] static dnnl::memory::format_tag pick_format(size_t ndims);
+  static void normalize_axes(const Shape& input_shape,  // Takes axes by non-const reference, so it can modify them in place.
+                             std::vector<int64_t>& axes);
+  [[nodiscard]] Shape calculate_output_shape(
+      const Shape& input_shape, const std::vector<int64_t>& axes) const;
+
+  [[nodiscard]] static std::vector<dnnl::memory::dim> shape_to_dims(
+      const Shape& shape);
+  template <typename T>  // NOTE(review): member template is only declared here; its definition must be visible wherever it is instantiated.
+  std::vector<T> remove_unit_dims(const std::vector<T>& src_data,
+                                  const Shape& src_shape,
+                                  const Shape& dst_shape);
+};
+
+}  // namespace it_lab_ai
diff --git a/src/layers_oneDNN/ReduceLayer.cpp b/src/layers_oneDNN/ReduceLayer.cpp
diff --git a/test/single_layer_onednn_version/test_reducelayer_onednn.cpp b/test/single_layer_onednn_version/test_reducelayer_onednn.cpp

Original file line number	Diff line number	Diff line change
`@@ -760,8 +760,8 @@ ParseResult parse_json_model(RuntimeOptions options,`
`760`	`760`	`keepdims = attributes["keepdims"].get<int64_t>();`
`761`	`761`	`}`
`762`	`762`	`}`
`763`		`- auto reduce_layer = std::make_shared<it_lab_ai::ReduceLayer>(`
`764`		`- it_lab_ai::ReduceLayer::Operation::kMean, keepdims, axes);`
	`763`	`+ auto reduce_layer = LayerFactory::createReduceLayer(`
	`764`	`+ it_lab_ai::ReduceLayer::Operation::kMean, keepdims, axes, options);`
`765`	`765`	`layer = reduce_layer;`
`766`	`766`	`} else if (layer_type == "ReduceSum") {`
`767`	`767`	`int64_t keepdims = 0;`
`@@ -787,8 +787,8 @@ ParseResult parse_json_model(RuntimeOptions options,`
`787`	`787`	`}`
`788`	`788`	`}`
`789`	`789`	`}`
`790`		`- auto reduce_layer = std::make_shared<it_lab_ai::ReduceLayer>(`
`791`		`- it_lab_ai::ReduceLayer::Operation::kSum, keepdims, axes);`
	`790`	`+ auto reduce_layer = LayerFactory::createReduceLayer(`
	`791`	`+ it_lab_ai::ReduceLayer::Operation::kSum, keepdims, axes, options);`
`792`	`792`	`layer = reduce_layer;`
`793`	`793`	`} else if (layer_type == "Constant") {`
`794`	`794`	`if (layer_data.contains("attributes")) {`
Original file line number	Diff line number	Diff line change
`@@ -57,6 +57,7 @@ class Shape {`
`57`	`57`	`}`
`58`	`58`	`return true;`
`59`	`59`	`}`
	`60`	`+ void push_back(size_t value) { dims_.push_back(value); }`
`60`	`61`
`61`	`62`	`bool operator!=(const Shape& other) const { return !(*this == other); }`
`62`	`63`	`friend std::ostream& operator<<(std::ostream& os, const Shape& shape);`