@@ -134,22 +134,38 @@ template <typename ValueType>
void Conv4D(const Tensor& input, const Tensor& kernel_, const Tensor& bias_,
            Tensor& output, size_t stride_, size_t pads_, size_t dilations_) {
  size_t batch_size = input.get_shape()[0];
+  size_t in_channels = input.get_shape()[1];
  size_t in_height = input.get_shape()[2];
  size_t in_width = input.get_shape()[3];
-  size_t in_channels = input.get_shape()[1];

-  size_t kernel_height = kernel_.get_shape()[0];
-  size_t kernel_width = kernel_.get_shape()[1];
-  size_t kernel_in_channels = kernel_.get_shape()[2];
-  size_t kernel_out_channels = kernel_.get_shape()[3];
+  size_t out_channels = kernel_.get_shape()[0];        // O
+  size_t kernel_in_channels = kernel_.get_shape()[1];  // I
+  size_t kernel_height = kernel_.get_shape()[2];       // H
+  size_t kernel_width = kernel_.get_shape()[3];        // W
+
+  /* if (in_channels != kernel_in_channels) {
+    throw std::runtime_error(
+        "Input channels don't match kernel input channels");
+  }*/
+
+  // Compute the output spatial dimensions
+  size_t out_height =
+      (in_height + 2 * pads_ - dilations_ * (kernel_height - 1) - 1) / stride_ +
+      1;
+  size_t out_width =
+      (in_width + 2 * pads_ - dilations_ * (kernel_width - 1) - 1) / stride_ +
+      1;
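+  // Integer division floors here, so any partial window at the border is dropped.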
+
+  // Pad input
+  std::vector<std::vector<std::vector<std::vector<ValueType>>>> padded_input(
+      batch_size,
+      std::vector<std::vector<std::vector<ValueType>>>(
+          in_height + 2 * pads_,
+          std::vector<std::vector<ValueType>>(
+              in_width + 2 * pads_, std::vector<ValueType>(in_channels, 0))));
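+  // Note: padded_input is indexed [b][h][w][c] (NHWC), unlike the NCHW output below.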

-  std::vector<std::vector<std::vector<std::vector<ValueType>>>> padded_input =
-      std::vector<std::vector<std::vector<std::vector<ValueType>>>>(
-          batch_size, std::vector<std::vector<std::vector<ValueType>>>(
-                          in_height + 2 * pads_,
-                          std::vector<std::vector<ValueType>>(
-                              in_width + 2 * pads_,
-                              std::vector<ValueType>(in_channels, 0))));
  for (size_t b = 0; b < batch_size; ++b) {
    for (size_t h = 0; h < in_height; ++h) {
      for (size_t w = 0; w < in_width; ++w) {
@@ -160,84 +174,92 @@ void Conv4D(const Tensor& input, const Tensor& kernel_, const Tensor& bias_,
      }
    }
  }
-  std::vector<std::vector<std::vector<std::vector<ValueType>>>> dil_kernel =
-      std::vector<std::vector<std::vector<std::vector<ValueType>>>>(
-          kernel_height * dilations_ + 1 - dilations_,
-          std::vector<std::vector<std::vector<ValueType>>>(
-              kernel_width * dilations_ + 1 - dilations_,
-              std::vector<std::vector<ValueType>>(
-                  kernel_in_channels,
-                  std::vector<ValueType>(kernel_out_channels, 0))));
-  for (size_t b = 0; b < kernel_out_channels; ++b) {
-    for (size_t h = 0; h < kernel_height; ++h) {
-      for (size_t w = 0; w < kernel_width; ++w) {
-        for (size_t c = 0; c < kernel_in_channels; ++c) {
-          dil_kernel[h * dilations_][w * dilations_][c][b] =
-              kernel_.get<ValueType>({h, w, c, b});
+
+  // Dilate kernel
+  size_t dilated_kernel_height = (kernel_height - 1) * dilations_ + 1;
+  size_t dilated_kernel_width = (kernel_width - 1) * dilations_ + 1;
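+  // A dilated k-tap filter spans (k - 1) * dilation + 1 pixels, with zeros in the gaps.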
+
+  std::vector<std::vector<std::vector<std::vector<ValueType>>>> dil_kernel(
+      out_channels,
+      std::vector<std::vector<std::vector<ValueType>>>(
+          in_channels, std::vector<std::vector<ValueType>>(
+                           dilated_kernel_height,
+                           std::vector<ValueType>(dilated_kernel_width, 0))));
+
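+  // Scatter each original tap onto the dilated grid; the gaps stay zero.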
+  for (size_t oc = 0; oc < out_channels; ++oc) {
+    for (size_t ic = 0; ic < in_channels; ++ic) {
+      for (size_t kh = 0; kh < kernel_height; ++kh) {
+        for (size_t kw = 0; kw < kernel_width; ++kw) {
+          dil_kernel[oc][ic][kh * dilations_][kw * dilations_] =
+              kernel_.get<ValueType>({oc, ic, kh, kw});
        }
      }
    }
  }

-  size_t crat = 0;
-  if ((in_height + 2 * pads_ - dilations_ * (kernel_height - 1)) % stride_ != 0)
-    crat = 1;
-
-  size_t out_height =
-      (in_height + 2 * pads_ - dilations_ * (kernel_height - 1)) / stride_ +
-      crat;
-
-  crat = 0;
-  if ((in_width + 2 * pads_ - dilations_ * (kernel_width - 1)) % stride_ != 0)
-    crat = 1;
-
-  size_t out_width =
-      (in_width + 2 * pads_ - dilations_ * (kernel_width - 1)) / stride_ + crat;
-
+  // Perform the convolution
  std::vector<std::vector<std::vector<std::vector<ValueType>>>> output_tensor(
-      batch_size, std::vector<std::vector<std::vector<ValueType>>>(
-                      kernel_out_channels,
-                      std::vector<std::vector<ValueType>>(
-                          out_height, std::vector<ValueType>(out_width, 0))));
+      batch_size,
+      std::vector<std::vector<std::vector<ValueType>>>(
+          out_channels, std::vector<std::vector<ValueType>>(
+                            out_height, std::vector<ValueType>(out_width, 0))));
+
  for (size_t b = 0; b < batch_size; ++b) {
-    for (size_t c = 0; c < kernel_out_channels; ++c) {
-      for (size_t i = 0; i < out_height; i += stride_) {
-        for (size_t j = 0; j < out_width; j += stride_) {
+    for (size_t oc = 0; oc < out_channels; ++oc) {
+      for (size_t oh = 0; oh < out_height; ++oh) {
+        for (size_t ow = 0; ow < out_width; ++ow) {
          ValueType value = 0;
+          size_t h_start = oh * stride_;
+          size_t w_start = ow * stride_;
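+          // (h_start, w_start): top-left corner of this output pixel's receptive field.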
+
          for (size_t ic = 0; ic < in_channels; ++ic) {
-            for (size_t h = 0; h < kernel_height * dilations_ + 1 - dilations_;
-                 ++h) {
-              for (size_t w = 0; w < kernel_width * dilations_ + 1 - dilations_;
-                   ++w) {
-                value +=
-                    padded_input[b][i + h][j + w][ic] * dil_kernel[h][w][ic][c];
+            for (size_t kh = 0; kh < dilated_kernel_height; ++kh) {
+              for (size_t kw = 0; kw < dilated_kernel_width; ++kw) {
+                size_t h_index = h_start + kh;
+                size_t w_index = w_start + kw;
+
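+                // Defensive bounds check; with the floor-based output size these indices stay in range.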
+                if (h_index < padded_input[b].size() &&
+                    w_index < padded_input[b][h_index].size()) {
+                  value += padded_input[b][h_index][w_index][ic] *
+                           dil_kernel[oc][ic][kh][kw];
+                }
              }
            }
          }
-          if (!bias_.empty()) {
-            output_tensor[b][c][i][j] = value + (*bias_.as<ValueType>())[c];
-          } else {
-            output_tensor[b][c][i][j] = value;
+
+          // Add the bias term
+          if (!bias_.empty() && oc < bias_.get_shape()[0]) {
+            value += bias_.get<ValueType>({oc});
          }
+
+          output_tensor[b][oc][oh][ow] = value;
        }
      }
    }
  }

-  Shape sh({batch_size, kernel_out_channels, out_height, out_width});
-  std::vector<ValueType> one_d_vector(batch_size * out_height * out_width *
-                                      kernel_out_channels);
-  size_t index_1d = 0;
-  for (size_t i = 0; i < batch_size; ++i) {
-    for (size_t l = 0; l < kernel_out_channels; ++l) {
-      for (size_t j = 0; j < out_height; ++j) {
-        for (size_t k = 0; k < out_width; ++k) {
-          one_d_vector[index_1d++] = output_tensor[i][l][j][k];
+  // Flatten into a 1D tensor
+  Shape output_shape({batch_size, out_channels, out_height, out_width});
+  std::vector<ValueType> flat_output(batch_size * out_channels * out_height *
+                                     out_width);
+
+  size_t index = 0;
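+  // Row-major NCHW walk: index == ((b * out_channels + oc) * out_height + h) * out_width + w.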
+  for (size_t b = 0; b < batch_size; ++b) {
+    for (size_t oc = 0; oc < out_channels; ++oc) {
+      for (size_t h = 0; h < out_height; ++h) {
+        for (size_t w = 0; w < out_width; ++w) {
+          flat_output[index++] = output_tensor[b][oc][h][w];
        }
      }
    }
  }
-  output = make_tensor<ValueType>(one_d_vector, sh);
+
+  output = make_tensor<ValueType>(flat_output, output_shape);
}

// NCHW -> NCHW only