Skip to content

Commit b576bc9

Browse files
committed
Build DenseNet, ResNet, YOLO, GoogLeNet; ResNet & DenseNet — perfect
1 parent 58ad832 commit b576bc9

File tree

4 files changed

+153
-27
lines changed

4 files changed

+153
-27
lines changed

app/Graph/build.cpp

Lines changed: 8 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -289,6 +289,8 @@ void build_graph(it_lab_ai::Tensor& input, it_lab_ai::Tensor& output,
289289
it_lab_ai::ImplType impl2 = parallel ? it_lab_ai::kSTL : it_lab_ai::kDefault;
290290

291291
std::unordered_map<std::string, std::vector<int64_t>> layer_parameters;
292+
std::string last_constant_name;
293+
std::vector<int64_t> last_constant_value;
292294

293295
std::unordered_map<std::string, std::shared_ptr<it_lab_ai::SplitLayer>>
294296
split_layers;
@@ -814,7 +816,6 @@ void build_graph(it_lab_ai::Tensor& input, it_lab_ai::Tensor& output,
814816
if (comments) {
815817
std::cout << "ReduceSum layer: " << layer_name << std::endl;
816818
}
817-
818819
int64_t keepdims = 0;
819820
if (layer_data.contains("attributes")) {
820821
const auto& attributes = layer_data["attributes"];
@@ -830,12 +831,14 @@ void build_graph(it_lab_ai::Tensor& input, it_lab_ai::Tensor& output,
830831
std::string constant_name = inputs[1].get<std::string>();
831832
constant_name = get_base_layer_name(constant_name);
832833

833-
if (layer_parameters.count(constant_name)) {
834+
if (layer_parameters.count(constant_name)){
834835
axes = layer_parameters[constant_name];
836+
} else if (constant_name.find("onnx::") != constant_name.npos) {
837+
axes = last_constant_value;
838+
layer_parameters[constant_name] = last_constant_value;
835839
}
836840
}
837841
}
838-
839842
auto reduce_layer = std::make_shared<it_lab_ai::ReduceLayer>(
840843
it_lab_ai::ReduceLayer::Operation::kSum, keepdims, axes);
841844
reduce_layer->setName(it_lab_ai::kReduce);
@@ -854,6 +857,8 @@ void build_graph(it_lab_ai::Tensor& input, it_lab_ai::Tensor& output,
854857
data.push_back(val.get<int64_t>());
855858
}
856859
layer_parameters[layer_name] = data;
860+
last_constant_name = layer_name;
861+
last_constant_value = data;
857862
}
858863
}
859864

include/layers/FCLayer.hpp

Lines changed: 43 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -30,24 +30,39 @@ template <typename ValueType>
3030
std::vector<ValueType> mat_vec_mul(const std::vector<ValueType>& mat,
3131
const Shape& mat_shape,
3232
const std::vector<ValueType>& vec) {
33-
size_t c = vec.size() / mat_shape[1];
33+
std::cout << " mat_vec_mul DEBUG:" << std::endl;
34+
std::cout << " Matrix size: " << mat.size() << std::endl;
35+
std::cout << " Matrix shape: [" << mat_shape[0] << ", " << mat_shape[1]
36+
<< "]" << std::endl;
37+
std::cout << " Vector size: " << vec.size() << std::endl;
38+
3439
if (mat_shape.dims() != 2) {
3540
throw std::invalid_argument("Not a matrix in argument");
3641
}
42+
43+
size_t batch_size = vec.size() / mat_shape[0];
44+
std::cout << " Batch size: " << batch_size << std::endl;
45+
46+
if (vec.size() % mat_shape[0] != 0) {
47+
throw std::invalid_argument("Vector size not divisible by matrix rows");
48+
}
49+
3750
Shape res_shape(1);
38-
res_shape[0] = mat_shape[0] * c;
51+
res_shape[0] = mat_shape[1] * batch_size;
3952
std::vector<ValueType> res(res_shape[0]);
53+
std::cout << " Result size: " << res.size() << std::endl;
54+
4055
ValueType elem;
41-
for (size_t count = 0; count < c; count++) {
42-
for (size_t i = 0; i < mat_shape[0]; i++) {
56+
for (size_t batch = 0; batch < batch_size; batch++) {
57+
for (size_t j = 0; j < mat_shape[1]; j++) {
4358
elem = ValueType(0);
44-
for (size_t j = 0; j < mat_shape[1]; j++) {
45-
// due to 1d indexing
46-
elem += mat[i * mat_shape[1] + j] * vec[count * mat_shape[1] + j];
59+
for (size_t i = 0; i < mat_shape[0]; i++) {
60+
elem += mat[i * mat_shape[1] + j] * vec[batch * mat_shape[0] + i];
4761
}
48-
res[count * mat_shape[0] + i] = elem;
62+
res[batch * mat_shape[1] + j] = elem;
4963
}
5064
}
65+
5166
return res;
5267
}
5368

@@ -103,30 +118,40 @@ FCLayerImpl<ValueType>::FCLayerImpl(const std::vector<ValueType>& input_weights,
103118
if (input_weights.empty()) {
104119
throw std::invalid_argument("Empty weights for FCLayer");
105120
}
106-
/*if (input_weights_shape.dims() != 2 ||
107-
input_weights_shape[0] != input_bias.size()) {
108-
throw std::invalid_argument("Invalid weights shape");
109-
}*/
110-
this->inputShape_[0] = input_weights_shape[1];
111-
this->outputShape_[0] = input_bias.size();
121+
122+
// For the transposed weight matrix: [input_size, output_size] = [2048, 1000]
123+
this->inputShape_[0] = input_weights_shape[0]; // input size = 2048
124+
this->outputShape_[0] = input_weights_shape[1]; // output size = 1000
125+
112126
if (this->inputShape_[0] == 0 || this->outputShape_[0] == 0) {
113127
throw std::invalid_argument("Invalid weights/bias size for FCLayer");
114128
}
129+
130+
// Check that the bias size matches the output size
131+
if (input_bias.size() != this->outputShape_[0]) {
132+
throw std::invalid_argument("Bias size doesn't match output size");
133+
}
134+
115135
weights_.resize(input_weights_shape.count(), ValueType(0));
116136
}
117137

118138
template <typename ValueType>
119139
std::vector<ValueType> FCLayerImpl<ValueType>::run(
120140
const std::vector<ValueType>& input) const {
121-
Shape cur_w_shape({this->outputShape_[0], this->inputShape_[0]});
141+
// For the transposed weight matrix: [input_size, output_size] = [2048, 1000]
142+
Shape cur_w_shape({this->inputShape_[0], this->outputShape_[0]});
143+
122144
std::vector<ValueType> output_values =
123145
mat_vec_mul(weights_, cur_w_shape, input);
124-
for (size_t p = 0; p < output_values.size() / bias_.size(); ++p) {
146+
147+
// Add the bias to each element of the output vector
148+
size_t batch_size = output_values.size() / this->outputShape_[0];
149+
for (size_t batch = 0; batch < batch_size; ++batch) {
125150
for (size_t i = 0; i < bias_.size(); ++i) {
126-
output_values[p * bias_.size() + i] += bias_[i];
151+
output_values[batch * this->outputShape_[0] + i] += bias_[i];
127152
}
128153
}
154+
129155
return output_values;
130156
}
131-
132157
} // namespace it_lab_ai

src/layers/FCLayer.cpp

Lines changed: 68 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -16,28 +16,90 @@ void FCLayer::run(const std::vector<Tensor>& input,
1616

1717
// Get batch_size and output_size
1818
size_t batch_size = input[0].get_shape()[0];
19-
size_t output_size =
20-
bias_.get_shape()[0]; // Use the bias size as output_size
19+
size_t output_size = bias_.get_shape()[0];
20+
21+
// Add debug prints
22+
std::cout << "FCLayer DEBUG:" << std::endl;
23+
std::cout << " Input shape: ";
24+
for (size_t d = 0; d < input[0].get_shape().dims(); ++d) {
25+
std::cout << input[0].get_shape()[d] << " ";
26+
}
27+
std::cout << std::endl;
28+
29+
std::cout << " Weights shape: ";
30+
for (size_t d = 0; d < weights_.get_shape().dims(); ++d) {
31+
std::cout << weights_.get_shape()[d] << " ";
32+
}
33+
std::cout << std::endl;
34+
35+
std::cout << " Bias shape: ";
36+
for (size_t d = 0; d < bias_.get_shape().dims(); ++d) {
37+
std::cout << bias_.get_shape()[d] << " ";
38+
}
39+
std::cout << std::endl;
40+
41+
std::cout << " Batch size: " << batch_size << std::endl;
42+
std::cout << " Output size: " << output_size << std::endl;
2143

2244
switch (input[0].get_type()) {
2345
case Type::kInt: {
2446
FCLayerImpl<int> used_impl(*weights_.as<int>(), weights_.get_shape(),
2547
*bias_.as<int>());
26-
output[0] = make_tensor(used_impl.run(*input[0].as<int>()),
27-
{batch_size, output_size});
48+
49+
// Debug print before calling run
50+
std::cout << " Running INT implementation" << std::endl;
51+
52+
auto result = used_impl.run(*input[0].as<int>());
53+
54+
// Debug print after the computation
55+
std::cout << " Result vector size: " << result.size() << std::endl;
56+
std::cout << " Expected output shape: [" << batch_size << ", "
57+
<< output_size << "]" << std::endl;
58+
std::cout << " Expected total elements: " << batch_size * output_size
59+
<< std::endl;
60+
61+
// Check the result size
62+
if (result.size() != batch_size * output_size) {
63+
throw std::runtime_error("Result size mismatch: got " +
64+
std::to_string(result.size()) + ", expected " +
65+
std::to_string(batch_size * output_size));
66+
}
67+
68+
output[0] = make_tensor(result, {batch_size, output_size});
2869
break;
2970
}
3071
case Type::kFloat: {
3172
FCLayerImpl<float> used_impl(*weights_.as<float>(), weights_.get_shape(),
3273
*bias_.as<float>());
33-
output[0] = make_tensor(used_impl.run(*input[0].as<float>()),
34-
{batch_size, output_size});
74+
75+
// Debug print before calling run
76+
std::cout << " Running FLOAT implementation" << std::endl;
77+
78+
auto result = used_impl.run(*input[0].as<float>());
79+
80+
// Debug print after the computation
81+
std::cout << " Result vector size: " << result.size() << std::endl;
82+
std::cout << " Expected output shape: [" << batch_size << ", "
83+
<< output_size << "]" << std::endl;
84+
std::cout << " Expected total elements: " << batch_size * output_size
85+
<< std::endl;
86+
87+
// Check the result size
88+
if (result.size() != batch_size * output_size) {
89+
throw std::runtime_error("Result size mismatch: got " +
90+
std::to_string(result.size()) + ", expected " +
91+
std::to_string(batch_size * output_size));
92+
}
93+
94+
output[0] = make_tensor(result, {batch_size, output_size});
3595
break;
3696
}
3797
default: {
3898
throw std::runtime_error("No such type");
3999
}
40100
}
101+
102+
std::cout << " FCLayer completed successfully" << std::endl;
41103
}
42104

43105
} // namespace it_lab_ai

src/layers/ReduceLayer.cpp

Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -173,17 +173,51 @@ void ReduceLayer::run(const std::vector<Tensor>& input,
173173
throw std::runtime_error("ReduceLayer: Input tensors not 1");
174174
}
175175

176+
// DEBUG OUTPUT
177+
std::cout << "=== REDUCE LAYER DEBUG ===" << std::endl;
178+
std::cout << "Input shape: [";
179+
for (size_t i = 0; i < input[0].get_shape().dims(); ++i) {
180+
std::cout << input[0].get_shape()[i];
181+
if (i < input[0].get_shape().dims() - 1) std::cout << ", ";
182+
}
183+
std::cout << "]" << std::endl;
184+
std::cout << "Keep dims: " << keepdims_ << std::endl;
185+
std::cout << "Axes: [";
186+
for (size_t i = 0; i < axes_.size(); ++i) {
187+
std::cout << axes_[i];
188+
if (i < axes_.size() - 1) std::cout << ", ";
189+
}
190+
std::cout << "]" << std::endl;
191+
176192
if (input[0].get_shape().count() == 0) {
193+
std::cout << "Empty input tensor detected" << std::endl;
177194
output[0] = make_tensor<float>({0.0F}, {});
178195
return;
179196
}
180197

181198
// Just use the stored axes
182199
std::vector<int64_t> axes_indices = axes_;
183200
normalize_axes(input[0].get_shape(), axes_indices);
201+
202+
// Debug print after normalization
203+
std::cout << "Normalized axes: [";
204+
for (size_t i = 0; i < axes_indices.size(); ++i) {
205+
std::cout << axes_indices[i];
206+
if (i < axes_indices.size() - 1) std::cout << ", ";
207+
}
208+
std::cout << "]" << std::endl;
209+
184210
Shape output_shape =
185211
calculate_output_shape(input[0].get_shape(), axes_indices);
186212

213+
std::cout << "Output shape: [";
214+
for (size_t i = 0; i < output_shape.dims(); ++i) {
215+
std::cout << output_shape[i];
216+
if (i < output_shape.dims() - 1) std::cout << ", ";
217+
}
218+
std::cout << "]" << std::endl;
219+
std::cout << "==========================" << std::endl;
220+
187221
switch (input[0].get_type()) {
188222
case Type::kFloat:
189223
compute<float>(input[0], output_shape, axes_indices, output[0]);

0 commit comments

Comments
 (0)