Skip to content

Commit eb0560c

Browse files
committed
Added unit tests, refactored cmake
1 parent 5055455 commit eb0560c

15 files changed

Lines changed: 326 additions & 61 deletions

src/backend/computational_graph/add_node.h

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -16,9 +16,7 @@
1616
namespace graph {
1717
class AddNode final : public GraphNode {
1818
public:
19-
AddNode(Tensor* t1, Tensor* t2) {
20-
parents = {t1, t2};
21-
}
19+
explicit AddNode(Tensor* t1, Tensor* t2) : GraphNode({t1, t2}) {}
2220

2321
AddNode(const AddNode& other) = delete;
2422
AddNode& operator=(const AddNode& other) = delete;

src/backend/computational_graph/elementwise_mul_node.h

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -16,9 +16,7 @@
1616
namespace graph {
1717
class ElementwiseMulNode final : public GraphNode {
1818
public:
19-
ElementwiseMulNode(Tensor* t1, Tensor* t2) {
20-
parents = {t1, t2};
21-
}
19+
explicit ElementwiseMulNode(Tensor* t1, Tensor* t2) : GraphNode({t1, t2}) {}
2220

2321
ElementwiseMulNode(const ElementwiseMulNode& other) = delete;
2422
ElementwiseMulNode& operator=(const ElementwiseMulNode& other) = delete;

src/backend/computational_graph/graph_node.h

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -16,11 +16,14 @@
1616
#include <vector>
1717
#include <memory>
1818

19+
#include <utility>
20+
1921
namespace graph {
2022
class GraphNode {
2123
protected:
2224
std::vector<Tensor*> parents;
23-
25+
explicit GraphNode(std::vector<Tensor*> parents) : parents{std::move(parents)}{}
26+
2427
public:
2528
virtual std::vector<std::shared_ptr<Tensor>> backward(const Tensor& upstreamGrad) = 0;
2629

src/backend/computational_graph/matmul_node.h

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -18,9 +18,7 @@
1818
namespace graph {
1919
class MatMulNode final : public GraphNode {
2020
public:
21-
MatMulNode(Tensor* t1, Tensor* t2) {
22-
parents = {t1, t2};
23-
}
21+
explicit MatMulNode(Tensor* t1, Tensor* t2): GraphNode({t1, t2}) {}
2422

2523
MatMulNode(const MatMulNode& other) = delete;
2624
MatMulNode& operator=(const MatMulNode& other) = delete;

src/backend/computational_graph/relu_node.cpp

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,9 +17,12 @@ using namespace std;
1717
using namespace graph;
1818

1919
/**
 * @brief Backward pass of ReLU.
 *
 * ReLU'(x) = 1 for x > 0 and 0 otherwise, so the upstream gradient must be
 * masked by the sign of the FORWARD input (parents[0]) — not thresholded by
 * its own sign. The previous implementation computed relu(upstreamGrad),
 * which zeroes legitimate negative gradients flowing through positive inputs.
 *
 * @param upstreamGrad gradient arriving from the downstream node.
 * @return one gradient tensor (w.r.t. the single parent input).
 */
vector<shared_ptr<Tensor>> ReLuNode::backward(const Tensor& upstreamGrad) {
    constexpr ftype zero = 0.0;

    // Result does not require grad: it is itself a gradient.
    auto res = make_shared<Tensor>(upstreamGrad.getDims().toVector(), upstreamGrad.getDevice(), false);
    for(tensorSize_t i=0; i<upstreamGrad.getSize(); i++){
        // Pass the upstream gradient through where the forward input was
        // positive; kill it elsewhere.
        res->set(parents[0]->get(i) > zero ? upstreamGrad.get(i) : zero, i);
    }
    return {std::move(res)};
}

src/backend/computational_graph/relu_node.h

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -18,9 +18,7 @@
1818
namespace graph {
1919
class ReLuNode final : public GraphNode {
2020
public:
21-
ReLuNode(Tensor* t) {
22-
parents = {t};
23-
}
21+
explicit ReLuNode(Tensor* t): GraphNode({t}) {}
2422

2523
ReLuNode(const ReLuNode& other) = delete;
2624
ReLuNode& operator=(const ReLuNode& other) = delete;
Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
/**
2+
* @file scalar_op_nodes.cpp
3+
* @author Robert Baumgartner (r.baumgartner-1@tudelft.nl)
4+
* @brief
5+
* @version 0.1
6+
* @date 2026-02-17
7+
*
8+
* @copyright Copyright (c) 2026
9+
*
10+
*/
11+
12+
#include "scalar_op_nodes.h"
13+
14+
#include <utility>
15+
16+
using namespace std;
17+
using namespace graph;
18+
19+
/**
 * @brief Backward pass of scalar addition/subtraction.
 *
 * d(x + c)/dx = 1, so the upstream gradient is forwarded unchanged;
 * only a deep copy is taken so the caller owns an independent tensor.
 */
vector<shared_ptr<Tensor>> graph::ScalarAddNode::backward(const Tensor& upstreamGrad) {
    auto passthrough = make_shared<Tensor>(upstreamGrad.createDeepCopy());
    return {std::move(passthrough)};
}
22+
23+
/**
 * @brief Backward pass of scalar multiplication.
 *
 * d(c * x)/dx = c, so every entry of the upstream gradient is scaled
 * by the stored factor.
 */
vector<shared_ptr<Tensor>> graph::ScalarMulNode::backward(const Tensor& upstreamGrad) {
    auto grad = make_shared<Tensor>(upstreamGrad.createDeepCopy());
    const tensorSize_t n = grad->getSize();
    for(tensorSize_t idx = 0; idx < n; ++idx){
        grad->set(grad->get(idx) * factor, idx);
    }
    return {std::move(grad)};
}
Lines changed: 49 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,49 @@
1+
/**
2+
* @file scalar_op_nodes.h
3+
* @author Robert Baumgartner (r.baumgartner-1@tudelft.nl)
4+
* @brief
5+
* @version 0.1
6+
* @date 2026-02-17
7+
*
8+
* @copyright Copyright (c) 2026
9+
*
10+
*/
11+
12+
#pragma once
13+
14+
#include "graph_node.h"
15+
16+
namespace graph {
17+
// Graph node recording a tensor-plus-scalar (also used for tensor-minus-scalar)
// operation. The scalar offset does not influence the gradient, so backward()
// simply forwards the upstream gradient.
class ScalarAddNode final : public GraphNode {
public:
    // Stores a non-owning pointer to the operand tensor via the GraphNode
    // parent list; the caller must keep `t` alive for the node's lifetime.
    explicit ScalarAddNode(Tensor* t) : GraphNode({t}) {}

    // Nodes are identity-carrying graph entities: copying is forbidden.
    ScalarAddNode(const ScalarAddNode& other) = delete;
    ScalarAddNode& operator=(const ScalarAddNode& other) = delete;

    // Moves are allowed (transfers the parent-pointer list).
    ScalarAddNode(ScalarAddNode&& other) = default;
    ScalarAddNode& operator=(ScalarAddNode&& other) = default;

    // NOTE(review): assumes GraphNode declares a virtual destructor so that
    // deletion through a GraphNode* is well-defined — confirm in graph_node.h.
    ~ScalarAddNode() noexcept = default;

    // Returns the upstream gradient unchanged (deep-copied); see scalar_op_nodes.cpp.
    std::vector<std::shared_ptr<Tensor>> backward(const Tensor& upstreamGrad) override;
};
31+
32+
class ScalarMulNode final : public GraphNode {
33+
private:
34+
const ftype factor;
35+
36+
public:
37+
explicit ScalarMulNode(Tensor* t, const ftype factor) : GraphNode({t}), factor{factor} {}
38+
39+
ScalarMulNode(const ScalarMulNode& other) = delete;
40+
ScalarMulNode& operator=(const ScalarMulNode& other) = delete;
41+
42+
ScalarMulNode(ScalarMulNode&& other) = default;
43+
ScalarMulNode& operator=(ScalarMulNode&& other) = default;
44+
45+
~ScalarMulNode() noexcept = default;
46+
47+
std::vector<std::shared_ptr<Tensor>> backward(const Tensor& upstreamGrad) override;
48+
};
49+
}

src/backend/data_modeling/tensor.cpp

Lines changed: 65 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,7 @@
1515
#include "computational_graph/add_node.h"
1616
#include "computational_graph/matmul_node.h"
1717
#include "computational_graph/elementwise_mul_node.h"
18+
#include "computational_graph/scalar_op_nodes.h"
1819
#include "computational_graph/topological_sort.h"
1920

2021
#include <utility>
@@ -148,6 +149,36 @@ ftype Tensor::tensorValues_t::operator[](const tensorSize_t idx) const {
148149
return values[idx];
149150
}
150151

152+
/**
 * @brief Write value `v` at flat index `idx` into the backing store.
 *
 * @throws std::out_of_range if idx is outside the tensor's flat size.
 * @throws std::runtime_error for the not-yet-implemented CUDA backend.
 */
void Tensor::tensorValues_t::set(ftype v, tensorSize_t idx) {
    if(idx >= size)
        throw std::out_of_range("Out of range for tensor");

    switch(device){
        case Device::CPU:
            values[idx] = v;
            return;
        case Device::CUDA:
            // Standard throw instead of libstdc++-internal __throw_runtime_error
            // (not portable to libc++/MSVC); observable behavior is identical.
            throw std::runtime_error("Not implemented for CUDA yet");
    }

    // Defensive: reached only if `device` holds a value outside the enum.
    throw std::runtime_error("Should never reach here.");
}
166+
167+
/**
 * @brief Read the value at flat index `idx` from the backing store.
 *
 * @return the stored value (CPU backend).
 * @throws std::out_of_range if idx is outside the tensor's flat size.
 * @throws std::runtime_error for the not-yet-implemented CUDA backend.
 */
ftype Tensor::tensorValues_t::get(tensorSize_t idx) {
    if(idx >= size)
        throw std::out_of_range("Out of range for tensor");

    switch(device){
        case Device::CPU:
            return values[idx];
        case Device::CUDA:
            // Standard throw instead of libstdc++-internal __throw_runtime_error
            // (not portable to libc++/MSVC); observable behavior is identical.
            throw std::runtime_error("Not implemented for CUDA yet");
    }

    // Defensive: reached only if `device` holds a value outside the enum.
    throw std::runtime_error("Should never reach here.");
    return 0; // suppress warnings
}
181+
151182
/********************************************************************
152183
*************************** Tensor **********************************
153184
********************************************************************/
@@ -445,14 +476,28 @@ Tensor Tensor::operator*(ftype scalar) const {
445476
for (tensorSize_t i = 0; i < values->getSize(); ++i) {
446477
(*res.values)[i] = (*values)[i] * scalar;
447478
}
479+
480+
if(requiresGrad){
481+
res.cgNode = std::make_shared<graph::ScalarMulNode>(const_cast<Tensor*>(this), scalar);
482+
}
483+
448484
return res;
449485
}
450486

451487
/**
 * @brief Element-wise division of the tensor by a scalar.
 *
 * @param scalar divisor; must not be exactly zero.
 * @return new tensor with every element divided by `scalar`.
 * @throws std::runtime_error on division by (exactly) zero.
 */
Tensor Tensor::operator/(ftype scalar) const {
    // Fail fast rather than silently producing inf/NaN everywhere.
    if(scalar==0.0){
        throw std::runtime_error("Cannot divide by zero.");
    }

    Tensor res(dims, values->getDevice(), requiresGrad);
    for (tensorSize_t i = 0; i < values->getSize(); ++i) {
        (*res.values)[i] = (*values)[i] / scalar;
    }

    if(requiresGrad){
        // d(x / c)/dx = 1/c: record division as multiplication by the reciprocal.
        // const_cast: graph nodes hold non-owning, non-const parent pointers —
        // NOTE(review): safe only as long as autograd is never run on a tensor
        // that was originally declared const; confirm project convention.
        res.cgNode = std::make_shared<graph::ScalarMulNode>(const_cast<Tensor*>(this), static_cast<ftype>(1.0)/scalar);
    }

    return res;
}
458503

@@ -461,6 +506,11 @@ Tensor Tensor::operator+(ftype scalar) const {
461506
for (tensorSize_t i = 0; i < values->getSize(); ++i) {
462507
(*res.values)[i] = (*values)[i] + scalar;
463508
}
509+
510+
if(requiresGrad){
511+
res.cgNode = std::make_shared<graph::ScalarAddNode>(const_cast<Tensor*>(this));
512+
}
513+
464514
return res;
465515
}
466516

@@ -469,6 +519,11 @@ Tensor Tensor::operator-(ftype scalar) const {
469519
for (tensorSize_t i = 0; i < values->getSize(); ++i) {
470520
(*res.values)[i] = (*values)[i] - scalar;
471521
}
522+
523+
if(requiresGrad){
524+
res.cgNode = std::make_shared<graph::ScalarAddNode>(const_cast<Tensor*>(this));
525+
}
526+
472527
return res;
473528
}
474529

@@ -521,6 +576,16 @@ void Tensor::backward() {
521576
}
522577
}
523578

579+
/**
580+
* @brief Get gradients
581+
*/
582+
const shared_ptr<Tensor>& Tensor::getGrads() const {
583+
if(!grads){
584+
__throw_runtime_error("Tensor has no gradients.");
585+
}
586+
return grads;
587+
}
588+
524589
/**
525590
* @brief Sometimes we do accept negative dim-values. In accordance with e.g.
526591
* NumPy we map from the end to the beginning in that case.

src/backend/data_modeling/tensor.h

Lines changed: 16 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -82,6 +82,9 @@ class Tensor final {
8282
ftype& operator[](const tensorSize_t idx);
8383
ftype operator[](const tensorSize_t idx) const;
8484

85+
void set(ftype v, tensorSize_t idx);
86+
ftype get(tensorSize_t idx);
87+
8588
tensorSize_t getSize() const noexcept;
8689

8790
// needed for gradient descent
@@ -151,6 +154,16 @@ class Tensor final {
151154
values->resize(this->dims.getSize());
152155
}
153156

157+
// Convenience overload: build a tensor with initial values on the default device.
// NOTE(review): takes `initValues` by rvalue reference, but the delegated-to
// constructor copies element-wise — the move is forwarded, never exploited.
explicit Tensor(const std::vector<tensorDim_t>& dims, std::vector<ftype>&& initValues, bool requiresGrad=true) :
    Tensor{dims, std::move(initValues), Tensor::getDefaultDevice(), requiresGrad} {}
159+
160+
// Build a tensor of shape `dims` on device `d` and copy `initValues` into it
// element by element.
// NOTE(review): despite the && parameter nothing is actually moved — values
// are copied one at a time through set(); consider const& (or a real move).
// NOTE(review): if initValues is shorter than the tensor's flat size, the
// remaining elements keep their default contents; if it is longer, set()
// throws std::out_of_range at the first excess index — confirm this is the
// intended contract.
explicit Tensor(const std::vector<tensorDim_t>& dims, std::vector<ftype>&& initValues, Device d, bool requiresGrad=true) :
    Tensor{dims, d, requiresGrad} {
    for(tensorSize_t i=0; i<initValues.size(); i++){
        values->set(initValues[i], i);
    }
}
166+
154167
/**
155168
* Tensors can become very large. Deleting those two
156169
* helps us to not accidentally copy something we do not
@@ -198,11 +211,11 @@ class Tensor final {
198211
friend Tensor operator*(ftype scalar, const Tensor& tensor);
199212
friend Tensor operator+(ftype scalar, const Tensor& tensor);
200213

201-
ftype& operator[](const tensorSize_t idx);
202-
ftype operator[](const tensorSize_t idx) const;
203-
204214
void backward();
205215

216+
bool hasGrads() const noexcept { return grads!=nullptr; }
217+
const std::shared_ptr<Tensor>& getGrads() const;
218+
206219
void transposeThis() noexcept;
207220
void transposeThis(int dim1, int dim2) noexcept;
208221

0 commit comments

Comments
 (0)