JuanFMontesinos
diff --git a/‎.gitignore
Lines changed: 5 additions & 0 deletions b/‎.gitignore
Lines changed: 5 additions & 0 deletions
diff --git a/‎.vscode/c_cpp_properties.json
Lines changed: 19 additions & 0 deletions b/‎.vscode/c_cpp_properties.json
Lines changed: 19 additions & 0 deletions
diff --git a/‎.vscode/launch.json
Lines changed: 29 additions & 0 deletions b/‎.vscode/launch.json
Lines changed: 29 additions & 0 deletions
diff --git a/‎.vscode/settings.json
Lines changed: 83 additions & 0 deletions b/‎.vscode/settings.json
Lines changed: 83 additions & 0 deletions
diff --git a/‎.vscode/tasks.json
Lines changed: 23 additions & 0 deletions b/‎.vscode/tasks.json
Lines changed: 23 additions & 0 deletions
diff --git a/‎Makefile
Lines changed: 68 additions & 0 deletions b/‎Makefile
Lines changed: 68 additions & 0 deletions
diff --git a/‎README.md
Lines changed: 11 additions & 1 deletion b/‎README.md
Lines changed: 11 additions & 1 deletion
diff --git a/‎bindings.cpp
Lines changed: 106 additions & 0 deletions b/‎bindings.cpp
Lines changed: 106 additions & 0 deletions
diff --git a/‎include/activations.h
Lines changed: 17 additions & 0 deletions b/‎include/activations.h
Lines changed: 17 additions & 0 deletions
@@ -30,3 +30,8 @@
 *.exe
 *.out
 *.app
+
+*pyc
+build/
+*.o
+*.so
@@ -0,0 +1,19 @@
+{
+    "configurations": [
+        {
+            "name": "Linux",
+            "includePath": [
+                "${workspaceFolder}/**",
+                "/home/jmt/.pyenv/versions/3.11.2/lib/python3.11/site-packages/pybind11/include",
+                "/home/jmt/.pyenv/versions/3.11.2/include/python3.11"
+
+            ],
+            "defines": [],
+            "compilerPath": "/usr/bin/gcc",
+            "cStandard": "c17",
+            "cppStandard": "gnu++17",
+            "intelliSenseMode": "linux-gcc-x64"
+        }
+    ],
+    "version": 4
+}
@@ -0,0 +1,29 @@
+{
+    "version": "0.2.0",
+    "configurations": [
+        {
+            "name": "Launch C++ Program",
+            "type": "cppdbg",
+            "request": "launch",
+            "program": "${fileDirname}/${fileBasenameNoExtension}",
+            "args": [],
+            "stopAtEntry": false,
+            "cwd": "${workspaceFolder}",
+            "environment": [],
+            "externalConsole": false,
+            "MIMode": "gdb",
+            "setupCommands": [
+                {
+                    "description": "Enable pretty-printing for gdb",
+                    "text": "-enable-pretty-printing",
+                    "ignoreFailures": true
+                }
+            ],
+            "preLaunchTask": "compile",
+            "miDebuggerPath": "/usr/bin/gdb",
+            "logging": {
+                "engineLogging": true
+            }
+        }
+    ]
+}
@@ -0,0 +1,83 @@
+{
+    "files.associations": {
+        ".env*": "dotenv",
+        "*.tcc": "cpp",
+        "array": "cpp",
+        "atomic": "cpp",
+        "bit": "cpp",
+        "bitset": "cpp",
+        "cctype": "cpp",
+        "chrono": "cpp",
+        "clocale": "cpp",
+        "cmath": "cpp",
+        "codecvt": "cpp",
+        "compare": "cpp",
+        "concepts": "cpp",
+        "condition_variable": "cpp",
+        "cstdarg": "cpp",
+        "cstddef": "cpp",
+        "cstdint": "cpp",
+        "cstdio": "cpp",
+        "cstdlib": "cpp",
+        "cstring": "cpp",
+        "ctime": "cpp",
+        "cwchar": "cpp",
+        "cwctype": "cpp",
+        "deque": "cpp",
+        "string": "cpp",
+        "unordered_map": "cpp",
+        "vector": "cpp",
+        "exception": "cpp",
+        "algorithm": "cpp",
+        "functional": "cpp",
+        "iterator": "cpp",
+        "memory": "cpp",
+        "memory_resource": "cpp",
+        "numeric": "cpp",
+        "optional": "cpp",
+        "random": "cpp",
+        "ratio": "cpp",
+        "string_view": "cpp",
+        "system_error": "cpp",
+        "tuple": "cpp",
+        "type_traits": "cpp",
+        "utility": "cpp",
+        "fstream": "cpp",
+        "initializer_list": "cpp",
+        "iomanip": "cpp",
+        "iosfwd": "cpp",
+        "iostream": "cpp",
+        "istream": "cpp",
+        "limits": "cpp",
+        "mutex": "cpp",
+        "new": "cpp",
+        "numbers": "cpp",
+        "ostream": "cpp",
+        "semaphore": "cpp",
+        "sstream": "cpp",
+        "stdexcept": "cpp",
+        "stop_token": "cpp",
+        "streambuf": "cpp",
+        "thread": "cpp",
+        "typeinfo": "cpp",
+        "__nullptr": "cpp",
+        "complex": "cpp",
+        "forward_list": "cpp",
+        "list": "cpp",
+        "map": "cpp",
+        "set": "cpp",
+        "unordered_set": "cpp",
+        "cinttypes": "cpp",
+        "typeindex": "cpp",
+        "valarray": "cpp",
+        "variant": "cpp",
+        "__functional_base": "cpp",
+        "__hash_table": "cpp",
+        "__split_buffer": "cpp",
+        "__tree": "cpp",
+        "__memory": "cpp",
+        "filesystem": "cpp",
+        "queue": "cpp",
+        "stack": "cpp"
+    }
+}
@@ -0,0 +1,23 @@
+{
+    "version": "2.0.0",
+    "tasks": [
+        {
+            "label": "compile",
+            "type": "shell",
+            "command": "g++",
+            "args": [
+                "-ansi",
+                "-pedantic-errors",
+                "-std=c++11",
+                "${file}",
+                "-o",
+                "${fileDirname}/${fileBasenameNoExtension}"
+            ],
+            "group": {
+                "kind": "build",
+                "isDefault": true
+            },
+            "problemMatcher": ["$gcc"]
+        }
+    ]
+}
@@ -0,0 +1,68 @@
+# Builds the libmnist Python extension module with pybind11 and provides
+# helper targets to inspect the Python toolchain, clean the tree and fetch
+# the MNIST data files.
+
+# Compiler and flags
+CXX = g++
+PYTHON = $(shell which python3)
+# Include flags reported by the pybind11 package of the selected interpreter.
+PYBIND11_INCLUDE = $(shell $(PYTHON) -m pybind11 --includes)
+CXXFLAGS = -O3 -Wall -Wextra -std=c++17 -fPIC $(PYBIND11_INCLUDE) -I include
+# Platform/ABI specific suffix so that `import libmnist` finds the module.
+PYTHON_EXTENSION_SUFFIX = $(shell $(PYTHON) -c 'import sysconfig; print(sysconfig.get_config_var("EXT_SUFFIX"))')
+
+# Target output
+TARGET = libmnist$(PYTHON_EXTENSION_SUFFIX)
+BUILD_DIR = build
+
+# Source files
+SRC = bindings.cpp \
+      src/activations.cpp \
+      src/cross_entropy.cpp \
+      src/dataloader.cpp \
+      src/functionals.cpp \
+      src/linear.cpp
+
+# Object files (mirrors the source layout below $(BUILD_DIR))
+OBJ = $(patsubst %.cpp,$(BUILD_DIR)/%.o,$(SRC))
+
+# These targets name actions, not files; without .PHONY a file or directory
+# called e.g. "clean" or "python" would make them appear up to date.
+.PHONY: all python clean download_mnist
+
+# Default target
+all: $(TARGET)
+
+# Create output directories if they don't exist
+$(BUILD_DIR):
+	mkdir -p $(BUILD_DIR)
+
+$(BUILD_DIR)/src:
+	mkdir -p $(BUILD_DIR)/src
+
+# Link the shared library
+$(TARGET): $(OBJ)
+	$(CXX) -shared -o $@ $(OBJ)
+
+# Compile object files for root-level source files
+# (the directory is an order-only prerequisite: it must exist, but its
+# timestamp must not trigger rebuilds)
+$(BUILD_DIR)/%.o: %.cpp | $(BUILD_DIR)
+	$(CXX) $(CXXFLAGS) -c $< -o $@
+
+# Compile object files for src/ source files
+$(BUILD_DIR)/src/%.o: src/%.cpp | $(BUILD_DIR)/src
+	$(CXX) $(CXXFLAGS) -c $< -o $@
+
+# Show Python interpreter and include paths
+python:
+	@echo $(PYTHON)
+	@echo $(PYBIND11_INCLUDE)
+	@echo $(PYTHON_EXTENSION_SUFFIX)
+
+# Clean up build files and reset results/ to an empty directory
+clean:
+	rm -f $(TARGET)
+	rm -rf $(BUILD_DIR)
+	@rm -rf results/
+	@mkdir results/
+
+# Re-download the MNIST archives into a fresh data/ directory and unpack them
+download_mnist:
+	@rm -rf data/
+	@mkdir data/
+	@wget -P data/ https://raw.githubusercontent.com/fgnt/mnist/master/train-images-idx3-ubyte.gz
+	@wget -P data/ https://raw.githubusercontent.com/fgnt/mnist/master/train-labels-idx1-ubyte.gz
+	@wget -P data/ https://raw.githubusercontent.com/fgnt/mnist/master/t10k-images-idx3-ubyte.gz
+	@wget -P data/ https://raw.githubusercontent.com/fgnt/mnist/master/t10k-labels-idx1-ubyte.gz
+	@gunzip data/*.gz
@@ -1,2 +1,12 @@
 # MNIST-CPP-and-python
-Beginner-friendly repo on how to Code a Simple Neural network with backprop in C++, bind it to python and train MNIST!
+Beginner-friendly repo on how to code a simple neural network with backprop in C++, bind it to Python, and train it on MNIST!  
+
+## Summary  
+ReLu and Linear layers are implemented in C++ following PyTorch's naming convention. Some functionals, such as softmax, are also implemented. The code is bound to Python using pybind11. The model is trained on the MNIST dataset using a Python script.
+
+## How to run  
+1. Download the data via `make download_mnist`.  
+2. Install the Python dependencies via `pip install -r requirements.txt`.
+3. Compile the C++ code via `make`.  
+4. Run the Python script via `python train.py`.
+5. (Optional) Compare against PyTorch training via `python train_pytorch.py`.
@@ -0,0 +1,106 @@
+// bindings.cpp
+#include <pybind11/pybind11.h>
+#include <pybind11/stl.h>
+#include <pybind11/numpy.h>
+
+#include "include/modules.h"
+#include "include/activations.h"
+#include "include/functionals.h"
+#include "include/cross_entropy.h"
+#include "include/dataloader.h"
+
+namespace py = pybind11;
+
+/// Entry point of the `libmnist` Python extension module.
+///
+/// Registers the ReLu, LinearLayer, SoftmaxndCrossEntropy and DataLoader
+/// classes plus a `functionals` submodule. Sequence results coming back from
+/// the C++ layer are handed to Python as 1-D float NumPy arrays; the
+/// DataLoader results are copied element by element into new arrays.
+PYBIND11_MODULE(libmnist, m) {
+    // Builds a 1-D float NumPy array from a contiguous container. No base
+    // handle is passed to array_t, so pybind11 copies the buffer instead of
+    // referencing the container's storage.
+    auto to_numpy = [](const auto& values) {
+        return py::array_t<float>(values.size(), values.data());
+    };
+
+    // ReLu bindings
+    py::class_<ReLu> relu(m, "ReLu");
+    relu.def(py::init<>());
+    relu.def("forward",
+             [to_numpy](ReLu& self, const std::vector<float>& input) {
+                 return to_numpy(self.forward(input));
+             },
+             "Apply ReLu activation");
+    relu.def("backward",
+             [to_numpy](ReLu& self, const std::vector<float>& grad_output) {
+                 return to_numpy(self.backward(grad_output));
+             },
+             "Compute the backward pass of ReLu");
+    relu.def("update", &ReLu::update, py::arg("lr"), "Update the parameters of ReLu");
+
+    // LinearLayer bindings; parameters and gradients are exposed as
+    // read/write attributes.
+    py::class_<LinearLayer> linear(m, "LinearLayer");
+    linear.def(py::init<int, int>());
+    linear.def("forward",
+               [to_numpy](LinearLayer& self, const std::vector<float>& input) {
+                   return to_numpy(self.forward(input));
+               },
+               "Perform forward pass with Linear Layer");
+    linear.def("backward",
+               [to_numpy](LinearLayer& self, const std::vector<float>& grad_output) {
+                   return to_numpy(self.backward(grad_output));
+               },
+               "Compute the backward pass of Linear Layer");
+    linear.def("update", &LinearLayer::update, py::arg("lr"), "Update the parameters of LinearLayer");
+    linear.def_readwrite("weights", &LinearLayer::weights);
+    linear.def_readwrite("bias", &LinearLayer::bias);
+    linear.def_readwrite("grad_weights", &LinearLayer::grad_weights);
+    linear.def_readwrite("grad_bias", &LinearLayer::grad_bias);
+
+    // SoftmaxndCrossEntropy bindings; forward() returns whatever the C++
+    // method returns, backward() is converted to a NumPy array.
+    py::class_<SoftmaxndCrossEntropy> loss(m, "SoftmaxndCrossEntropy");
+    loss.def(py::init<int>());
+    loss.def("forward",
+             [](SoftmaxndCrossEntropy& self, const std::vector<float>& input, int class_label) {
+                 return self.forward(input, class_label);
+             },
+             "Compute the forward pass of Softmax and Cross Entropy");
+    loss.def("backward",
+             [to_numpy](SoftmaxndCrossEntropy& self) {
+                 return to_numpy(self.backward());
+             },
+             "Compute the backward pass of Softmax and Cross Entropy");
+
+    // DataLoader bindings: only static loaders, no constructor is exposed.
+    py::class_<DataLoader> data_loader(m, "DataLoader");
+    data_loader.def_static("load_images", [](const std::string& filepath) {
+        auto images = DataLoader::load_images(filepath);
+        py::ssize_t rows = static_cast<py::ssize_t>(images.size());
+        if (rows == 0) {
+            throw std::runtime_error("No images loaded");
+        }
+        // The first image fixes the row width; every other image must match.
+        py::ssize_t cols = static_cast<py::ssize_t>(images[0].size());
+
+        // NumPy array of shape (rows, cols), filled through an unchecked
+        // (no bounds checking) mutable view.
+        py::array_t<float> pixels({rows, cols});
+        auto view = pixels.mutable_unchecked<2>();
+
+        for (py::ssize_t r = 0; r < rows; ++r) {
+            if (static_cast<py::ssize_t>(images[r].size()) != cols) {
+                throw std::runtime_error("Inconsistent image sizes");
+            }
+            for (py::ssize_t c = 0; c < cols; ++c) {
+                view(r, c) = images[r][c];
+            }
+        }
+        return pixels;
+    }, "Load images from file");
+    data_loader.def_static("load_labels", [](const std::string& filepath) {
+        auto labels = DataLoader::load_labels(filepath);
+        py::ssize_t count = static_cast<py::ssize_t>(labels.size());
+
+        py::array_t<int> encoded({count});
+        auto view = encoded.mutable_unchecked<1>();
+        for (py::ssize_t k = 0; k < count; ++k) {
+            view(k) = labels[k];
+        }
+        return encoded;
+    }, "Load labels from file");
+
+    // `functionals` submodule: free functions from the functionals namespace.
+    py::module_ functional_module = m.def_submodule("functionals", "Submodule for functional operations");
+    functional_module.def("softmax",
+                          [to_numpy](const std::vector<float>& input) {
+                              return to_numpy(functionals::softmax(input));
+                          },
+                          "Compute the softmax of a 1D vector");
+    functional_module.def("flatten2d",
+                          [to_numpy](const std::vector<std::vector<float>>& input) {
+                              return to_numpy(functionals::flatten2d(input));
+                          },
+                          "Flatten a 2D vector into a 1D vector");
+}
+
@@ -0,0 +1,17 @@
+#ifndef ACTIVATIONS
+#define ACTIVATIONS
+
+#include <vector>
+#include "modules.h"
+
+/// ReLu activation layer implementing the Module interface.
+///
+/// Only declarations live in this header; the member definitions are in a
+/// separate translation unit.
+class ReLu : public Module {
+public:
+    /// Forward pass: takes the layer input and returns the layer output.
+    std::vector<float> forward(const std::vector<float>& input) override;
+
+    /// Backward pass: takes the gradient w.r.t. the output and returns the
+    /// gradient to propagate to the previous layer.
+    std::vector<float> backward(const std::vector<float>& grad_output) override;
+
+    /// Parameter-update hook required by Module; `lr` is the learning rate.
+    void update(float lr) override;
+
+private:
+    // NOTE(review): presumably one flag per input element marking which
+    // entries forward() clamped, for use as a mask in backward() -- confirm
+    // against the implementation.
+    std::vector<bool> zeroed;
+};
+
+#endif
-Original file line number
+Diff line change
 *.exe
 *.out
 *.app
++
 +*pyc
 +build/
 +*.o
 +*.so