// =========================================================================== // newnet — Neural Network from Scratch // // Compile: g++ -std=c++17 -O2 -pthread -o newnet main.cpp // Run: ./newnet // // This trains a small network on the XOR problem to prove: // 1. Forward pass works (matmul + bias + activation) // 2. Backward pass works (chain rule, gradient computation) // 3. Optimizer works (weights update, loss decreases) // 4. Non-linear problems are solvable (XOR needs hidden layers) // =========================================================================== #include "core/tensor.hpp" #include "core/backend.hpp" #include "layers/dense.hpp" #include "graph/graph.hpp" #include "graph/optimizer.hpp" #include "loss/loss.hpp" #include #include #include #include using namespace newnet; // --- Progress bar --- void print_progress(int epoch, int total_epochs, float loss, float elapsed_ms) { int bar_width = 30; float progress = (float)(epoch + 1) / total_epochs; int filled = (int)(bar_width * progress); std::cout << "\r ["; for (int i = 0; i < bar_width; i++) { if (i < filled) std::cout << "█"; else std::cout << "░"; } std::cout << "] " << std::setw(4) << epoch + 1 << "/" << total_epochs << " | loss: " << std::fixed << std::setprecision(6) << loss << " | " << std::fixed << std::setprecision(1) << elapsed_ms << "ms" << std::flush; } // --- Print predictions --- void print_predictions(Sequential& net, const Tensor& input, const Tensor& target) { Tensor output = net.forward(input); std::cout << "\n ┌──────────────┬────────────┬────────────┬─────────┐\n"; std::cout << " │ Input │ Predicted │ Target │ Correct │\n"; std::cout << " ├──────────────┼────────────┼────────────┼─────────┤\n"; int correct = 0; for (int i = 0; i < input.rows(); i++) { float pred = output(i, 0); float tgt = target(i, 0); bool is_correct = (pred > 0.5f) == (tgt > 0.5f); if (is_correct) correct++; std::cout << " │ [" << std::fixed << std::setprecision(0) << input(i, 0) << ", " << input(i, 1) << "]" << " │ " << std::fixed << std::setprecision(4) << pred << " │ " << std::fixed << std::setprecision(4) << tgt << " │ " << (is_correct ? "✓" : "✗") << " │\n"; } std::cout << " └──────────────┴────────────┴────────────┴─────────┘\n"; std::cout << " Accuracy: " << correct << "/" << input.rows() << " (" << (100.0f * correct / input.rows()) << "%)\n"; } int main() { std::cout << "\n"; std::cout << " ╔═══════════════════════════════════════════════╗\n"; std::cout << " ║ newnet v0.1 — Training Demo ║\n"; std::cout << " ║ Neural Network Engine from Scratch (C++) ║\n"; std::cout << " ╚═══════════════════════════════════════════════╝\n\n"; std::cout << " Hardware threads: " << std::thread::hardware_concurrency() << "\n"; std::cout << " Backend: CPU (multi-threaded)\n\n"; // ========================================================================= // Dataset: XOR // This is the simplest non-linear classification problem. // A single layer (linear model) CANNOT solve this. // You need at least one hidden layer — proving our NN works. // ========================================================================= std::cout << " ── Dataset: XOR ──────────────────────────────────\n\n"; Tensor input({4, 2}); input(0,0) = 0; input(0,1) = 0; // 0 XOR 0 = 0 input(1,0) = 0; input(1,1) = 1; // 0 XOR 1 = 1 input(2,0) = 1; input(2,1) = 0; // 1 XOR 0 = 1 input(3,0) = 1; input(3,1) = 1; // 1 XOR 1 = 0 Tensor target({4, 1}); target(0,0) = 0; target(1,0) = 1; target(2,0) = 1; target(3,0) = 0; std::cout << " Samples: 4 | Features: 2 | Output: 1 (binary)\n\n"; // ========================================================================= // Model: 2 → 16 (relu) → 8 (relu) → 1 (sigmoid) // ========================================================================= std::cout << " ── Model Architecture ────────────────────────────\n\n"; std::cout << " Input(2) → Dense(16, relu) → Dense(8, relu) → Dense(1, sigmoid)\n"; std::cout << " Parameters: " << (2*16+16) + (16*8+8) + (8*1+1) << " total\n\n"; Sequential net; net.add(new Dense(2, 16, "relu")); net.add(new Dense(16, 8, "relu")); net.add(new Dense(8, 1, "sigmoid")); // ========================================================================= // Training // ========================================================================= std::cout << " ── Training ──────────────────────────────────────\n\n"; std::cout << " Optimizer: Adam (lr=0.01)\n"; std::cout << " Loss: MSE\n"; std::cout << " Epochs: 2000\n\n"; Adam optimizer(0.01f); MSELoss loss_fn; int epochs = 2000; auto train_start = std::chrono::high_resolution_clock::now(); float final_loss = 0.0f; for (int epoch = 0; epoch < epochs; epoch++) { // 1. Zero gradients from previous iteration optimizer.zero_grad(net.parameters()); // 2. Forward pass Tensor output = net.forward(input); // 3. Compute loss float loss = loss_fn.forward(output, target); final_loss = loss; // 4. Backward pass — compute gradients via chain rule Tensor grad = loss_fn.backward(); net.backward(grad); // 5. Update weights optimizer.step(net.parameters()); // Progress bar update if (epoch % 50 == 0 || epoch == epochs - 1) { auto now = std::chrono::high_resolution_clock::now(); float elapsed = std::chrono::duration(now - train_start).count(); print_progress(epoch, epochs, loss, elapsed); } } auto train_end = std::chrono::high_resolution_clock::now(); float total_ms = std::chrono::duration(train_end - train_start).count(); std::cout << "\n\n Training complete in " << std::fixed << std::setprecision(1) << total_ms << "ms\n"; std::cout << " Final loss: " << std::fixed << std::setprecision(6) << final_loss << "\n\n"; // ========================================================================= // Results // ========================================================================= std::cout << " ── Predictions ───────────────────────────────────\n"; print_predictions(net, input, target); std::cout << "\n ── Summary ───────────────────────────────────────\n\n"; std::cout << " If predictions are close to targets (>0.5 = 1, <0.5 = 0),\n"; std::cout << " then forward pass, backward pass, and optimizer all work.\n"; std::cout << " XOR is non-linear — a single Dense layer cannot solve it.\n"; std::cout << " The hidden layers learned the non-linear decision boundary.\n\n"; return 0; }