From 8963ea41bae327b786fbccb4c3735bf370a96f49 Mon Sep 17 00:00:00 2001
From: Brett Laptop <tri11paragon@tpgc.me>
Date: Wed, 8 Jan 2025 17:05:06 -0500
Subject: [PATCH] first test

---
 graph.py      |  54 ++++++++++++++++++++++
 src/MNIST.cpp | 124 ++++++++++++++++++++++++++++++++++++++++----------
 2 files changed, 155 insertions(+), 23 deletions(-)
 create mode 100644 graph.py
diff --git a/graph.py b/graph.py
new file mode 100644
index 0000000..6421a2d
--- /dev/null
+++ b/graph.py
@@ -0,0 +1,54 @@
+import matplotlib.pyplot as plt
+import pandas as pd
+import sys
+
+def plot_stacked_graph(title, output, csv_file1, csv_file2, position, position2):
+    # Read CSV files
+    data1 = pd.read_csv(csv_file1, header=0)
+    data2 = pd.read_csv(csv_file2, header=0)
+    
+    # Extract column titles
+    x1_label, y1_label = data1.columns[0], data1.columns[1]
+    x2_label, y2_label = data2.columns[0], data2.columns[1]
+
+    # Extract data
+    x1, y1 = data1[x1_label], data1[y1_label]
+    x2, y2 = data2[x2_label], data2[y2_label]
+
+    # Create the plot
+    fig, ax = plt.subplots()
+
+    ax.plot(x1, y1, label=f"{csv_file1}")
+    ax.plot(x2, y2, label=f"{csv_file2}")
+
+    ax.fill_between(x1, y1, alpha=0.5)
+    ax.fill_between(x2, y2, alpha=0.5)
+    
+    if position < 2 ** 32:
+        ax.axvline(x=position, color='red', linestyle='--')
+        ax.text(position, ax.get_ylim()[1] * 0.95, f"Feed-forward average # of epochs", color='red', fontsize=10, ha='right', va='top', backgroundcolor='white')
+        
+    if position2 < 2 ** 32:
+        ax.axvline(x=position2, color='red', linestyle='--')
+        ax.text(position2, ax.get_ylim()[1] * 0.95, f"Deep learning average # of epochs", color='red', fontsize=10, ha='right', va='top', backgroundcolor='white')
+
+    ax.set_xlabel(x1_label)
+    ax.set_ylabel(y1_label)
+    ax.legend()
+    ax.set_title(title)
+
+    plt.savefig(output)
+
+if __name__ == "__main__":
+    if len(sys.argv) != 5:
+        print("Usage: python script.py <title> <output_file> <csv_file1> <csv_file2> <position_feed_forward> <position_deep>")
+        sys.exit(1)
+
+    csv_file1 = sys.argv[3]
+    csv_file2 = sys.argv[4]
+    title = sys.argv[1]
+    output = sys.argv[2]
+    position = sys.argv[5]
+    position2 = sys.argv[6]
+
+    plot_stacked_graph(title, output, csv_file1, csv_file2, position, position2)
\ No newline at end of file
diff --git a/src/MNIST.cpp b/src/MNIST.cpp
index b981430..3813212 100644
--- a/src/MNIST.cpp
+++ b/src/MNIST.cpp
@@ -20,7 +20,8 @@
 #include <blt/std/memory.h>
 #include <blt/std/memory_util.h>
 #include <variant>
-#include <bits/fs_ops.h>
+#include <filesystem>
+#include <iomanip>
 #include <blt/iterator/iterator.h>
 #include <blt/parse/argparse.h>
 #include <blt/std/time.h>
@@ -29,6 +30,18 @@
 
 namespace fp
 {
+    std::string binary_directory;
+    std::string python_dual_stacked_graph_program;
+
+    void run_python_line_graph(const std::string& title, const std::string& output_file, const std::string& csv1, const std::string& csv2,
+                               const blt::size_t pos_forward, const blt::size_t pos_deep)
+    {
+        const auto command = "python3 " + python_dual_stacked_graph_program + " '" + title + "' '" + output_file + "' '" + csv1 + "' '" + csv2 + "' "
+            + std::to_string(pos_forward) + " " + std::to_string(pos_deep);
+        BLT_TRACE("Running %s", command.c_str());
+        std::system(command.c_str());
+    }
+
     class idx_file_t
     {
         template <typename T>
@@ -248,7 +261,7 @@ namespace fp
 
     struct epoch_stats_t
     {
-        batch_stats_t test_results {};
+        batch_stats_t test_results{};
         double average_loss = 0;
         double learn_rate = 0;
 
@@ -321,7 +334,7 @@ namespace fp
             return *this;
         }
 
-        blt::size_t average_size() const
+        [[nodiscard]] blt::size_t average_size() const
         {
             blt::size_t acc = 0;
             for (const auto& [epoch_stats] : run_stats)
@@ -329,7 +342,7 @@ namespace fp
             return acc;
         }
 
-        network_stats_t average_stats() const
+        [[nodiscard]] network_stats_t average_stats() const
         {
             network_stats_t stats;
             for (const auto& [epoch_stats] : run_stats)
@@ -380,8 +393,8 @@ namespace fp
     template <typename NetworkType>
     batch_stats_t test_network(NetworkType& network)
     {
-        const idx_file_t test_images{"../problems/mnist/t10k-images.idx3-ubyte"};
-        const idx_file_t test_labels{"../problems/mnist/t10k-labels.idx1-ubyte"};
+        const idx_file_t test_images{binary_directory + "../problems/mnist/t10k-images.idx3-ubyte"};
+        const idx_file_t test_labels{binary_directory + "../problems/mnist/t10k-labels.idx1-ubyte"};
 
         const image_t test_image{test_images, test_labels};
 
@@ -398,8 +411,8 @@ namespace fp
     template <typename NetworkType>
     network_stats_t train_network(const std::string& ident, NetworkType& network)
     {
-        const idx_file_t train_images{"../problems/mnist/train-images.idx3-ubyte"};
-        const idx_file_t train_labels{"../problems/mnist/train-labels.idx1-ubyte"};
+        const idx_file_t train_images{binary_directory + "../problems/mnist/train-images.idx3-ubyte"};
+        const idx_file_t train_labels{binary_directory + "../problems/mnist/train-labels.idx1-ubyte"};
 
         const image_t train_image{train_images, train_labels};
 
@@ -480,8 +493,9 @@ namespace fp
         return network;
     }
 
-    template<typename NetworkType>
-    void run_network_tests(std::string path, const std::string& ident, const blt::i32 runs, const bool restore)
+    template <typename NetworkType>
+    std::pair<network_average_stats_t, batch_stats_t> run_network_tests(std::string path, const std::string& ident, const blt::i32 runs,
+                                                                        const bool restore)
     {
         path += ("/" + ident + "/");
         std::filesystem::create_directories(path);
@@ -495,16 +509,28 @@ namespace fp
             auto local_ident = ident + std::to_string(i);
             NetworkType network{};
             if (restore)
-                network = load_network<NetworkType>(local_ident);
+                try
+                {
+                    network = load_network<NetworkType>(local_ident);
+                }
+                catch (dlib::serialization_error&)
+                {
+                    stats += train_network(local_ident, network);
+                }
             else
                 stats += train_network(local_ident, network);
             test_stats.push_back(test_network(network));
         }
 
+        batch_stats_t average;
+        for (const auto& v : test_stats)
+            average += v;
+        average /= runs;
 
+        return {stats, average};
     }
 
-    void run_deep_learning_tests(const std::string& path, const blt::i32 runs, const bool restore)
+    auto run_deep_learning_tests(const std::string& path, const blt::i32 runs, const bool restore)
     {
         using namespace dlib;
         using net_type_dl = loss_multiclass_log<
@@ -514,30 +540,41 @@ namespace fp
                                max_pool<2, 2, 2, 2, relu<con<16, 5, 5, 1, 1,
                                                              max_pool<2, 2, 2, 2, relu<con<6, 5, 5, 1, 1,
                                                                                            input<matrix<blt::u8>>>>>>>>>>>>>>;
-        run_network_tests<net_type_dl>(path, "deep_learning", runs, restore);
+        return run_network_tests<net_type_dl>(path, "deep_learning", runs, restore);
     }
 
-    void run_feed_forward_tests(const std::string& path, const blt::i32 runs, const bool restore)
+    auto run_feed_forward_tests(const std::string& path, const blt::i32 runs, const bool restore)
     {
         using namespace dlib;
 
         using net_type_ff = loss_multiclass_log<
             fc<10,
                relu<fc<84,
-                      relu<fc<120,
-                             input<matrix<blt::u8>>>>>>>>;
+                       relu<fc<120,
+                               input<matrix<blt::u8>>>>>>>>;
 
-        run_network_tests<net_type_ff>(path, "feed_forward", runs, restore);
+        return run_network_tests<net_type_ff>(path, "feed_forward", runs, restore);
     }
 
     void run_mnist(const int argc, const char** argv)
     {
+        binary_directory = std::filesystem::current_path();
+        if (!blt::string::ends_with(binary_directory, '/'))
+            binary_directory += '/';
+        python_dual_stacked_graph_program = binary_directory + "../graph.py";
+        BLT_TRACE(binary_directory);
+        BLT_TRACE(python_dual_stacked_graph_program);
+
         using namespace dlib;
 
         blt::arg_parse parser{};
         parser.addArgument(
-            blt::arg_builder{"-r", "--restore"}.setAction(blt::arg_action_t::STORE_TRUE).setDefault(false).setHelp("Restores from last save").build());
+            blt::arg_builder{"-r", "--restore"}.setAction(blt::arg_action_t::STORE_TRUE).setDefault(false).setHelp(
+                "Restores from last save").build());
         parser.addArgument(blt::arg_builder{"-t", "--runs"}.setHelp("Number of runs to perform [default: 10]").setDefault("10").build());
+        parser.addArgument(
+            blt::arg_builder{"-p", "--python"}.setHelp("Only run the python scripts").setAction(blt::arg_action_t::STORE_TRUE).setDefault(false).
+                                               build());
         parser.addArgument(blt::arg_builder{"type"}.setDefault("all").setHelp("Type of network to run [ff, dl, default: all]").build());
 
         auto args = parser.parse_args(argc, argv);
@@ -545,16 +582,57 @@ namespace fp
         const auto type = blt::string::toLowerCase(args.get<std::string>("type"));
         const auto runs = std::stoi(args.get<std::string>("runs"));
         const auto restore = args.get<bool>("restore");
-        const auto path = "./" + std::to_string(blt::system::getCurrentTimeMilliseconds());
+        const auto path = binary_directory + std::to_string(blt::system::getCurrentTimeMilliseconds());
+
 
         if (type == "all")
         {
-            run_deep_learning_tests(path, runs, restore);
-            run_feed_forward_tests(path, runs, restore);
-        } else if (type == "ff")
+            auto [deep_stats, deep_tests] = run_deep_learning_tests(path, runs, restore);
+            auto [forward_stats, forward_tests] = run_feed_forward_tests(path, runs, restore);
+
+            auto average_forward_size = forward_stats.average_size();
+            auto average_deep_size = deep_stats.average_size();
+
+            {
+                std::ofstream test_results_f{path + "/test_results_table.txt"};
+                test_results_f << "\\begin{figure}" << std::endl;
+                test_results_f << "\t\\begin{tabular}{|c|c|c|c|}" << std::endl;
+                test_results_f << "\t\t\\hline" << std::endl;
+                test_results_f << "\t\tTest & Correct & Incorrect & Accuracy (\\%) \\\\" << std::endl;
+                test_results_f << "\t\t\\hline" << std::endl;
+                auto test_accuracy = forward_tests.hits / static_cast<double>(forward_tests.hits + forward_tests.misses) * 100;
+                test_results_f << "\t\tFeed-Forward & " << forward_tests.hits << " & " << forward_tests.misses << " & " << std::setprecision(2) <<
+                    test_accuracy << "\\\\" << std::endl;
+                test_accuracy = deep_tests.hits / static_cast<double>(deep_tests.hits + deep_tests.misses) * 100;
+                test_results_f << "\t\tDeep Learning & " << deep_tests.hits << " & " << deep_tests.misses << " & " << std::setprecision(2) <<
+                    test_accuracy << "\\\\" << std::endl;
+                test_results_f << "\t\\end{tabular}" << std::endl;
+                test_results_f << "\\end{figure}" << std::endl;
+
+                const auto [forward_epoch_stats] = forward_stats.average_stats();
+                std::ofstream train_forward{path + "/forward_train_results.csv"};
+                train_forward << "Epoch,Loss" << std::endl;
+                for (const auto& [i, v] : blt::enumerate(forward_epoch_stats))
+                    train_forward << i << ',' << v.average_loss << std::endl;
+
+                const auto [deep_epoch_stats] = deep_stats.average_stats();
+                std::ofstream train_deep{path + "/deep_train_results.csv"};
+                train_deep << "Epoch,Loss" << std::endl;
+                for (const auto& [i, v] : blt::enumerate(deep_epoch_stats))
+                    train_deep << i << ',' << v.average_loss << std::endl;
+
+                std::ofstream average_epochs{path + "/average_epochs.txt"};
+                average_epochs << average_forward_size << "," << average_deep_size << std::endl;
+            }
+
+            run_python_line_graph("Feed-Forward vs Deep Learning, Average Loss over Epochs", "epochs.png", path + "/forward_train_results.csv",
+                                  path + "/deep_train_results.csv", average_forward_size, average_deep_size);
+        }
+        else if (type == "ff")
         {
             run_feed_forward_tests(path, runs, restore);
-        } else if (type == "df")
+        }
+        else if (type == "df")
         {
             run_deep_learning_tests(path, runs, restore);
         }