COSC-4P80-Assignment-2/include/assign2/layer.h

#pragma once
/*
 *  Copyright (C) 2024  Brett Terpstra
 *
 *  This program is free software: you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation, either version 3 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program.  If not, see <https://www.gnu.org/licenses/>.
 */

#include "blt/std/assert.h"

#ifndef COSC_4P80_ASSIGNMENT_2_LAYER_H
#define COSC_4P80_ASSIGNMENT_2_LAYER_H
    
    #include <blt/std/types.h>
    #include <assign2/initializers.h>
    #include "blt/iterator/zip.h"
    #include "blt/iterator/iterator.h"
    #include "global_magic.h"

namespace assign2
{
    class neuron_t
    {
            friend layer_t;
        public:
            // empty neuron for loading from a stream
            explicit neuron_t(weight_view weights, weight_view dw): dw(dw), weights(weights)
            {}
            
            // neuron with bias
            explicit neuron_t(weight_view weights, weight_view dw, Scalar bias): bias(bias), dw(dw), weights(weights)
            {}
            
            Scalar activate(const std::vector<Scalar>& inputs, function_t* act_func)
            {
                BLT_ASSERT_MSG(inputs.size() == weights.size(), (std::to_string(inputs.size())  + " vs " + std::to_string(weights.size())).c_str());
                
                z = bias;
                for (auto [x, w] : blt::zip_iterator_container({inputs.begin(), inputs.end()}, {weights.begin(), weights.end()}))
                    z += x * w;
                a = act_func->call(z);
                return a;
            }
            
            void back_prop(function_t* act, const std::vector<Scalar>& previous_outputs, Scalar next_error)
            {
                // delta for weights
                error = act->derivative(z) * next_error;
                db = learn_rate * error;
                BLT_ASSERT(previous_outputs.size() == dw.size());
                for (auto [prev_out, d_weight] : blt::zip(previous_outputs, dw))
                {
                    // dw
                    d_weight = -learn_rate * prev_out * error;
                }
            }
            
            void update()
            {
                for (auto [w, d] : blt::in_pairs(weights, dw))
                    w += d;
                bias += db;
            }
            
            template<typename OStream>
            OStream& serialize(OStream& stream)
            {
                stream << bias;
                for (auto d : weights)
                    stream << d;
            }
            
            template<typename IStream>
            IStream& deserialize(IStream& stream)
            {
                for (auto& d : blt::iterate(weights).rev())
                    stream >> d;
                stream >> bias;
            }
            
            void debug() const
            {
                std::cout << bias << " ";
            }
        
        private:
            float z = 0;
            float a = 0;
            float bias = 0;
            float db = 0;
            float error = 0;
            weight_view dw;
            weight_view weights;
    };
    
    class layer_t
    {
            friend network_t;
        public:
            template<typename WeightFunc, typename BiasFunc>
            layer_t(const blt::i32 in, const blt::i32 out, function_t* act_func, WeightFunc w, BiasFunc b):
                    in_size(in), out_size(out), layer_id(layer_id_counter++), act_func(act_func)
            {
                neurons.reserve(out_size);
                weights.preallocate(in_size * out_size);
                weight_derivatives.preallocate(in_size * out_size);
                for (blt::i32 i = 0; i < out_size; i++)
                {
                    auto weight = weights.allocate_view(in_size);
                    auto dw = weight_derivatives.allocate_view(in_size);
                    for (auto& v : weight)
                        v = w(i);
                    neurons.push_back(neuron_t{weight, dw, b(i)});
                }
            }
            
            const std::vector<Scalar>& call(const std::vector<Scalar>& in)
            {
                outputs.clear();
                outputs.reserve(out_size);
#if BLT_DEBUG_LEVEL > 0
                if (in.size() != in_size)
                    throw std::runtime_exception("Input vector doesn't match expected input size!");
#endif
                for (auto& n : neurons)
                    outputs.push_back(n.activate(in, act_func));
                return outputs;
            }
            
            error_data_t back_prop(const std::vector<Scalar>& prev_layer_output,
                                                const std::variant<blt::ref<const std::vector<Scalar>>, blt::ref<const layer_t>>& data)
            {
                Scalar total_error = 0;
                Scalar total_derivative = 0;
                std::visit(blt::lambda_visitor{
                        // is provided if we are an output layer, contains output of this net (per neuron) and the expected output (per neuron)
                        [this, &prev_layer_output, &total_error, &total_derivative](const std::vector<Scalar>& expected) {
                            for (auto [i, n] : blt::enumerate(neurons))
                            {
                                auto d = outputs[i] - expected[i];
                                auto d2 = 0.5f * (d * d);
                                total_error += d2;
                                total_derivative += d;
                                n.back_prop(act_func, prev_layer_output, d);
                            }
                            total_error /= static_cast<Scalar>(expected.size());
                            total_derivative /= static_cast<Scalar>(expected.size());
                        },
                        // interior layer
                        [this, &prev_layer_output](const layer_t& layer) {
                            for (auto [i, n] : blt::enumerate(neurons))
                            {
                                Scalar w = 0;
                                // TODO: this is not efficient on the cache!
                                for (auto nn : layer.neurons)
                                    w += nn.error * nn.weights[i];
                                n.back_prop(act_func, prev_layer_output, w);
                            }
                        }
                }, data);
                return {total_error, total_derivative};
            }
            
            void update()
            {
                for (auto& n : neurons)
                    n.update();
            }
            
            template<typename OStream>
            OStream& serialize(OStream& stream)
            {
                for (auto d : neurons)
                    stream << d;
            }
            
            template<typename IStream>
            IStream& deserialize(IStream& stream)
            {
                for (auto& d : blt::iterate(neurons).rev())
                    stream >> d;
            }
            
            [[nodiscard]] inline blt::i32 get_in_size() const
            {
                return in_size;
            }
            
            [[nodiscard]] inline blt::i32 get_out_size() const
            {
                return out_size;
            }
            
            void debug() const
            {
                std::cout << "Bias: ";
                for (auto& v : neurons)
                    v.debug();
                std::cout << std::endl;
                weights.debug();
            }

#ifdef BLT_USE_GRAPHICS
            
            void render(blt::gfx::batch_renderer_2d& renderer) const
            {
                const blt::size_t distance_between_layers = 30;
                const float neuron_size = 30;
                const float padding = -5;
                for (const auto& [i, n] : blt::enumerate(neurons))
                {
                    auto color = std::abs(n.a);
                    renderer.drawPointInternal(blt::make_color(0.1, 0.1, 0.1),
                                               blt::gfx::point2d_t{static_cast<float>(i) * (neuron_size + padding) + neuron_size,
                                                                   static_cast<float>(layer_id * distance_between_layers) + neuron_size,
                                                                   neuron_size / 2}, 10);
                    auto outline_size = neuron_size + 10;
                    renderer.drawPointInternal(blt::make_color(color, color, color),
                                               blt::gfx::point2d_t{static_cast<float>(i) * (neuron_size + padding) + neuron_size,
                                                                   static_cast<float>(layer_id * distance_between_layers) + neuron_size,
                                                                   outline_size / 2}, 0);
//                    const ImVec2 alignment = ImVec2(0.5f, 0.5f);
//                    if (i > 0)
//                        ImGui::SameLine();
//                    ImGui::PushStyleVar(ImGuiStyleVar_SelectableTextAlign, alignment);
//                    std::string name;
//                    name = std::to_string(n.a);
//                    ImGui::Selectable(name.c_str(), false, ImGuiSelectableFlags_None, ImVec2(80, 80));
//                    ImGui::PopStyleVar();
                }
            }

#endif
        
        private:
            const blt::i32 in_size, out_size;
            const blt::size_t layer_id;
            weight_t weights;
            weight_t weight_derivatives;
            function_t* act_func;
            std::vector<neuron_t> neurons;
            std::vector<Scalar> outputs;
    };
}

#endif //COSC_4P80_ASSIGNMENT_2_LAYER_H
eigen because im a pussy 2024-10-21 16:42:03 -04:00			`#pragma once`
			`/*`
			`* Copyright (C) 2024 Brett Terpstra`
			`*`
			`* This program is free software: you can redistribute it and/or modify`
			`* it under the terms of the GNU General Public License as published by`
			`* the Free Software Foundation, either version 3 of the License, or`
			`* (at your option) any later version.`
			`*`
			`* This program is distributed in the hope that it will be useful,`
			`* but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`* GNU General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU General Public License`
			`* along with this program. If not, see <https://www.gnu.org/licenses/>.`
			`*/`

silly boi 2024-10-25 14:20:18 -04:00			`#include "blt/std/assert.h"`
works 2024-10-27 18:09:37 -04:00
eigen because im a pussy 2024-10-21 16:42:03 -04:00			`#ifndef COSC_4P80_ASSIGNMENT_2_LAYER_H`
			`#define COSC_4P80_ASSIGNMENT_2_LAYER_H`
works 2024-10-27 18:09:37 -04:00
			`#include <blt/std/types.h>`
			`#include <assign2/initializers.h>`
			`#include "blt/iterator/zip.h"`
			`#include "blt/iterator/iterator.h"`
			`#include "global_magic.h"`
eigen because im a pussy 2024-10-21 16:42:03 -04:00
			`namespace assign2`
			`{`
work 2024-10-23 01:51:32 -04:00			`class neuron_t`
eigen because im a pussy 2024-10-21 16:42:03 -04:00			`{`
getting closer! 2024-10-25 01:22:32 -04:00			`friend layer_t;`
eigen because im a pussy 2024-10-21 16:42:03 -04:00			`public:`
work 2024-10-23 01:51:32 -04:00			`// empty neuron for loading from a stream`
fuck you 2024-10-25 14:01:47 -04:00			`explicit neuron_t(weight_view weights, weight_view dw): dw(dw), weights(weights)`
work 2024-10-23 01:51:32 -04:00			`{}`

			`// neuron with bias`
fuck you 2024-10-25 14:01:47 -04:00			`explicit neuron_t(weight_view weights, weight_view dw, Scalar bias): bias(bias), dw(dw), weights(weights)`
eigen because im a pussy 2024-10-21 16:42:03 -04:00			`{}`

sleep 2024-10-28 01:55:13 -04:00			`Scalar activate(const std::vector<Scalar>& inputs, function_t* act_func)`
silly 2024-10-21 19:25:00 -04:00			`{`
sleep 2024-10-28 01:55:13 -04:00			`BLT_ASSERT_MSG(inputs.size() == weights.size(), (std::to_string(inputs.size()) + " vs " + std::to_string(weights.size())).c_str());`

getting closer! 2024-10-25 01:22:32 -04:00			`z = bias;`
sleep 2024-10-28 01:55:13 -04:00			`for (auto [x, w] : blt::zip_iterator_container({inputs.begin(), inputs.end()}, {weights.begin(), weights.end()}))`
getting closer! 2024-10-25 01:22:32 -04:00			`z += x * w;`
			`a = act_func->call(z);`
			`return a;`
silly 2024-10-21 19:25:00 -04:00			`}`

fuck you 2024-10-25 14:01:47 -04:00			`void back_prop(function_t* act, const std::vector<Scalar>& previous_outputs, Scalar next_error)`
			`{`
			`// delta for weights`
			`error = act->derivative(z) * next_error;`
works 2024-10-27 18:09:37 -04:00			`db = learn_rate * error;`
silly boi 2024-10-25 14:20:18 -04:00			`BLT_ASSERT(previous_outputs.size() == dw.size());`
fuck you 2024-10-25 14:01:47 -04:00			`for (auto [prev_out, d_weight] : blt::zip(previous_outputs, dw))`
			`{`
works 2024-10-27 18:09:37 -04:00			`// dw`
			`d_weight = -learn_rate * prev_out * error;`
fuck you 2024-10-25 14:01:47 -04:00			`}`
			`}`

			`void update()`
			`{`
			`for (auto [w, d] : blt::in_pairs(weights, dw))`
			`w += d;`
works 2024-10-27 18:09:37 -04:00			`bias += db;`
fuck you 2024-10-25 14:01:47 -04:00			`}`

work 2024-10-23 01:51:32 -04:00			`template<typename OStream>`
			`OStream& serialize(OStream& stream)`
eigen because im a pussy 2024-10-21 16:42:03 -04:00			`{`
work 2024-10-23 01:51:32 -04:00			`stream << bias;`
			`for (auto d : weights)`
			`stream << d;`
			`}`

			`template<typename IStream>`
			`IStream& deserialize(IStream& stream)`
			`{`
			`for (auto& d : blt::iterate(weights).rev())`
			`stream >> d;`
			`stream >> bias;`
eigen because im a pussy 2024-10-21 16:42:03 -04:00			`}`
getting closer! 2024-10-25 01:22:32 -04:00
			`void debug() const`
			`{`
			`std::cout << bias << " ";`
			`}`
eigen because im a pussy 2024-10-21 16:42:03 -04:00
work 2024-10-23 01:51:32 -04:00			`private:`
getting closer! 2024-10-25 01:22:32 -04:00			`float z = 0;`
			`float a = 0;`
			`float bias = 0;`
works 2024-10-27 18:09:37 -04:00			`float db = 0;`
getting closer! 2024-10-25 01:22:32 -04:00			`float error = 0;`
fuck you 2024-10-25 14:01:47 -04:00			`weight_view dw;`
work 2024-10-23 01:51:32 -04:00			`weight_view weights;`
			`};`

			`class layer_t`
			`{`
fuck you 2024-10-25 14:01:47 -04:00			`friend network_t;`
work 2024-10-23 01:51:32 -04:00			`public:`
			`template<typename WeightFunc, typename BiasFunc>`
getting closer! 2024-10-25 01:22:32 -04:00			`layer_t(const blt::i32 in, const blt::i32 out, function_t* act_func, WeightFunc w, BiasFunc b):`
works 2024-10-27 18:09:37 -04:00			`in_size(in), out_size(out), layer_id(layer_id_counter++), act_func(act_func)`
work 2024-10-23 01:51:32 -04:00			`{`
			`neurons.reserve(out_size);`
silly boi 2024-10-25 14:20:18 -04:00			`weights.preallocate(in_size * out_size);`
			`weight_derivatives.preallocate(in_size * out_size);`
work 2024-10-23 01:51:32 -04:00			`for (blt::i32 i = 0; i < out_size; i++)`
			`{`
			`auto weight = weights.allocate_view(in_size);`
fuck you 2024-10-25 14:01:47 -04:00			`auto dw = weight_derivatives.allocate_view(in_size);`
work 2024-10-23 01:51:32 -04:00			`for (auto& v : weight)`
			`v = w(i);`
fuck you 2024-10-25 14:01:47 -04:00			`neurons.push_back(neuron_t{weight, dw, b(i)});`
work 2024-10-23 01:51:32 -04:00			`}`
			`}`

fuck you 2024-10-25 14:01:47 -04:00			`const std::vector<Scalar>& call(const std::vector<Scalar>& in)`
work 2024-10-23 01:51:32 -04:00			`{`
fuck you 2024-10-25 14:01:47 -04:00			`outputs.clear();`
			`outputs.reserve(out_size);`
work 2024-10-23 01:51:32 -04:00			`#if BLT_DEBUG_LEVEL > 0`
			`if (in.size() != in_size)`
			`throw std::runtime_exception("Input vector doesn't match expected input size!");`
			`#endif`
			`for (auto& n : neurons)`
sleep 2024-10-28 01:55:13 -04:00			`outputs.push_back(n.activate(in, act_func));`
fuck you 2024-10-25 14:01:47 -04:00			`return outputs;`
work 2024-10-23 01:51:32 -04:00			`}`

sleep 2024-10-28 01:55:13 -04:00			`error_data_t back_prop(const std::vector<Scalar>& prev_layer_output,`
works 2024-10-27 18:09:37 -04:00			`const std::variant<blt::ref<const std::vector<Scalar>>, blt::ref<const layer_t>>& data)`
getting closer! 2024-10-25 01:22:32 -04:00			`{`
works 2024-10-27 18:09:37 -04:00			`Scalar total_error = 0;`
			`Scalar total_derivative = 0;`
			`std::visit(blt::lambda_visitor{`
fuck you 2024-10-25 14:01:47 -04:00			`// is provided if we are an output layer, contains output of this net (per neuron) and the expected output (per neuron)`
works 2024-10-27 18:09:37 -04:00			`[this, &prev_layer_output, &total_error, &total_derivative](const std::vector<Scalar>& expected) {`
fuck you 2024-10-25 14:01:47 -04:00			`for (auto [i, n] : blt::enumerate(neurons))`
			`{`
			`auto d = outputs[i] - expected[i];`
			`auto d2 = 0.5f * (d * d);`
			`total_error += d2;`
works 2024-10-27 18:09:37 -04:00			`total_derivative += d;`
			`n.back_prop(act_func, prev_layer_output, d);`
fuck you 2024-10-25 14:01:47 -04:00			`}`
sleep 2024-10-28 01:55:13 -04:00			`total_error /= static_cast<Scalar>(expected.size());`
			`total_derivative /= static_cast<Scalar>(expected.size());`
fuck you 2024-10-25 14:01:47 -04:00			`},`
			`// interior layer`
			`[this, &prev_layer_output](const layer_t& layer) {`
			`for (auto [i, n] : blt::enumerate(neurons))`
			`{`
works 2024-10-27 18:09:37 -04:00			`Scalar w = 0;`
fuck you 2024-10-25 14:01:47 -04:00			`// TODO: this is not efficient on the cache!`
			`for (auto nn : layer.neurons)`
works 2024-10-27 18:09:37 -04:00			`w += nn.error * nn.weights[i];`
			`n.back_prop(act_func, prev_layer_output, w);`
fuck you 2024-10-25 14:01:47 -04:00			`}`
			`}`
			`}, data);`
works 2024-10-27 18:09:37 -04:00			`return {total_error, total_derivative};`
fuck you 2024-10-25 14:01:47 -04:00			`}`

			`void update()`
			`{`
			`for (auto& n : neurons)`
			`n.update();`
getting closer! 2024-10-25 01:22:32 -04:00			`}`

work 2024-10-23 01:51:32 -04:00			`template<typename OStream>`
			`OStream& serialize(OStream& stream)`
			`{`
			`for (auto d : neurons)`
			`stream << d;`
			`}`

			`template<typename IStream>`
			`IStream& deserialize(IStream& stream)`
			`{`
			`for (auto& d : blt::iterate(neurons).rev())`
			`stream >> d;`
			`}`

			`[[nodiscard]] inline blt::i32 get_in_size() const`
			`{`
			`return in_size;`
			`}`

			`[[nodiscard]] inline blt::i32 get_out_size() const`
			`{`
			`return out_size;`
			`}`
getting closer! 2024-10-25 01:22:32 -04:00
			`void debug() const`
			`{`
			`std::cout << "Bias: ";`
			`for (auto& v : neurons)`
			`v.debug();`
			`std::cout << std::endl;`
			`weights.debug();`
			`}`
works 2024-10-27 18:09:37 -04:00
			`#ifdef BLT_USE_GRAPHICS`

sleep 2024-10-28 01:55:13 -04:00			`void render(blt::gfx::batch_renderer_2d& renderer) const`
works 2024-10-27 18:09:37 -04:00			`{`
sleep 2024-10-28 01:55:13 -04:00			`const blt::size_t distance_between_layers = 30;`
			`const float neuron_size = 30;`
			`const float padding = -5;`
			`for (const auto& [i, n] : blt::enumerate(neurons))`
			`{`
			`auto color = std::abs(n.a);`
			`renderer.drawPointInternal(blt::make_color(0.1, 0.1, 0.1),`
			`blt::gfx::point2d_t{static_cast<float>(i) * (neuron_size + padding) + neuron_size,`
			`static_cast<float>(layer_id * distance_between_layers) + neuron_size,`
			`neuron_size / 2}, 10);`
			`auto outline_size = neuron_size + 10;`
			`renderer.drawPointInternal(blt::make_color(color, color, color),`
			`blt::gfx::point2d_t{static_cast<float>(i) * (neuron_size + padding) + neuron_size,`
			`static_cast<float>(layer_id * distance_between_layers) + neuron_size,`
			`outline_size / 2}, 0);`
			`// const ImVec2 alignment = ImVec2(0.5f, 0.5f);`
			`// if (i > 0)`
			`// ImGui::SameLine();`
			`// ImGui::PushStyleVar(ImGuiStyleVar_SelectableTextAlign, alignment);`
			`// std::string name;`
			`// name = std::to_string(n.a);`
			`// ImGui::Selectable(name.c_str(), false, ImGuiSelectableFlags_None, ImVec2(80, 80));`
			`// ImGui::PopStyleVar();`
			`}`
works 2024-10-27 18:09:37 -04:00			`}`

			`#endif`
getting closer! 2024-10-25 01:22:32 -04:00
eigen because im a pussy 2024-10-21 16:42:03 -04:00			`private:`
			`const blt::i32 in_size, out_size;`
works 2024-10-27 18:09:37 -04:00			`const blt::size_t layer_id;`
work 2024-10-23 01:51:32 -04:00			`weight_t weights;`
fuck you 2024-10-25 14:01:47 -04:00			`weight_t weight_derivatives;`
getting closer! 2024-10-25 01:22:32 -04:00			`function_t* act_func;`
work 2024-10-23 01:51:32 -04:00			`std::vector<neuron_t> neurons;`
fuck you 2024-10-25 14:01:47 -04:00			`std::vector<Scalar> outputs;`
eigen because im a pussy 2024-10-21 16:42:03 -04:00			`};`
			`}`

			`#endif //COSC_4P80_ASSIGNMENT_2_LAYER_H`