AlgoPlus/mlp_8h_source.html

#pragma once


#ifdef __cplusplus

#include <cassert>

#include <iostream>

#include <vector>

#include "../activation/activation_functions.h"

#include "../metrics/metrics.h"

#include "nn.h"

#endif


/**
 * @brief Multi-layer perceptron assembled from a sequence of nn::Linear layers.
 *
 * The constructor copies the dataset, takes the last value of every row as
 * that row's label, and creates one nn::Linear layer per (in, out) pair of the
 * requested architecture. fit() trains on the stored rows and predict() runs a
 * single sample through the layers, returning 1.0 or -1.0.
 */
class MLP {
    /// Feature rows; the trailing label of each row is removed by the constructor.
    std::vector<std::vector<double>> data_;
    /// One label per row of data_, in the same order.
    std::vector<double> labels_;
    /// Layers, applied front to back during a forward pass.
    std::vector<nn::Linear> seq_;
    /// True when the last layer of the architecture has exactly one output.
    /// Stored as bool: it is a flag, not a numeric quantity.
    bool binary_;
    /// Number of passes over the dataset performed by fit().
    int epochs_;
    /// Step size handed to nn::Linear::update_weights.
    double learning_rate_;

  public:
    /**
     * @brief Builds the network and stores the training data.
     * @param data rows of samples; the last element of each row is its label
     * @param arch (in_features, out_features) pair for every layer, in order
     * @param epochs number of training epochs (default 100)
     * @param learning_rate step size used when updating weights (default 0.001)
     */
    explicit MLP(std::vector<std::vector<double>> const&, std::vector<std::pair<int, int>> const,
                 const int epochs = 100, const double learning_rate = 0.001);

    /// @brief Trains the network on the data given to the constructor.
    void fit();

    /**
     * @brief Classifies a single sample.
     * @return 1.0 when the first network output is positive, -1.0 otherwise
     */
    double predict(std::vector<double> const&);
};


/**
 * @brief Builds the network and stores the training data.
 *
 * Copies @p data, moves the last element of every row into the label vector,
 * and creates one nn::Linear (with its third argument set to true) for each
 * (in_features, out_features) pair in @p arch.
 *
 * Preconditions are checked with assert, so they are only enforced in builds
 * where NDEBUG is not defined.
 *
 * @param data non-empty set of rows; every row must be non-empty because its
 *             last element is taken as the label
 * @param arch non-empty list of (in_features, out_features), both positive
 * @param epochs number of training epochs, must be positive
 * @param learning_rate step size for weight updates, must be positive
 */
inline MLP::MLP(std::vector<std::vector<double>> const& data,
                std::vector<std::pair<int, int>> const arch, const int epochs,
                const double learning_rate) {
    assert(data.size() > 0);
    assert(epochs > 0);
    assert(learning_rate > 0);
    assert(arch.size() > 0);

    this->epochs_ = epochs;
    this->data_ = data;
    this->learning_rate_ = learning_rate;
    this->binary_ = (arch.back().second == 1);

    // Split every stored row into features (kept in data_) and label.
    this->labels_.reserve(this->data_.size());
    for (std::vector<double>& row : this->data_) {
        // back() and pop_back() on an empty vector are undefined behaviour,
        // so reject rows that carry no label at all.
        assert(!row.empty());
        this->labels_.push_back(row.back());
        row.pop_back();
    }

    // One linear layer per requested (in, out) pair, in the given order.
    this->seq_.reserve(arch.size());
    for (auto [in_features, out_features] : arch) {
        assert(in_features > 0);
        assert(out_features > 0);
        this->seq_.emplace_back(in_features, out_features, true);
    }
}


inline void MLP::fit() {

    for (int epoch = 0; epoch < this->epochs_; epoch++) {

        std::vector<double> y_pred;

        for (size_t i = 0; i < this->data_.size(); i++) {

            std::vector<double> out_ = this->data_[i];

            for (nn::Linear& layer : this->seq_) {

                out_ = layer.forward(out_);

            }


            // double y_pred;

            double y_pred_ = (out_[0] > 0.0) ? 1.0 : -1.0;

            y_pred.push_back(y_pred_);

            // TODO: Perform multiclass classification

            // else {

            //     std::vector<double> logits = activation::softmax(out_);

            //     y_pred = std::max_element(logits.begin(), logits.end()) -

            //     logits.begin(); std::cout << y_pred << '\n';

            // }

            double err = y_pred_ - this->labels_[i];


            if (err != 0) {

                for (nn::Linear& layer : this->seq_) {

                    layer.update_weights(this->data_[i], err, this->learning_rate_);

                }

            }

        }

        std::cout << "Epoch: " << epoch + 1 << ": "

                  << "Accuracy: " << metrics::accuracy_score(this->labels_, y_pred)

                  << " | f1_score: " << metrics::f1_score(this->labels_, y_pred)

                  << " | Recall: " << metrics::recall(this->labels_, y_pred)

                  << " | Precision: " << metrics::precision(this->labels_, y_pred) << '\n';

    }

}


inline double MLP::predict(std::vector<double> const& input) {

    assert(input.size() == this->data_[0].size());

    std::vector<double> out_ = input;

    for (nn::Linear& layer : this->seq_) {

        out_ = layer.forward(out_);

    }


    return (out_[0] > 0.0) ? 1.0 : -1.0;

    // else {

    //     std::vector<double> logits = activation::softmax(out_);

    //     return std::max_element(logits.begin(), logits.end()) - logits.begin();

    // }

}


MLP::fit
void fit()
fit an MLP on the input data
Definition mlp.h:75

MLP::predict
double predict(std::vector< double > const &)
performs inference
Definition mlp.h:109

MLP::MLP
MLP(std::vector< std::vector< double > > const &, std::vector< std::pair< int, int > > const, const int epochs=100, const double learning_rate=0.001)
constructor for the MLP class (takes the dataset and the layer architecture; epochs and learning rate are optional)
Definition mlp.h:52

nn::Linear
Linear module. This implementation mostly follows PyTorch's implementation.
Definition nn.h:18

metrics::f1_score
double f1_score(const std::vector< double > &y, const std::vector< double > &y_pred)
f1 score function: [2 * precision * recall / (precision + recall)]
Definition metrics.h:99

metrics::accuracy_score
double accuracy_score(const std::vector< double > &y, const std::vector< double > &y_pred)
accuracy score function[(tp + tn) / (tp + tn + fp + fn)]
Definition metrics.h:81

metrics::recall
double recall(const std::vector< double > &y, const std::vector< double > &y_pred)
recall function: [tp / (tp + fn)]
Definition metrics.h:72

metrics::precision
double precision(const std::vector< double > &y, const std::vector< double > &y_pred)
precision function: [tp / (tp + fp)]
Definition metrics.h:90