matrix/Matrix_8hpp_source.html

 #ifndef MACHINE_LEARNING_MATRIX_HPP
 #define MACHINE_LEARNING_MATRIX_HPP

 #include <algorithm>
 #include <cmath>
 #include <complex>
 #include <functional>
 #include <iomanip>
 #include <iostream>
 #include <limits>
 #include <set>
 #include <stdexcept>
 #include <string>
 #include <type_traits>
 #include <utility>
 #include <vector>
 #include "include/nr3/nr3.h"
 #include "include/nr3/eigen_unsym.h"
 #include "include/csv_reader/CSVReader.hpp"

 using namespace std;

 template<
     typename T,
     typename = typename std::enable_if<std::is_arithmetic<T>::value, T>::type>
 class Matrix {
  private:
   size_t mRows;
   size_t mCols;
   std::vector<T> mData;

   /**
    * Checks that (row, col) addresses an existing element.
    *
    * Indices are unsigned, so only the upper bound has to be tested.
    *
    * @param row zero-based row index
    * @param col zero-based column index
    * @throws invalid_argument if either index lies outside the matrix
    */
   void validateIndexes(size_t row, size_t col) const {
     if (row >= mRows)
       throw invalid_argument(
           // with zero rows "mRows - 1" would wrap around, so use a dedicated message
           mRows == 0
           ? "Invalid row index (" + to_string(row) + "): matrix has no rows"
           : "Invalid row index (" + to_string(row) + "): should be between 0 and " + to_string(mRows - 1));
     if (col >= mCols)
       throw invalid_argument(
           mCols == 0
           ? "Invalid column index (" + to_string(col) + "): matrix has no columns"
           : "Invalid column index (" + to_string(col) + "): should be between 0 and " + to_string(mCols - 1));
   }

   /**
    * Reorders eigenvalues from largest to smallest and permutes the columns
    * of the eigenvector matrix in the same way.
    *
    * No compatibility check between the two arguments is performed.
    *
    * @param eigenvalues  matrix whose first column holds one eigenvalue per row
    * @param eigenvectors matrix whose column k is paired with eigenvalue k
    * @return pair (reordered eigenvalues, reordered eigenvectors)
    */
   static pair<Matrix, Matrix> eigsort(Matrix eigenvalues, Matrix eigenvectors) {
     Matrix sortedValues(eigenvalues.mRows, eigenvalues.mCols, eigenvalues.mData);
     Matrix sortedVectors(eigenvectors.mRows, eigenvectors.mCols, eigenvectors.mData);

     // insertion sort on the indices: each index goes right after every
     // already-placed index whose eigenvalue is strictly larger
     vector<size_t> order;
     for (size_t current = 0; current < eigenvalues.nRows(); ++current) {
       size_t slot = 0;
       for (size_t placed = 0; placed < order.size(); ++placed) {
         if (eigenvalues(current, 0) < eigenvalues(order[placed], 0))
           ++slot;
       }
       order.insert(order.begin() + slot, current);
     }

     // copy values and eigenvector columns into their new positions
     for (size_t target = 0; target < order.size(); ++target) {
       const size_t source = order[target];
       sortedValues(target, 0) = eigenvalues(source, 0);

       for (size_t row = 0; row < eigenvectors.nRows(); ++row)
         sortedVectors(row, target) = eigenvectors(row, source);
     }

     return make_pair(sortedValues, sortedVectors);
   }

  public:

   // Axis selector; no member visible in this class references it.
   enum Axis { ALL, ROWS, COLUMNS };

   // Number of columns of the matrix.
   size_t nCols() const { return mCols; }

   // Number of rows of the matrix.
   size_t nRows() const { return mRows; }

   //region Constructors

   Matrix() {
     mRows = mCols = 0;
   }

   /**
    * Creates a square dimension x dimension matrix.
    *
    * Delegates to the (rows, cols) constructor. The previous body only built
    * and discarded a temporary, leaving this object's sizes uninitialized.
    *
    * @param dimension number of rows and of columns
    */
   Matrix(size_t dimension) : Matrix(dimension, dimension) {
   }

   /**
    * Creates a rows x cols matrix whose storage holds rows * cols
    * value-initialized elements.
    */
   Matrix(size_t rows, size_t cols)
       : mRows(rows),
         mCols(cols),
         mData(rows * cols) {
   }

   /**
    * Creates a rows x cols matrix populated with a copy of `data`
    * (stored row by row, as read back by operator()).
    *
    * @throws invalid_argument if data.size() differs from rows * cols
    */
   Matrix(size_t rows, size_t cols, const vector<T> &data)
       : mRows(rows),
         mCols(cols) {
     const bool sizeMatches = (rows * cols == data.size());
     if (!sizeMatches)
       throw invalid_argument("Matrix dimension incompatible with its initializing vector.");
     mData.assign(data.begin(), data.end());
   }

   template<std::size_t N>
   Matrix(size_t rows, size_t cols, T (&data)[N]) {
     if (N != rows * cols)
       throw invalid_argument("Matrix dimension incompatible with its initializing vector.");
     vector<T> v(data, data + N);
     Matrix(rows, cols, v);
   }
   //endregion

   //region Operators

   //region Scalar operators

   /** Returns a new matrix in which `value` has been added to every element of `m`. */
   friend Matrix operator+(const Matrix &m, double value) {
     Matrix sum(m.mRows, m.mCols);

     // element order does not matter, so walk the flat storage directly
     #pragma omp parallel for
     for (size_t k = 0; k < m.mData.size(); k++)
       sum.mData[k] = value + m.mData[k];

     return sum;
   }

   // Scalar + matrix: forwards to matrix + scalar.
   friend Matrix operator+(double value, const Matrix &m) {
     return m + value;
   }

   // Matrix - scalar: implemented as adding the negated scalar.
   friend Matrix operator-(const Matrix &m, double value) {
     return m + (-value);
   }

   /**
    * Scalar - matrix: every element of the result is value - m(i, j).
    *
    * Subtraction is not commutative, so this cannot forward to m - value
    * (which is what the previous implementation returned).
    */
   friend Matrix operator-(double value, const Matrix &m) {
     Matrix result(m.mRows, m.mCols);

     #pragma omp parallel for collapse(2)
     for (size_t i = 0; i < m.mRows; i++) {
       for (size_t j = 0; j < m.mCols; j++) {
         result(i, j) = value - m(i, j);
       }
     }

     return result;
   }

   /** Returns a new matrix in which every element of `m` has been multiplied by `value`. */
   friend Matrix operator*(const Matrix &m, double value) {
     Matrix scaled(m.mRows, m.mCols);

     #pragma omp parallel for
     for (size_t k = 0; k < m.mData.size(); k++)
       scaled.mData[k] = value * m.mData[k];

     return scaled;
   }

   // Scalar * matrix: forwards to matrix * scalar.
   friend Matrix operator*(double value, const Matrix &m) {
     return m * value;
   }

   /** Returns a new matrix in which every element of `m` has been divided by `value`. */
   friend Matrix operator/(const Matrix &m, double value) {
     Matrix quotient(m.mRows, m.mCols);

     #pragma omp parallel for
     for (size_t k = 0; k < m.mData.size(); k++)
       quotient.mData[k] = m.mData[k] / value;

     return quotient;
   }

   /**
    * Scalar / matrix: every element of the result is value / m(i, j).
    * Division is not commutative, hence the dedicated implementation.
    */
   friend Matrix operator/(double value, const Matrix &m) {
     Matrix quotient(m.mRows, m.mCols);

     #pragma omp parallel for
     for (size_t k = 0; k < m.mData.size(); k++)
       quotient.mData[k] = value / m.mData[k];

     return quotient;
   }

   // In-place scalar arithmetic. Each operator applies `value` to every
   // element and returns a reference to this matrix; returning by value, as
   // before, copied the whole matrix on every call.

   /** Adds `value` to every element. */
   Matrix &operator+=(double value) {
     #pragma omp parallel for
     for (size_t i = 0; i < mData.size(); i++)
       mData[i] += value;
     return *this;
   }

   /** Subtracts `value` from every element. */
   Matrix &operator-=(double value) {
     #pragma omp parallel for
     for (size_t i = 0; i < mData.size(); i++)
       mData[i] -= value;
     return *this;
   }

   /** Multiplies every element by `value`. */
   Matrix &operator*=(double value) {
     #pragma omp parallel for
     for (size_t i = 0; i < mData.size(); i++)
       mData[i] *= value;
     return *this;
   }

   /** Divides every element by `value`. */
   Matrix &operator/=(double value) {
     #pragma omp parallel for
     for (size_t i = 0; i < mData.size(); i++)
       mData[i] /= value;
     return *this;
   }
   //endregion

   //region Matrix operators

   /**
    * Element-wise sum of two matrices with identical dimensions.
    *
    * Declared const: the operation never modifies *this, and const
    * matrices can now be used as the left operand.
    *
    * @param b right operand
    * @return new matrix holding the sum
    * @throws invalid_argument if the dimensions differ
    */
   Matrix operator+(const Matrix &b) const {
     if (mRows != b.mRows || mCols != b.mCols)
       throw invalid_argument("Cannot add these matrices: L = " + to_string(mRows) + "x" + to_string(mCols) + ", R = "
                                  + to_string(b.mRows) + "x" + to_string(b.mCols));

     Matrix result(mRows, mCols);

     #pragma omp parallel for collapse(2)
     for (size_t i = 0; i < mRows; i++) {
       for (size_t j = 0; j < mCols; j++) {
         result(i, j) = operator()(i, j) + b(i, j);
       }
     }

     return result;
   }

   /**
    * Element-wise difference of two matrices with identical dimensions.
    *
    * Declared const: the operation never modifies *this, and const
    * matrices can now be used as the left operand.
    *
    * @param b right operand
    * @return new matrix holding (*this) - b
    * @throws invalid_argument if the dimensions differ
    */
   Matrix operator-(const Matrix &b) const {
     if (mRows != b.mRows || mCols != b.mCols)
       throw invalid_argument(
           "Cannot subtract these matrices: L = " + to_string(mRows) + "x" + to_string(mCols) + ", R = "
               + to_string(b.mRows) + "x" + to_string(b.mCols));

     Matrix result(mRows, mCols);

     #pragma omp parallel for collapse(2)
     for (size_t i = 0; i < mRows; i++) {
       for (size_t j = 0; j < mCols; j++) {
         result(i, j) = operator()(i, j) - b(i, j);
       }
     }

     return result;
   }

   /**
    * Matrix product (*this) * b.
    *
    * @param b right operand; its row count must equal this matrix's column count
    * @return new matrix with nRows() rows and b.nCols() columns
    * @throws invalid_argument if the inner dimensions differ
    */
   Matrix operator*(const Matrix &b) const {
     const bool compatible = (mCols == b.mRows);
     if (!compatible)
       throw invalid_argument(
           "Cannot multiply these matrices: L = " + to_string(this->mRows) + "x" +
               to_string(this->mCols) + ", R = " + to_string(b.mRows) + "x" + to_string(b.mCols));

     Matrix product = zeros(mRows, b.mCols);

     // row / inner / column loop order: the left factor is read once per
     // (row, inner) pair and then applied across a whole row of b
     #pragma omp parallel for if(product.mRows * product.mCols > 250)
     for (size_t r = 0; r < product.mRows; r++) {
       for (size_t inner = 0; inner < mCols; inner++) {
         double factor = operator()(r, inner);
         for (size_t c = 0; c < product.mCols; c++) {
           product(r, c) += factor * b(inner, c);
         }
       }
     }

     return product;
   }

   /**
    * Adds `other` to this matrix element by element, in place.
    *
    * @throws invalid_argument if the dimensions differ
    */
   Matrix &operator+=(const Matrix &other) {
     const bool sameShape = (mRows == other.mRows && mCols == other.mCols);
     if (!sameShape)
       throw invalid_argument("Cannot add these matrices: L = " + to_string(mRows) + "x" + to_string(mCols) + ", R = "
                                  + to_string(other.mRows) + "x" + to_string(other.mCols));

     // both operands share the same layout, so the flat storage can be walked directly
     #pragma omp parallel for
     for (size_t k = 0; k < other.mRows * other.mCols; k++)
       mData[k] += other.mData[k];

     return *this;
   }

   /**
    * Subtracts `other` from this matrix element by element, in place.
    *
    * @throws invalid_argument if the dimensions differ
    */
   Matrix &operator-=(const Matrix &other) {
     const bool sameShape = (mRows == other.mRows && mCols == other.mCols);
     if (!sameShape)
       throw invalid_argument(
           "Cannot subtract these matrices: L = " + to_string(mRows) + "x" + to_string(mCols) + ", R = "
               + to_string(other.mRows) + "x" + to_string(other.mCols));

     // both operands share the same layout, so the flat storage can be walked directly
     #pragma omp parallel for
     for (size_t k = 0; k < other.mRows * other.mCols; k++)
       mData[k] -= other.mData[k];

     return *this;
   }

   /**
    * Replaces this matrix with the matrix product (*this) * other.
    * The dimensions of *this become nRows() x other.nCols().
    *
    * @throws invalid_argument if nCols() differs from other.nRows()
    */
   Matrix &operator*=(const Matrix &other) {
     if (!(mCols == other.mRows))
       throw invalid_argument(
           "Cannot multiply these matrices: L " + to_string(mRows) + "x" +
               to_string(mCols) + ", R " + to_string(other.mRows) + "x" + to_string(other.mCols));

     // the product is built in a scratch matrix because every cell still
     // needs the untouched left operand
     Matrix product(mRows, other.mCols);

     #pragma omp parallel for collapse(2)
     for (size_t r = 0; r < product.mRows; r++) {
       for (size_t c = 0; c < product.mCols; c++) {
         product(r, c) = 0;
         for (size_t inner = 0; inner < mCols; inner++)
           product(r, c) += operator()(r, inner) * other(inner, c);
       }
     }

     // adopt the result's shape and storage
     mRows = product.mRows;
     mCols = product.mCols;
     mData.swap(product.mData);
     return *this;
   }
   //endregion

   //region Equality operators

   /**
    * Element-wise comparison against a scalar.
    *
    * @return integer matrix of the same shape holding 1 where the element
    *         equals `value` and 0 elsewhere
    */
   Matrix<int> operator==(const T &value) {
     Matrix<int> mask(mRows, mCols);

     #pragma omp parallel for collapse(2)
     for (size_t r = 0; r < mRows; r++) {
       for (size_t c = 0; c < mCols; c++) {
         const bool same = (operator()(r, c) == value);
         mask(r, c) = same;
       }
     }

     return mask;
   }

   /**
    * Whole-matrix equality: true when both matrices have the same shape
    * and every pair of corresponding elements compares equal.
    */
   bool operator==(const Matrix &other) {
     const bool sameShape = (mRows == other.mRows && mCols == other.mCols);
     // vector equality compares the sizes first and then element by element
     return sameShape && mData == other.mData;
   }

   /**
    * Element-wise "not equal" against a scalar.
    *
    * The result is computed directly. The former expression
    * -((*this == value) - 1) produced a Matrix<int>, which cannot be
    * returned as Matrix<T> unless T is int.
    *
    * @param value scalar to compare with; converted to T first, as happens
    *              when it is passed to operator==(const T &)
    * @return matrix of the same shape holding 1 where the element differs
    *         from `value` and 0 elsewhere
    */
   Matrix operator!=(const double &value) {
     const T target = static_cast<T>(value);
     Matrix result(mRows, mCols);

     #pragma omp parallel for collapse(2)
     for (size_t i = 0; i < mRows; i++) {
       for (size_t j = 0; j < mCols; j++) {
         result(i, j) = operator()(i, j) != target;
       }
     }

     return result;
   }

   // Whole-matrix inequality: the logical negation of operator==(const Matrix &).
   bool operator!=(const Matrix &other) {
     return !(*this == other);
   }
   //endregion

   /**
    * Unary minus: returns a new matrix with every element negated.
    *
    * The row index runs over mRows and the column index over mCols. The
    * previous loop had the two bounds swapped, which only worked for
    * square matrices.
    */
   Matrix operator-() {
     Matrix result(this->mRows, this->mCols);

     #pragma omp parallel for collapse(2)
     for (size_t i = 0; i < mRows; i++) {
       for (size_t j = 0; j < mCols; j++) {
         result(i, j) = -operator()(i, j);
       }
     }

     return result;
   }

   //region Functors

   // Mutable element access: returns a reference to the element at row i,
   // column j. Elements are stored row by row (index i * mCols + j).
   // Throws invalid_argument (via validateIndexes) when out of range.
   T &operator()(size_t i, size_t j) {
     validateIndexes(i, j);
     return mData[i * mCols + j];
   }

   // Read-only element access: returns a copy of the element at row i,
   // column j. Throws invalid_argument when out of range.
   T operator()(size_t i, size_t j) const {
     validateIndexes(i, j);
     return mData[i * mCols + j];
   }
   //endregion
   //endregion

   /** Creates a rows x cols matrix in which every element is `value` (converted to T). */
   static Matrix fill(size_t rows, size_t cols, double value) {
     return Matrix(rows, cols, vector<T>(rows * cols, value));
   }

   /** Creates a size x size matrix with `value` on the main diagonal and zeros elsewhere. */
   static Matrix diagonal(size_t size, double value) {
     Matrix result = zeros(size, size);

     // element (k, k) lives at flat index k * size + k
     for (size_t k = 0; k < size; ++k)
       result.mData[k * size + k] = value;

     return result;
   }

   // True when the matrix has as many rows as columns.
   bool isSquare() const {
     return mCols == mRows;
   }

   /**
    * Extracts the main diagonal of a square matrix.
    *
    * @return column matrix (nRows() x 1) holding the diagonal elements
    * @throws runtime_error if the matrix is not square
    */
   Matrix diagonal() {
     if (!isSquare()) {
       throw runtime_error("Can't get the diagonal, not a square matrix");
     }

     Matrix result(mRows, 1);

     // "parallel for" shares the iterations among the threads; a bare
     // "parallel" made every thread execute the complete loop
     #pragma omp parallel for
     for (size_t i = 0; i < mRows; i++)
       result(i, 0) = operator()(i, i);

     return result;
   }

   // size x size matrix with ones on the main diagonal and zeros elsewhere.
   static Matrix identity(size_t size) {
     return diagonal(size, 1);
   }

   // rows x cols matrix filled with ones.
   static Matrix ones(size_t rows, size_t cols) {
     return fill(rows, cols, 1);
   }

   // rows x cols matrix filled with zeros.
   static Matrix zeros(size_t rows, size_t cols) {
     return fill(rows, cols, 0);
   }

   /**
    * Hadamard (entry-wise) product of two matrices with identical dimensions.
    *
    * @throws invalid_argument if the dimensions differ
    */
   Matrix hadamard(const Matrix &b) {
     const bool sameShape = (mCols == b.mCols && mRows == b.mRows);
     if (!sameShape)
       throw invalid_argument(
           "Cannot multiply these matrices element-wise: L = " + to_string(mRows) + "x" +
               to_string(mCols) + ", R = " + to_string(b.mRows) + "x" + to_string(b.mCols));

     Matrix product(mRows, mCols);

     // identical layouts: multiply the flat storages position by position
     #pragma omp parallel for
     for (size_t k = 0; k < mRows * mCols; k++)
       product.mData[k] = mData[k] * b.mData[k];

     return product;
   }

   /**
    * Returns a copy of the matrix with one row and one column removed.
    *
    * @param row    index of the row to drop
    * @param column index of the column to drop
    * @return matrix of size (nRows() - 1) x (nCols() - 1)
    * @throws invalid_argument if row or column is outside the matrix
    */
   Matrix submatrix(size_t row, size_t column) const {
     if (row >= mRows || column >= mCols)
       throw invalid_argument(
           "Cannot remove row " + to_string(row) + " and column " + to_string(column) +
               " from a " + to_string(mRows) + "x" + to_string(mCols) + " matrix");

     Matrix result(mRows - 1, mCols - 1);

     #pragma omp parallel for
     for (size_t i = 0; i < mRows; i++) {
       if (i == row) continue;

       // The destination row is derived from i alone. A counter shared
       // between iterations (as used before) is a data race under OpenMP.
       const size_t subi = i - (i > row ? 1 : 0);
       size_t subj = 0;
       for (size_t j = 0; j < mCols; j++) {
         if (j == column) continue;
         result(subi, subj) = operator()(i, j);
         subj++;
       }
     }

     return result;
   }

   /**
    * Minor of element (row, column): the determinant of the matrix that
    * remains after deleting that row and that column.
    *
    * @throws invalid_argument if the indices are outside the matrix
    */
   double getMinor(size_t row, size_t column) const {
     if (mRows == 2 and mCols == 2) {
       // Deleting one row and one column of a 2x2 matrix leaves the
       // diagonally opposite element. (The old code returned the
       // determinant of the whole matrix here.) An out-of-range index
       // wraps around and is rejected by operator().
       return operator()(1 - row, 1 - column);
     }

     return submatrix(row, column).determinant();
   }

   /**
    * Cofactor of element (row, column): its minor, negated when
    * row + column is odd.
    *
    * @throws invalid_argument if the indices are outside a 2x2 matrix
    */
   double cofactor(size_t row, size_t column) const {
     double minor;

     if (mRows == 2 and mCols == 2) {
       // 2x2 special case: the minor is the diagonally opposite element.
       // An out-of-range index wraps around and is rejected by operator(),
       // so `minor` can no longer be used uninitialized.
       minor = operator()(1 - row, 1 - column);
     } else {
       minor = this->getMinor(row, column);
     }

     return (row + column) % 2 == 0 ? minor : -minor;
   }

   /** Returns the matrix whose element (r, c) is the cofactor of element (r, c) of this matrix. */
   Matrix cofactorMatrix() const {
     Matrix cofactors(mRows, mCols);

     #pragma omp parallel for collapse(2)
     for (size_t r = 0; r < mRows; ++r) {
       for (size_t c = 0; c < mCols; ++c) {
         cofactors(r, c) = cofactor(r, c);
       }
     }

     return cofactors;
   }

   // Adjugate: the transpose of the cofactor matrix.
   Matrix adjugate() const {
     return cofactorMatrix().transpose();
   }

   /**
    * Inverse of the matrix, computed as adjugate / determinant.
    *
    * @throws runtime_error if the matrix is not square or its determinant is 0
    */
   Matrix inverse() const {
     if (!isSquare())
       throw runtime_error("Cannot invert a non-square matrix");

     double det = determinant();

     if (det == 0)
       throw runtime_error("Matrix is singular");

     // the adjugate is expensive, so compute it once and reuse it
     Matrix adj = adjugate();
     return adj / det;
   }

   /**
    * Determinant, computed by cofactor expansion along the first row.
    *
    * @throws runtime_error if the matrix is not square
    */
   double determinant() const {
     if (!isSquare()) {
       throw runtime_error("Cannot calculate the determinant of a non-square matrix");
     }

     const size_t n = mRows;

     // Base cases. Without them a 1x1 matrix expanded into
     // element * det(0x0) and evaluated to 0.
     if (n == 0)
       return 1; // empty product
     if (n == 1)
       return operator()(0, 0);
     if (n == 2)
       return ((operator()(0, 0) * operator()(1, 1)) -
           (operator()(1, 0) * operator()(0, 1)));

     double d = 0;
     #pragma omp parallel for reduction (+:d)
     for (size_t c = 0; c < n; c++) {
       // alternating sign of the expansion: + for even columns, - for odd ones
       const double sign = (c % 2 == 0) ? 1.0 : -1.0;
       d += sign * operator()(0, c) * submatrix(0, c).determinant();
     }
     return d;
   }

   /** Returns the transpose: an nCols() x nRows() matrix with rows and columns exchanged. */
   Matrix transpose() const {
     Matrix flipped(mCols, mRows);

     #pragma omp parallel for collapse(2)
     for (size_t r = 0; r < mRows; ++r) {
       for (size_t c = 0; c < mCols; ++c) {
         flipped(c, r) = operator()(r, c);
       }
     }

     return flipped;
   }

   // Appends `values` as the last column (insert position mCols).
   void addColumn(Matrix values) {
     addColumn(values, mCols);
   }

   // Appends `values` as the last row (insert position mRows).
   void addRow(Matrix values) {
     addRow(values, mRows);
   }

   /**
    * Inserts a column before column index `position`.
    *
    * If the matrix is empty it simply becomes a copy of `values`
    * (`position` is ignored in that case).
    *
    * @param values   column matrix (nRows() x 1) with the new elements
    * @param position index the new column will have, in [0, nCols()]
    * @throws invalid_argument if `values` has the wrong shape or `position`
    *         is past the end
    */
   void addColumn(Matrix values, size_t position) {
     if (!isEmpty() and values.nRows() != mRows)
       throw invalid_argument("Wrong number of values passed for new column");
     if (values.nCols() != 1)
       throw invalid_argument("Can't add multiple columns at once");

     if (isEmpty()) {
       mRows = values.mRows;
       mCols = values.mCols;
       mData = values.mData;
       return;
     }

     if (position > mCols)
       throw invalid_argument(
           "Invalid column position (" + to_string(position) + "): should be between 0 and " + to_string(mCols));

     const size_t newCols = mCols + 1;
     vector<T> newData(mRows * newCols);

     for (size_t i = 0; i < mRows; i++) {
       for (size_t j = 0; j < newCols; j++) {
         if (j == position)
           newData[i * newCols + j] = values(i, 0);
         else
           // columns after the insertion point come from one column to the left
           newData[i * newCols + j] = operator()(i, j - (j > position ? 1 : 0));
       }
     }

     // commit only after the new storage has been completely built
     mCols = newCols;
     mData.swap(newData);
   }

   /**
    * Inserts a row before row index `position`.
    *
    * If the matrix is empty it becomes a single row holding `values`
    * (`position` is ignored in that case).
    *
    * @param values   column matrix (nCols() x 1) with the elements of the new row
    * @param position index the new row will have, in [0, nRows()]
    * @throws invalid_argument if `values` has the wrong shape or `position`
    *         is past the end
    */
   void addRow(Matrix values, size_t position) {
     if (!isEmpty() and values.mRows != mCols)
       throw invalid_argument("Wrong number of values passed for new row");
     if (values.mCols != 1)
       throw invalid_argument("Can't add multiple rows at once");

     if (isEmpty()) {
       mRows = values.mCols;
       mCols = values.mRows;
       mData = values.mData;
       return;
     }

     // Without this check a position past the end inserted nothing and the
     // copy loop read one row beyond the old storage.
     if (position > mRows)
       throw invalid_argument(
           "Invalid row position (" + to_string(position) + "): should be between 0 and " + to_string(mRows));

     const size_t newRows = mRows + 1;
     vector<T> newData(newRows * mCols);

     for (size_t i = 0; i < newRows; i++) {
       for (size_t j = 0; j < mCols; j++) {
         if (i == position)
           newData[i * mCols + j] = values(j, 0);
         else
           // rows after the insertion point come from one row above
           newData[i * mCols + j] = operator()(i - (i > position ? 1 : 0), j);
       }
     }

     // commit only after the new storage has been completely built
     mRows = newRows;
     mData.swap(newData);
   }

   void removeColumn(int position) {
     // this is how you stop a reverse for loop with unsigned integers
     for (size_t i = mRows - 1; i != (size_t) -1; i--)
       mData.erase(mData.begin() + (i * mCols + position));

     mCols -= 1;
   }

   /**
    * Collects the distinct values stored in the matrix.
    *
    * @return column matrix with one row per distinct value, in the
    *         ascending order produced by std::set
    */
   Matrix unique() const {
     // the set drops duplicates and keeps the values ordered
     set<T> distinct(mData.begin(), mData.end());

     // back to contiguous storage for the Matrix constructor
     vector<T> ordered(distinct.begin(), distinct.end());

     return Matrix(ordered.size(), 1, ordered);
   }

   // Sorts the flat element storage in ascending order, in place.
   // The sort ignores row/column structure; the shape is left unchanged.
   void sort() {
     // just sort the inner vector
     std::sort(mData.begin(), mData.end());
   }

   /**
    * Returns a matrix with the shape of `m` whose elements are those of `m`
    * sorted in ascending order. The caller's matrix is untouched because
    * `m` is received by value.
    */
   static Matrix sort(Matrix m) {
     std::sort(m.mData.begin(), m.mData.end());
     return Matrix(m.mRows, m.mCols, m.mData);
   }

   /**
    * Counts how often each distinct value occurs.
    *
    * @return two-column matrix: column 0 holds the distinct values in
    *         ascending order, column 1 the number of occurrences of each
    */
   Matrix count() {
     Matrix tally = unique();
     tally.sort();

     // second column starts at zero and receives the counters
     tally.addColumn(zeros(tally.mRows, 1), 1);

     for (size_t k = 0; k < mRows * mCols; ++k) {
       // find the row of the tally that matches this element
       for (size_t g = 0; g < tally.mRows; ++g) {
         if (mData[k] == tally(g, 0)) {
           tally(g, 1)++;
           break;
         }
       }
     }

     return tally;
   }

   /**
    * Per-group column means.
    *
    * @param groups matrix whose first column holds the group label of each row
    * @return matrix with one row per distinct label (in the order produced
    *         by groups.count()) and one column per column of this matrix
    * @throws invalid_argument if `groups` has a different number of rows
    */
   Matrix mean(Matrix groups) {
     if (groups.mRows != mRows)
       throw invalid_argument("Not enough groups for every element in the matrix");

     Matrix tally = groups.count();
     Matrix averages = zeros(tally.mRows, mCols);

     // accumulate every row into the row of its group
     for (size_t row = 0; row < mRows; ++row) {
       size_t g = 0;
       while (g < tally.mRows and !(groups(row, 0) == tally(g, 0)))
         ++g;
       if (g == tally.mRows)
         continue;

       for (size_t col = 0; col < mCols; ++col)
         averages(g, col) += operator()(row, col);
     }

     // turn the sums into means using the occurrence counts
     for (size_t g = 0; g < averages.mRows; ++g)
       for (size_t col = 0; col < averages.mCols; ++col)
         averages(g, col) /= tally(g, 1);

     return averages;
   }

   /**
    * Column means.
    *
    * @return column matrix (nCols() x 1) whose k-th element is the mean of column k
    */
   Matrix mean() {
     Matrix averages = zeros(mCols, 1);

     for (size_t row = 0; row < mRows; ++row)
       for (size_t col = 0; col < mCols; ++col)
         averages(col, 0) += operator()(row, col);

     averages /= mRows;

     return averages;
   }

   /**
    * Scatter matrix: the sum over all rows of d * d^T, where d is the row
    * (as a column vector) minus the vector of column means.
    *
    * @return nCols() x nCols() matrix
    */
   Matrix scatter() {
     Matrix centre = mean();
     Matrix accumulated(mCols, mCols);

     for (size_t obs = 0; obs < mRows; ++obs) {
       Matrix deviation = getRow(obs) - centre;
       accumulated += deviation * deviation.transpose();
     }

     return accumulated;
   }

   // Covariance matrix: the scatter matrix divided by (number of rows - 1).
   // NOTE(review): mRows is unsigned, so a matrix with 0 rows makes mRows - 1 wrap around.
   Matrix cov() {
     return scatter() / (mRows - 1);
   }

   /**
    * Variance of each column, using the (nRows() - 1) denominator.
    *
    * @return column matrix (nCols() x 1)
    */
   Matrix var() {
     Matrix centre = mean();
     Matrix variances = zeros(mCols, 1);

     for (size_t col = 0; col < mCols; ++col) {
       // sum of squared deviations from the column mean
       for (size_t row = 0; row < mRows; ++row)
         variances(col, 0) += pow((operator()(row, col) - centre(col, 0)), 2);

       variances(col, 0) /= (mRows - 1);
     }

     return variances;
   }

   /**
    * Standard deviation of each column: the square root of var().
    *
    * @return column matrix (nCols() x 1)
    */
   Matrix stdev() {
     Matrix deviations = var();

     #pragma omp parallel for
     for (size_t col = 0; col < mCols; ++col) {
       const T variance = deviations(col, 0);
       deviations(col, 0) = sqrt(variance);
     }

     return deviations;
   }

   /**
    * Changes the shape of the matrix without touching the element storage.
    *
    * @throws invalid_argument if rows * cols differs from the number of stored elements
    */
   void reshape(size_t rows, size_t cols) {
     if (mData.size() != rows * cols)
       throw invalid_argument(
           "Invalid shape (" + to_string(rows) + "x" +
               to_string(cols) + " = " + to_string(rows * cols) +
               // the space after "with" was missing, gluing the word to the number
               ") for a matrix with " + to_string(mData.size()) + " elements");

     mRows = rows;
     mCols = cols;
   }

   /**
    * Copies one column of the matrix.
    *
    * @return column matrix (nRows() x 1)
    * @throws invalid_argument if `index` is not an existing column
    */
   Matrix getColumn(size_t index) {
     if (!(index < mCols))
       throw invalid_argument("Column index out of bounds");

     Matrix column(mRows, 1);
     #pragma omp parallel for
     for (size_t row = 0; row < mRows; ++row)
       column.mData[row] = mData[row * mCols + index];

     return column;
   }

   /**
    * Copies one row of the matrix.
    *
    * Note that the row is returned as a COLUMN matrix (nCols() x 1).
    *
    * @throws invalid_argument if `index` is not an existing row
    */
   Matrix getRow(size_t index) {
     if (!(index < mRows))
       throw invalid_argument("Row index out of bounds");

     Matrix row(mCols, 1);
     #pragma omp parallel for
     for (size_t col = 0; col < mCols; ++col)
       row.mData[col] = mData[index * mCols + col];

     return row;
   }

   /**
    * Writes the matrix as a table: one line per row, every element
    * left-aligned in a 13-character cell padded with spaces.
    */
   friend ostream &operator<<(ostream &os, const Matrix &matrix) {
     const int cellWidth = 13;
     const char padding = ' ';

     for (size_t r = 0; r < matrix.mRows; ++r) {
       // table-like layout taken from https://stackoverflow.com/a/14796892
       for (size_t c = 0; c < matrix.mCols; ++c)
         os << left << setw(cellWidth) << setfill(padding) << to_string(matrix(r, c));
       os << endl;
     }

     return os;
   }

   /**
    * Builds a matrix from the numeric content of a CSV file.
    *
    * The number of columns is taken from the first parsed row.
    *
    * @param path file handed to CSVReader::csvToNumericVecVec
    *             (NOTE(review): the meaning of its second argument, `true`,
    *             is defined by CSVReader; confirm there)
    * @return the parsed matrix, or an empty matrix if nothing was parsed
    * @throws runtime_error if a row has fewer values than the first one
    */
   static Matrix fromCSV(const string &path) {
     vector<vector<double>> outer = CSVReader::csvToNumericVecVec(path, true);

     // nothing parsed: avoid indexing outer[0] on an empty vector
     if (outer.empty())
       return Matrix();

     Matrix result(outer.size(), outer[0].size());

     for (size_t i = 0; i < result.mRows; i++) {
       // a short row would otherwise be read past its end
       if (outer[i].size() < result.mCols)
         throw runtime_error("CSV row " + to_string(i) + " has fewer values than the first row");

       for (size_t j = 0; j < result.mCols; j++)
         result(i, j) = outer[i][j];
     }

     return result;
   }

   /**
    * Turns a vector (single row or single column) into a square matrix
    * with the vector's elements on the main diagonal and zeros elsewhere.
    *
    * @throws runtime_error if the matrix has more than one row and more than one column
    */
   Matrix asDiagonal() {
     if (mRows != 1 and mCols != 1)
       throw runtime_error("Can't diagonalize, not a vector");

     // more than one column means the elements run along row 0
     const bool alongRow = mCols > 1;
     const size_t dimension = alongRow ? mCols : mRows;

     Matrix result = zeros(dimension, dimension);

     #pragma omp parallel for
     for (size_t k = 0; k < dimension; ++k) {
       result(k, k) = alongRow ? operator()(0, k) : operator()(k, 0);
     }
     return result;
   }

   /** Returns an independent copy of this matrix (same shape, same elements). */
   Matrix copy() {
     Matrix duplicate(*this);
     return duplicate;
   }

   // Standardizes every column using the matrix's own column means and
   // standard deviations (see standardize(Matrix, Matrix)).
   Matrix standardize() {
     return standardize(mean(), stdev());
   }

   /**
    * Standardizes every column: (element - mean of its column) / std. dev. of its column.
    *
    * @param means column matrix (nCols() x 1) with the mean of each column
    * @param stds  column matrix (nCols() x 1) with the std. dev. of each column
    * @return new matrix of the same shape
    * @throws invalid_argument if either argument has the wrong shape
    */
   Matrix standardize(Matrix means, Matrix stds) {
     // shape checks, in the same order as the error messages below
     if (!means.isColumn())
       throw invalid_argument("Argument \"mean\" must have exactly one column");
     if (!stds.isColumn())
       throw invalid_argument("Argument \"stds\" must have exactly one column");
     if (mCols != means.mRows)
       throw invalid_argument("Number of mean values is different than number of features");
     if (mCols != stds.mRows)
       throw invalid_argument("Number of std. dev. values is different than number of features");

     Matrix scaled(mRows, mCols);

     #pragma omp parallel for collapse(2)
     for (size_t r = 0; r < mRows; ++r) {
       for (size_t c = 0; c < mCols; ++c) {
         scaled(r, c) = (operator()(r, c) - means(c, 0)) / stds(c, 0);
       }
     }

     return scaled;
   }

   /** Returns a copy of the matrix in which the mean of each column has been subtracted from that column. */
   Matrix minusMean() {
     Matrix centred(mRows, mCols);
     Matrix columnMeans = mean();

     #pragma omp parallel for collapse(2)
     for (size_t r = 0; r < mRows; ++r) {
       for (size_t c = 0; c < mCols; ++c) {
         centred(r, c) = operator()(r, c) - columnMeans(c, 0);
       }
     }

     return centred;
   }

   // True when at least one element of the matrix equals `value`.
   bool contains(T value) {
     return std::find(mData.begin(), mData.end(), value) != mData.end();
   }

   bool isEmpty() {
     return mCols == 0 and mRows == 0;
   }

   /**
    * Keeps the rows (or columns) selected by a binary mask.
    *
    * @param bin     single-column integer matrix with one entry per row
    *                (or per column when `columns` is true); non-zero keeps
    *                the corresponding row/column
    * @param columns when true the mask selects columns instead of rows
    * @return matrix built only from the selected rows/columns (empty if none)
    * @throws invalid_argument if the mask has the wrong shape
    */
   Matrix filter(const Matrix<int> bin, bool columns = false) {
     const size_t expected = columns ? mCols : mRows;

     if (bin.nCols() != 1)
       throw invalid_argument("Binary filter must have only one column");
     if (bin.nRows() != expected)
       throw invalid_argument("Binary filter has the wrong number of row entries");

     Matrix selected;

     for (size_t k = 0; k < bin.nRows(); ++k) {
       if (!bin(k, 0))
         continue;

       if (columns)
         selected.addColumn(getColumn(k));
       else
         selected.addRow(getRow(k));
     }

     return selected;
   }

   // Selects the rows whose entry in the binary mask `bin` is non-zero.
   Matrix getRows(const Matrix<int> bin) {
     return filter(bin);
   }

   // Selects the columns whose entry in the binary mask `bin` is non-zero.
   Matrix getColumns(const Matrix<int> bin) {
     return filter(bin, true);
   }

   // True when the matrix compares equal (exact element equality) to its transpose.
   bool isSymmetric() {
     return *this == transpose();
   }

   /**
    * Normalizes the column vectors: every column is divided by its
    * Euclidean length.
    *
    * @return new matrix of the same shape
    */
   Matrix normalize() {
     Matrix result(mRows, mCols, mData);

     for (size_t col = 0; col < mCols; ++col) {
       // length of the column: square root of the sum of squares
       T norm = 0;
       #pragma omp parallel for reduction(+:norm)
       for (size_t row = 0; row < mRows; ++row) {
         norm += pow(result(row, col), 2);
       }
       norm = sqrt(norm);

       // scale the column by that length
       for (size_t row = 0; row < mRows; ++row) {
         result(row, col) /= norm;
       }
     }

     return result;
   }

   // Eigen-decomposition: dispatches to eigenSymmetric() when the matrix is
   // symmetric and to eigenNonSymmetric() otherwise.
   // Returns the pair (eigenvalues, eigenvectors) produced by the chosen routine.
   pair<Matrix, Matrix> eigen() {
     return isSymmetric() ? eigenSymmetric() : eigenNonSymmetric();
   };

   // Eigenvalues and eigenvectors via the Jacobi eigenvalue algorithm.
   //
   // Works on a copy of the matrix, repeatedly applying a rotation built
   // around the off-diagonal element with the largest absolute value. It
   // stops when that element is below 2 * machine epsilon or after 1000
   // rotations.
   //
   // Returns eigsort(diagonal of the rotated matrix, accumulated rotations):
   // eigenvalues as a column matrix and the matching eigenvectors as
   // columns, ordered by eigsort.
   pair<Matrix, Matrix> eigenSymmetric() {
     // Jacobi eigenvalue algorithm as explained
     // by profs Marina Andretta and Franklina Toledo

     // copy the current matrix
     Matrix A = copy();
     // initialize the eigenvector matrix
     Matrix V = identity(A.mCols);

     // get the tolerance
     double eps = numeric_limits<double>::epsilon();
     unsigned iterations = 0;

     // initiate the loop for numerical approximation of the eigenvalues
     while (true) {
       // find the element in the matrix with the largest absolute value;
       // p and q stay unset when no off-diagonal element exceeds 0, but in
       // that case the function returns below before they are read
       size_t p, q;
       T largest = 0;
       for (size_t i = 0; i < A.mRows; i++) {
         for (size_t j = 0; j < A.mCols; j++) {
           // it can't be in the diagonal
           if (i != j and abs(A(i, j)) > largest) {
             largest = abs(A(i, j));
             p = i;
             q = j;
           }
         }
       }

       // if the largest non-diagonal element of A is zero +/- eps,
       // it means A is almost diagonalized and the eigenvalues are
       // in the diagonal of A
       if (largest < 2 * eps or iterations >= 1000) {
         //eigenvalues are returned in a column matrix for convenience
         return eigsort(A.diagonal(), V);
       }

       iterations++;

       // else, perform a Jacobi rotation using this angle phi as reference
       double phi = (A(q, q) - A(p, p)) / (2 * A(p, q));
       double sign = (phi > 0) - (phi < 0);
       double t = phi == 0 ? 1 : 1 / (phi + sign * sqrt(pow(phi, 2) + 1));
       // note: these locals hide the cos/sin functions inside this loop body
       double cos = 1 / (sqrt(1 + pow(t, 2)));
       double sin = t / (sqrt(1 + pow(t, 2)));

       // the matrix that will apply the rotation is basically an identity matrix...
       Matrix U = identity(A.mRows);

       // ... with the exception of these values
       U(p, p) = U(q, q) = cos;
       U(p, q) = sin;
       U(q, p) = -sin;

       // apply the rotation
       A = U.transpose() * A * U;
       // update the corresponding eigenvectors
       V = V * U;
     }
   }

   // Eigen-decomposition delegated to the Unsymmeig class from the NR3 headers.
   //
   // The matrix is copied into a MatDoub, handed to Unsymmeig, and the
   // results are copied back:
   //  - eigenvalues: a ROW matrix (1 x N) holding only the real part of
   //    each entry of `wri` (imaginary parts are dropped);
   //  - eigenvectors: a copy of `zz`.
   // Unlike eigenSymmetric(), the result is not passed through eigsort.
   //
   // NOTE(review): `hes` and the literal `true` are forwarded unchanged to
   // the Unsymmeig constructor; their meaning is defined by NR3 - confirm there.
   pair<Matrix, Matrix> eigenNonSymmetric(bool hes = true) {

     MatDoub unholyConvertion(static_cast<int>(mRows), static_cast<int>(mCols));

     #pragma omp parallel for collapse(2)
     for (size_t i = 0; i < mRows; i++) {
       for (size_t j = 0; j < mCols; j++) {
         unholyConvertion[i][j] = operator()(i, j);
       }
     }

     Unsymmeig nr3Miracle(unholyConvertion, true, hes);

     Matrix eigenvalues(1, static_cast<size_t>(nr3Miracle.wri.size()));

     // keep only the real part of every eigenvalue
     for (size_t i = 0; i < nr3Miracle.wri.size(); i++) {
       eigenvalues(0, i) = nr3Miracle.wri[i].real();
     }

     Matrix eigenvectors(static_cast<size_t>(nr3Miracle.zz.nrows()),
                         static_cast<size_t>(nr3Miracle.zz.ncols()));

     for (size_t i = 0; i < nr3Miracle.zz.nrows(); i++)
       for (size_t j = 0; j < nr3Miracle.zz.ncols(); j++)
         eigenvectors(i, j) = nr3Miracle.zz[i][j];

     return make_pair(eigenvalues, eigenvectors);
   }

   /**
    * Within-class scatter: the sum of the scatter matrices of the rows
    * belonging to each class.
    *
    * @param y matrix holding the class label of each row of this matrix
    * @return nCols() x nCols() matrix
    */
   Matrix WithinClassScatter(Matrix y) {
     Matrix Sw = zeros(mCols, mCols);
     Matrix uniqueClasses = y.unique();

     for (size_t i = 0; i < uniqueClasses.nRows(); i++) {
       // Select by the actual label value. Comparing against the loop index
       // only worked when the labels happened to be exactly 0, 1, 2, ...
       const T label = uniqueClasses(i, 0);
       Matrix classElements = getRows(y == label); // get class elements

       Matrix scatterMatrix = classElements.scatter();
       Sw += scatterMatrix;
     }

     return Sw;
   }

   /**
    * Between-class scatter: for every class, (number of rows in the class)
    * * d * d^T, where d is the class mean minus the overall mean, summed
    * over all classes.
    *
    * @param y matrix holding the class label of each row of this matrix
    * @return nCols() x nCols() matrix
    */
   Matrix BetweenClassScatter(Matrix y) {
     Matrix innerMean = mean(y); // means for each class
     Matrix grandMean = mean(); // mean of the entire data set
     Matrix Sb = zeros(mCols, mCols);
     Matrix uniqueClasses = y.unique();

     for (size_t i = 0; i < uniqueClasses.nRows(); i++) {
       // Select by the actual label value. Comparing against the loop index
       // only worked when the labels happened to be exactly 0, 1, 2, ...
       // Row i of innerMean belongs to the same label, since both come
       // from the sorted unique labels.
       const T label = uniqueClasses(i, 0);
       Matrix classElements = getRows(y == label); // get class elements
       Matrix meanDiff = innerMean.getRow(i) - grandMean;
       Sb += classElements.nRows() * meanDiff * meanDiff.transpose();
     }

     return Sb;
   }

   /** Returns the sum of all elements of the matrix (0 for an empty matrix). */
   T sum() const {
     T total = 0;
     for (auto it = mData.begin(); it != mData.end(); ++it)
       total += *it;

     return total;
   }

   // True when the matrix has exactly one column.
   bool isColumn() const {
     return mCols == 1;
   }

   // True when the matrix has exactly one row.
   bool isRow() const {
     return mRows == 1;
   }

   // Smallest element of the matrix.
   // NOTE(review): there is no guard for an empty matrix; min_element then
   // returns the end iterator, which is dereferenced here.
   T min() const {
     return *std::min_element(std::begin(mData), std::end(mData));
   }

   // Largest element of the matrix.
   // NOTE(review): same missing guard for an empty matrix as in min().
   T max() const {
     return *std::max_element(std::begin(mData), std::end(mData));
   }

   /**
    * Applies `f` to every element.
    *
    * @return new matrix of the same shape holding f(element) at each position
    */
   Matrix<T> apply(function<T(T)> f) {
     Matrix<T> mapped(mRows, mCols, vector<T>(mRows * mCols, 0));

     for (size_t k = 0; k < mData.size(); ++k)
       mapped.mData[k] = f(mData[k]);

     return mapped;
   }

   /**
    * One-hot encoding: each row of the result is the row of an identity
    * matrix that corresponds to the matching distinct value.
    *
    * @return matrix with nRows() rows and one column per distinct value
    */
   Matrix oneHot() {
     Matrix categories = unique();
     Matrix codes = identity(categories.mRows);
     Matrix encoded(mRows, codes.mCols);

     for (size_t row = 0; row < mRows; ++row) {
       for (size_t k = 0; k < categories.mRows; ++k) {
         // skip categories that do not match this row
         if (!(getRow(row) == categories.getRow(k)))
           continue;

         encoded.setRow(row, codes.getRow(k).transpose());
       }
     }

     return encoded;
   }

   /**
    * Overwrites one row of the matrix.
    *
    * @param index row to overwrite, in [0, nRows())
    * @param row   row matrix (1 x nCols()) with the new elements
    * @throws invalid_argument if `index` is not an existing row or `row`
    *         has the wrong shape
    */
   void setRow(size_t index, Matrix<T> row) {
     // ">=": index == mRows is already one past the last row
     if (index >= mRows)
       throw invalid_argument("Invalid row index, matrix is not that large");
     if (mCols != row.mCols)
       throw invalid_argument("Incompatible number of columns");
     if (row.mRows > 1)
       throw invalid_argument("Row matrix contains more than one row");

     for (size_t col = 0; col < mCols; col++)
       operator()(index, col) = row(0, col);
   }

   /**
    * Overwrites one column of the matrix.
    *
    * @param index  column to overwrite, in [0, nCols())
    * @param column column matrix (nRows() x 1) with the new elements
    * @throws invalid_argument if `index` is not an existing column or
    *         `column` has the wrong shape
    */
   void setColumn(size_t index, Matrix<T> column) {
     // ">=": index == mCols is already one past the last column
     if (index >= mCols)
       throw invalid_argument("Invalid column index, matrix is not that large");
     if (mRows != column.mRows)
       throw invalid_argument("Incompatible number of rows");
     if (column.mCols > 1)
       throw invalid_argument("Column matrix contains more than one column");

     // iterate over the ROWS of the column (the old bound was mCols)
     for (size_t row = 0; row < mRows; row++)
       operator()(row, index) = column(row, 0);
   }

   /**
    * Tells whether the matrix holds at most two distinct values, at least
    * one of which is 0 or 1.
    *
    * The parentheses matter: without them the expression parsed as
    * (size check && contains(1)) || contains(0), so any matrix containing
    * a 0 was reported as binary regardless of its other values.
    */
   bool isBinary() const {
     Matrix<T> uniqueBin = unique();
     return uniqueBin.mRows <= 2 && (uniqueBin.contains(1) or uniqueBin.contains(0));
   }
 };

 typedef Matrix<double> MatrixD;
 typedef Matrix<int> MatrixI;

 #endif //MACHINE_LEARNING_MATRIX_HPP
Matrix::isBinary
bool isBinary() const
Definition: Matrix.hpp:1370

Matrix::nRows
size_t nRows() const
Definition: Matrix.hpp:89

Matrix::hadamard
Matrix hadamard(const Matrix &b)
Executes the Hadamard, or entrywise multiplication between two matrices.
Definition: Matrix.hpp:534

Matrix::diagonal
Matrix diagonal()
Definition: Matrix.hpp:494

Matrix::Axis
Axis
Definition: Matrix.hpp:85

Matrix::diagonal
static Matrix diagonal(size_t size, double value)
Creates a square matrix with a fixed value on the diagonal.
Definition: Matrix.hpp:481

Matrix::isEmpty
bool isEmpty()
Checks if the matrix is empty or uninitialized.
Definition: Matrix.hpp:1089

Matrix::isColumn
bool isColumn() const
Definition: Matrix.hpp:1308

Matrix::getRows
Matrix getRows(const Matrix< int > bin)
Selects a subset of rows of the matrix.
Definition: Matrix.hpp:1123

Matrix::inverse
Matrix inverse() const
Calculates the inverse of the current matrix.
Definition: Matrix.hpp:641

Matrix::Matrix
Matrix(size_t rows, size_t cols, const vector< T > &data)
Initializes a matrix with a predetermined number of rows and columns and populates it with data...
Definition: Matrix.hpp:117

Matrix::normalize
Matrix normalize()
Normalizes the column vectors of the matrix.
Definition: Matrix.hpp:1143

Matrix::validateIndexes
void validateIndexes(size_t row, size_t col) const
Validates if indices are contained inside the matrix.
Definition: Matrix.hpp:40

Matrix::eigenSymmetric
pair< Matrix, Matrix > eigenSymmetric()
Calculates the eigenvalues and eigenvectors of a symmetric matrix using the Jacobi eigenvalue algorit...
Definition: Matrix.hpp:1175

Matrix::var
Matrix var()
Calculates the variance of the columns of the matrix.
Definition: Matrix.hpp:903

Matrix::mCols
size_t mCols
Definition: Matrix.hpp:33

Matrix::nCols
size_t nCols() const
Definition: Matrix.hpp:87

Matrix::fromCSV
static Matrix fromCSV(const string &path)
Loads CSV data into a matrix.
Definition: Matrix.hpp:996

Matrix::addRow
void addRow(Matrix values, size_t position)
Adds a row to the matrix at the given position.
Definition: Matrix.hpp:740

Matrix::addColumn
void addColumn(Matrix values, size_t position)
Adds a column to the matrix at the given position.
Definition: Matrix.hpp:706

Matrix::sum
T sum() const
Definition: Matrix.hpp:1300

Matrix::operator()
T & operator()(size_t i, size_t j)
Functor used to access elements in the matrix.
Definition: Matrix.hpp:451

Matrix::operator!=
bool operator!=(const Matrix &other)
Definition: Matrix.hpp:423

Matrix::operator*=
Matrix operator*=(double value)
Definition: Matrix.hpp:253

Matrix::operator-=
Matrix operator-=(double value)
Definition: Matrix.hpp:246

Matrix::contains
bool contains(T value)
Checks if the matrix contains a value.
Definition: Matrix.hpp:1083

Matrix::eigenNonSymmetric
pair< Matrix, Matrix > eigenNonSymmetric(bool hes=true)
Calculates the eigenvalues and eigenvectors of a non-symmetric matrix.
Definition: Matrix.hpp:1242

std
Matrix implementation, with a series of linear algebra functions.

Matrix::setColumn
void setColumn(size_t index, Matrix< T > column)
Definition: Matrix.hpp:1358

Matrix::mean
Matrix mean(Matrix groups)
Calculates means of a matrix, grouped by classes.
Definition: Matrix.hpp:840

Matrix::sort
static Matrix sort(Matrix m)
Sorts the elements of a matrix.
Definition: Matrix.hpp:807

Matrix::isRow
bool isRow() const
Definition: Matrix.hpp:1312

Matrix::setRow
void setRow(size_t index, Matrix< T > row)
Definition: Matrix.hpp:1346

Matrix::identity
static Matrix identity(size_t size)
Returns the identity matrix.
Definition: Matrix.hpp:511

Matrix::stdev
Matrix stdev()
Calculates the standard deviation of the columns of the matrix.
Definition: Matrix.hpp:919

Matrix::operator-
friend Matrix operator-(double value, const Matrix &m)
Scalar subtraction.
Definition: Matrix.hpp:175

Matrix::mRows
size_t mRows
Definition: Matrix.hpp:32

Matrix::copy
Matrix copy()
Returns a copy of the matrix.
Definition: Matrix.hpp:1027

Matrix::unique
Matrix unique() const
Returns only unique values from the matrix.
Definition: Matrix.hpp:782

Matrix::operator*
friend Matrix operator*(double value, const Matrix &m)
Scalar multiplication.
Definition: Matrix.hpp:200

Matrix::cofactorMatrix
Matrix cofactorMatrix() const
Calculates the cofactor matrix.
Definition: Matrix.hpp:620

Matrix::operator*=
Matrix & operator*=(const Matrix &other)
Definition: Matrix.hpp:365

Matrix::minusMean
Matrix minusMean()
Definition: Matrix.hpp:1067

Matrix::isSquare
bool isSquare() const
Definition: Matrix.hpp:489

Matrix::operator-
friend Matrix operator-(const Matrix &m, double value)
Scalar subtraction.
Definition: Matrix.hpp:167

Matrix::WithinClassScatter
Matrix WithinClassScatter(Matrix y)
Definition: Matrix.hpp:1271

Matrix::max
T max() const
Definition: Matrix.hpp:1320

Matrix::removeColumn
void removeColumn(int position)
Removes a column from the matrix.
Definition: Matrix.hpp:772

Matrix::operator/=
Matrix operator/=(double value)
Definition: Matrix.hpp:260

Matrix::operator+
Matrix operator+(const Matrix &b)
Matrix addition operation.
Definition: Matrix.hpp:273

Matrix::addColumn
void addColumn(Matrix values)
Adds a column at the end of the matrix.
Definition: Matrix.hpp:692

Matrix::mData
std::vector< T > mData
Definition: Matrix.hpp:34

Matrix::operator+=
Matrix operator+=(double value)
Definition: Matrix.hpp:239

Matrix::operator!=
Matrix operator!=(const double &value)
Definition: Matrix.hpp:417

Matrix::getColumn
Matrix getColumn(size_t index)
Gets a column from the matrix.
Definition: Matrix.hpp:946

Matrix::ones
static Matrix ones(size_t rows, size_t cols)
Returns a matrix filled with ones.
Definition: Matrix.hpp:519

Matrix::operator+
friend Matrix operator+(const Matrix &m, double value)
Scalar addition.
Definition: Matrix.hpp:142

Matrix::operator-
Matrix operator-()
Matrix negative operation.
Definition: Matrix.hpp:432

Matrix::isSymmetric
bool isSymmetric()
Checks if the matrix is symmetric.
Definition: Matrix.hpp:1136

Matrix::count
Matrix count()
Counts occurrences of elements in a matrix.
Definition: Matrix.hpp:818

Matrix::standardize
Matrix standardize(Matrix means, Matrix stds)
Standardizes the columns of the matrix, subtracting each element of a column by the mean argument and...
Definition: Matrix.hpp:1045

Matrix::BetweenClassScatter
Matrix BetweenClassScatter(Matrix y)
Definition: Matrix.hpp:1285

Matrix::min
T min() const
Definition: Matrix.hpp:1316

Matrix
Matrix implementation, with a series of linear algebra functions.
Definition: Matrix.hpp:30

Matrix::operator-=
Matrix & operator-=(const Matrix &other)
Definition: Matrix.hpp:349

Matrix::apply
Matrix< T > apply(function< T(T)> f)
Definition: Matrix.hpp:1324

MatrixD
Matrix< double > MatrixD
Definition: Matrix.hpp:1376

Matrix::operator/
friend Matrix operator/(const Matrix &m, double value)
Scalar division.
Definition: Matrix.hpp:208

Matrix::cov
Matrix cov()
Calculates the covariance matrix of the current matrix.
Definition: Matrix.hpp:897

Matrix::asDiagonal
Matrix asDiagonal()
Creates a diagonal matrix from a row or column vector.
Definition: Matrix.hpp:1010

Matrix::mean
Matrix mean()
Calculates the mean of the columns of the matrix.
Definition: Matrix.hpp:867

Matrix::standardize
Matrix standardize()
Standardizes the columns of the matrix, subtracting each element of a column by the column mean and d...
Definition: Matrix.hpp:1036

MatrixI
Matrix< int > MatrixI
Definition: Matrix.hpp:1377

Matrix::determinant
double determinant() const
Calculates the determinant of the matrix.
Definition: Matrix.hpp:656

Matrix::sort
void sort()
Sorts elements of the matrix inplace.
Definition: Matrix.hpp:799

Matrix::Matrix
Matrix(size_t rows, size_t cols, T(&data)[N])
Definition: Matrix.hpp:126

Matrix::Matrix
Matrix(size_t dimension)
Initializes a square matrix.
Definition: Matrix.hpp:100

Matrix::Matrix
Matrix(size_t rows, size_t cols)
Initializes a matrix with a predetermined number of rows and columns.
Definition: Matrix.hpp:107

Matrix::adjugate
Matrix adjugate() const
Returns the adjugate of the current matrix, which is the transpose of its cofactor matrix...
Definition: Matrix.hpp:634

Matrix::operator/
friend Matrix operator/(double value, const Matrix &m)
Scalar division.
Definition: Matrix.hpp:225

Matrix::operator==
bool operator==(const Matrix &other)
Definition: Matrix.hpp:406

Matrix::reshape
void reshape(size_t rows, size_t cols)
Reshapes the current matrix.
Definition: Matrix.hpp:932

Matrix::operator*
Matrix operator*(const Matrix &b) const
Matrix multiplication operation.
Definition: Matrix.hpp:314

Matrix::ROWS
Definition: Matrix.hpp:85

Matrix::fill
static Matrix fill(size_t rows, size_t cols, double value)
Returns a matrix filled with a single value.
Definition: Matrix.hpp:472

Matrix::filter
Matrix filter(const Matrix< int > bin, bool columns=false)
Selects a subset of either columns or rows of the matrix.
Definition: Matrix.hpp:1098

Matrix::eigen
pair< Matrix, Matrix > eigen()
Calculates the eigenvalues and eigenvectors of a matrix.
Definition: Matrix.hpp:1168

Matrix::submatrix
Matrix submatrix(size_t row, size_t column) const
Returns a submatrix of the current matrix, removing one row and column of the original matrix...
Definition: Matrix.hpp:556

Matrix::operator==
Matrix< int > operator==(const T &value)
Definition: Matrix.hpp:393

Matrix::operator<<
friend ostream & operator<<(ostream &os, const Matrix &matrix)
Prints a matrix.
Definition: Matrix.hpp:977

Matrix::getRow
Matrix getRow(size_t index)
Gets a row from the matrix.
Definition: Matrix.hpp:961

Matrix::getMinor
double getMinor(size_t row, size_t column) const
Returns the minor of a matrix, which is the determinant of a submatrix where a single row and column ...
Definition: Matrix.hpp:581

Matrix::operator+=
Matrix & operator+=(const Matrix &other)
Definition: Matrix.hpp:335

Matrix::Matrix
Matrix()
Initializes an empty matrix.
Definition: Matrix.hpp:94

Matrix::eigsort
static pair< Matrix, Matrix > eigsort(Matrix eigenvalues, Matrix eigenvectors)
Sorts eigenvalues by magnitude, sorting their corresponding eigenvectors in the same order...
Definition: Matrix.hpp:54

Matrix::getColumns
Matrix getColumns(const Matrix< int > bin)
Selects a subset of columns of the matrix.
Definition: Matrix.hpp:1130

Matrix::addRow
void addRow(Matrix values)
Adds a row at the end of the matrix.
Definition: Matrix.hpp:698

Matrix::cofactor
double cofactor(size_t row, size_t column) const
Calculates the cofactor of a matrix at a given point.
Definition: Matrix.hpp:600

Matrix::operator-
Matrix operator-(const Matrix &b)
Matrix subtraction operation.
Definition: Matrix.hpp:293

Matrix::zeros
static Matrix zeros(size_t rows, size_t cols)
Returns a matrix filled with zeros.
Definition: Matrix.hpp:527

Matrix::operator+
friend Matrix operator+(double value, const Matrix &m)
Scalar addition.
Definition: Matrix.hpp:159

Matrix::transpose
Matrix transpose() const
Returns the transpose of a matrix.
Definition: Matrix.hpp:677

Matrix::oneHot
Matrix oneHot()
Definition: Matrix.hpp:1330

Matrix::operator*
friend Matrix operator*(const Matrix &m, double value)
Scalar multiplication.
Definition: Matrix.hpp:183

Matrix::operator()
T operator()(size_t i, size_t j) const
Functor used to access elements in the matrix.
Definition: Matrix.hpp:460

Matrix::scatter
Matrix scatter()
Calculates the scatter matrix.
Definition: Matrix.hpp:883