2023-01-23 21:13:26 +01:00
//
// LinReg.cpp
//
// Created by Marc Melikyan on 10/2/20.
//
2023-01-24 18:12:23 +01:00
# include "lin_reg.h"
2023-01-24 19:00:54 +01:00
# include "../cost/cost.h"
2023-01-24 18:12:23 +01:00
# include "../lin_alg/lin_alg.h"
# include "../regularization/reg.h"
2023-01-24 19:00:54 +01:00
# include "../stat/stat.h"
2023-01-24 18:12:23 +01:00
# include "../utilities/utilities.h"
2023-01-23 21:13:26 +01:00
# include <cmath>
2023-01-24 19:00:54 +01:00
# include <iostream>
2023-01-23 21:13:26 +01:00
# include <random>
2023-01-24 19:20:18 +01:00
2023-01-24 19:00:54 +01:00
2023-01-25 00:54:50 +01:00
/// Builds a linear-regression model over a training set.
///
/// Stores copies of the training data and regularization settings, sizes the
/// prediction buffer to one entry per input row, and asks MLPPUtilities for
/// the initial weights (one per input column) and bias.
///
/// @param inputSet  Training inputs; the row count becomes `n`, the length of the first row becomes `k`.
/// @param outputSet Training targets stored alongside the inputs.
/// @param reg       Regularization name forwarded to MLPPReg.
/// @param lambda    Regularization parameter forwarded to MLPPReg.
/// @param alpha     Regularization parameter forwarded to MLPPReg.
MLPPLinReg::MLPPLinReg(std::vector<std::vector<double>> inputSet, std::vector<double> outputSet, std::string reg, double lambda, double alpha) :
		inputSet(inputSet),
		outputSet(outputSet),
		n(inputSet.size()),
		// Reading row 0 of an empty training set is undefined behaviour; fall back to zero features.
		k(inputSet.empty() ? 0 : inputSet[0].size()),
		reg(reg),
		lambda(lambda),
		alpha(alpha) {
	y_hat.resize(n);

	weights = MLPPUtilities::weightInitialization(k);
	bias = MLPPUtilities::biasInitialization();
}
2023-01-25 00:54:50 +01:00
std : : vector < double > MLPPLinReg : : modelSetTest ( std : : vector < std : : vector < double > > X ) {
2023-01-24 19:00:54 +01:00
return Evaluate ( X ) ;
}
2023-01-25 00:54:50 +01:00
double MLPPLinReg : : modelTest ( std : : vector < double > x ) {
2023-01-24 19:00:54 +01:00
return Evaluate ( x ) ;
}
2023-01-25 00:54:50 +01:00
void MLPPLinReg : : NewtonRaphson ( double learning_rate , int max_epoch , bool UI ) {
2023-01-25 00:29:02 +01:00
MLPPLinAlg alg ;
2023-01-25 00:54:50 +01:00
MLPPReg regularization ;
2023-01-24 19:00:54 +01:00
double cost_prev = 0 ;
int epoch = 1 ;
forwardPass ( ) ;
while ( true ) {
cost_prev = Cost ( y_hat , outputSet ) ;
std : : vector < double > error = alg . subtraction ( y_hat , outputSet ) ;
// Calculating the weight gradients (2nd derivative)
std : : vector < double > first_derivative = alg . mat_vec_mult ( alg . transpose ( inputSet ) , error ) ;
std : : vector < std : : vector < double > > second_derivative = alg . matmult ( alg . transpose ( inputSet ) , inputSet ) ;
weights = alg . subtraction ( weights , alg . scalarMultiply ( learning_rate / n , alg . mat_vec_mult ( alg . transpose ( alg . inverse ( second_derivative ) ) , first_derivative ) ) ) ;
weights = regularization . regWeights ( weights , lambda , alpha , reg ) ;
// Calculating the bias gradients (2nd derivative)
bias - = learning_rate * alg . sum_elements ( error ) / n ; // We keep this the same. The 2nd derivative is just [1].
forwardPass ( ) ;
if ( UI ) {
2023-01-25 01:09:37 +01:00
MLPPUtilities : : CostInfo ( epoch , cost_prev , Cost ( y_hat , outputSet ) ) ;
MLPPUtilities : : UI ( weights , bias ) ;
2023-01-24 19:00:54 +01:00
}
epoch + + ;
if ( epoch > max_epoch ) {
break ;
}
}
}
2023-01-25 00:54:50 +01:00
void MLPPLinReg : : gradientDescent ( double learning_rate , int max_epoch , bool UI ) {
2023-01-25 00:29:02 +01:00
MLPPLinAlg alg ;
2023-01-25 00:54:50 +01:00
MLPPReg regularization ;
2023-01-24 19:00:54 +01:00
double cost_prev = 0 ;
int epoch = 1 ;
forwardPass ( ) ;
while ( true ) {
cost_prev = Cost ( y_hat , outputSet ) ;
std : : vector < double > error = alg . subtraction ( y_hat , outputSet ) ;
// Calculating the weight gradients
weights = alg . subtraction ( weights , alg . scalarMultiply ( learning_rate / n , alg . mat_vec_mult ( alg . transpose ( inputSet ) , error ) ) ) ;
weights = regularization . regWeights ( weights , lambda , alpha , reg ) ;
// Calculating the bias gradients
bias - = learning_rate * alg . sum_elements ( error ) / n ;
forwardPass ( ) ;
if ( UI ) {
2023-01-25 01:09:37 +01:00
MLPPUtilities : : CostInfo ( epoch , cost_prev , Cost ( y_hat , outputSet ) ) ;
MLPPUtilities : : UI ( weights , bias ) ;
2023-01-24 19:00:54 +01:00
}
epoch + + ;
if ( epoch > max_epoch ) {
break ;
}
}
}
2023-01-25 00:54:50 +01:00
void MLPPLinReg : : SGD ( double learning_rate , int max_epoch , bool UI ) {
2023-01-25 00:29:02 +01:00
MLPPLinAlg alg ;
2023-01-25 00:54:50 +01:00
MLPPReg regularization ;
2023-01-24 19:00:54 +01:00
double cost_prev = 0 ;
int epoch = 1 ;
while ( true ) {
std : : random_device rd ;
std : : default_random_engine generator ( rd ( ) ) ;
std : : uniform_int_distribution < int > distribution ( 0 , int ( n - 1 ) ) ;
int outputIndex = distribution ( generator ) ;
double y_hat = Evaluate ( inputSet [ outputIndex ] ) ;
cost_prev = Cost ( { y_hat } , { outputSet [ outputIndex ] } ) ;
double error = y_hat - outputSet [ outputIndex ] ;
// Weight updation
weights = alg . subtraction ( weights , alg . scalarMultiply ( learning_rate * error , inputSet [ outputIndex ] ) ) ;
weights = regularization . regWeights ( weights , lambda , alpha , reg ) ;
// Bias updation
bias - = learning_rate * error ;
y_hat = Evaluate ( { inputSet [ outputIndex ] } ) ;
if ( UI ) {
2023-01-25 01:09:37 +01:00
MLPPUtilities : : CostInfo ( epoch , cost_prev , Cost ( { y_hat } , { outputSet [ outputIndex ] } ) ) ;
MLPPUtilities : : UI ( weights , bias ) ;
2023-01-24 19:00:54 +01:00
}
epoch + + ;
if ( epoch > max_epoch ) {
break ;
}
}
forwardPass ( ) ;
}
2023-01-25 00:54:50 +01:00
void MLPPLinReg : : MBGD ( double learning_rate , int max_epoch , int mini_batch_size , bool UI ) {
2023-01-25 00:29:02 +01:00
MLPPLinAlg alg ;
2023-01-25 00:54:50 +01:00
MLPPReg regularization ;
2023-01-24 19:00:54 +01:00
double cost_prev = 0 ;
int epoch = 1 ;
// Creating the mini-batches
int n_mini_batch = n / mini_batch_size ;
2023-01-25 01:09:37 +01:00
auto [ inputMiniBatches , outputMiniBatches ] = MLPPUtilities : : createMiniBatches ( inputSet , outputSet , n_mini_batch ) ;
2023-01-24 19:00:54 +01:00
while ( true ) {
for ( int i = 0 ; i < n_mini_batch ; i + + ) {
std : : vector < double > y_hat = Evaluate ( inputMiniBatches [ i ] ) ;
cost_prev = Cost ( y_hat , outputMiniBatches [ i ] ) ;
std : : vector < double > error = alg . subtraction ( y_hat , outputMiniBatches [ i ] ) ;
// Calculating the weight gradients
weights = alg . subtraction ( weights , alg . scalarMultiply ( learning_rate / outputMiniBatches [ i ] . size ( ) , alg . mat_vec_mult ( alg . transpose ( inputMiniBatches [ i ] ) , error ) ) ) ;
weights = regularization . regWeights ( weights , lambda , alpha , reg ) ;
// Calculating the bias gradients
bias - = learning_rate * alg . sum_elements ( error ) / outputMiniBatches [ i ] . size ( ) ;
y_hat = Evaluate ( inputMiniBatches [ i ] ) ;
if ( UI ) {
2023-01-25 01:09:37 +01:00
MLPPUtilities : : CostInfo ( epoch , cost_prev , Cost ( y_hat , outputMiniBatches [ i ] ) ) ;
MLPPUtilities : : UI ( weights , bias ) ;
2023-01-24 19:00:54 +01:00
}
}
epoch + + ;
if ( epoch > max_epoch ) {
break ;
}
}
forwardPass ( ) ;
}
2023-01-25 00:54:50 +01:00
void MLPPLinReg : : normalEquation ( ) {
2023-01-25 00:29:02 +01:00
MLPPLinAlg alg ;
2023-01-25 01:09:37 +01:00
MLPPStat stat ;
2023-01-24 19:00:54 +01:00
std : : vector < double > x_means ;
std : : vector < std : : vector < double > > inputSetT = alg . transpose ( inputSet ) ;
x_means . resize ( inputSetT . size ( ) ) ;
for ( int i = 0 ; i < inputSetT . size ( ) ; i + + ) {
x_means [ i ] = ( stat . mean ( inputSetT [ i ] ) ) ;
}
2023-01-24 19:14:38 +01:00
//try {
2023-01-24 19:00:54 +01:00
std : : vector < double > temp ;
temp . resize ( k ) ;
temp = alg . mat_vec_mult ( alg . inverse ( alg . matmult ( alg . transpose ( inputSet ) , inputSet ) ) , alg . mat_vec_mult ( alg . transpose ( inputSet ) , outputSet ) ) ;
if ( std : : isnan ( temp [ 0 ] ) ) {
2023-01-24 19:14:38 +01:00
//throw 99;
//TODO ERR_FAIL_COND
2023-01-24 19:00:54 +01:00
} else {
if ( reg = = " Ridge " ) {
weights = alg . mat_vec_mult ( alg . inverse ( alg . addition ( alg . matmult ( alg . transpose ( inputSet ) , inputSet ) , alg . scalarMultiply ( lambda , alg . identity ( k ) ) ) ) , alg . mat_vec_mult ( alg . transpose ( inputSet ) , outputSet ) ) ;
} else {
weights = alg . mat_vec_mult ( alg . inverse ( alg . matmult ( alg . transpose ( inputSet ) , inputSet ) ) , alg . mat_vec_mult ( alg . transpose ( inputSet ) , outputSet ) ) ;
}
bias = stat . mean ( outputSet ) - alg . dot ( weights , x_means ) ;
forwardPass ( ) ;
}
2023-01-24 19:14:38 +01:00
//} catch (int err_num) {
// std::cout << "ERR " << err_num << ": Resulting matrix was noninvertible/degenerate, and so the normal equation could not be performed. Try utilizing gradient descent." << std::endl;
//}
2023-01-24 19:00:54 +01:00
}
2023-01-25 00:54:50 +01:00
double MLPPLinReg : : score ( ) {
2023-01-25 01:09:37 +01:00
MLPPUtilities util ;
2023-01-24 19:00:54 +01:00
return util . performance ( y_hat , outputSet ) ;
}
2023-01-25 00:54:50 +01:00
void MLPPLinReg : : save ( std : : string fileName ) {
2023-01-25 01:09:37 +01:00
MLPPUtilities util ;
2023-01-24 19:00:54 +01:00
util . saveParameters ( fileName , weights , bias ) ;
}
2023-01-25 00:54:50 +01:00
double MLPPLinReg : : Cost ( std : : vector < double > y_hat , std : : vector < double > y ) {
MLPPReg regularization ;
2023-01-24 19:37:08 +01:00
class MLPPCost cost ;
2023-01-24 19:00:54 +01:00
return cost . MSE ( y_hat , y ) + regularization . regTerm ( weights , lambda , alpha , reg ) ;
}
2023-01-25 00:54:50 +01:00
std : : vector < double > MLPPLinReg : : Evaluate ( std : : vector < std : : vector < double > > X ) {
2023-01-25 00:29:02 +01:00
MLPPLinAlg alg ;
2023-01-24 19:00:54 +01:00
return alg . scalarAdd ( bias , alg . mat_vec_mult ( X , weights ) ) ;
}
2023-01-25 00:54:50 +01:00
double MLPPLinReg : : Evaluate ( std : : vector < double > x ) {
2023-01-25 00:29:02 +01:00
MLPPLinAlg alg ;
2023-01-24 19:00:54 +01:00
return alg . dot ( weights , x ) + bias ;
}
// wTx + b
2023-01-25 00:54:50 +01:00
void MLPPLinReg : : forwardPass ( ) {
2023-01-24 19:00:54 +01:00
y_hat = Evaluate ( inputSet ) ;
}