/*************************************************************************/ /* pca.cpp */ /*************************************************************************/ /* This file is part of: */ /* PMLPP Machine Learning Library */ /* https://github.com/Relintai/pmlpp */ /*************************************************************************/ /* Copyright (c) 2023-present Péter Magyar. */ /* Copyright (c) 2022-2023 Marc Melikyan */ /* */ /* Permission is hereby granted, free of charge, to any person obtaining */ /* a copy of this software and associated documentation files (the */ /* "Software"), to deal in the Software without restriction, including */ /* without limitation the rights to use, copy, modify, merge, publish, */ /* distribute, sublicense, and/or sell copies of the Software, and to */ /* permit persons to whom the Software is furnished to do so, subject to */ /* the following conditions: */ /* */ /* The above copyright notice and this permission notice shall be */ /* included in all copies or substantial portions of the Software. */ /* */ /* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, */ /* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF */ /* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.*/ /* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY */ /* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, */ /* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE */ /* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ /*************************************************************************/ #include "pca.h" #include "../data/data.h" Ref MLPPPCA::get_input_set() { return _input_set; } void MLPPPCA::set_input_set(const Ref &val) { _input_set = val; } int MLPPPCA::get_k() { return _k; } void MLPPPCA::set_k(const int val) { _k = val; } Ref MLPPPCA::principal_components() { ERR_FAIL_COND_V(!_input_set.is_valid() || _k == 0, Ref()); MLPPData data; MLPPMatrix::SVDResult svr_res = _input_set->cov()->svd(); _x_normalized = data.mean_centering(_input_set); Size2i svr_res_u_size = svr_res.U->size(); _u_reduce->resize(Size2i(_k, svr_res_u_size.y)); for (int i = 0; i < _k; ++i) { for (int j = 0; j < svr_res_u_size.y; ++j) { _u_reduce->element_set(j, i, svr_res.U->element_get(j, i)); } } _z = _u_reduce->transposen()->multn(_x_normalized); return _z; } // Simply tells us the percentage of variance maintained. real_t MLPPPCA::score() { ERR_FAIL_COND_V(!_input_set.is_valid() || _k == 0, 0); Ref x_approx = _u_reduce->multn(_z); real_t num = 0; real_t den = 0; Size2i x_normalized_size = _x_normalized->size(); int x_normalized_size_y = x_normalized_size.y; Ref x_approx_row_tmp; x_approx_row_tmp.instance(); x_approx_row_tmp->resize(x_approx->size().x); Ref x_normalized_row_tmp; x_normalized_row_tmp.instance(); x_normalized_row_tmp->resize(x_normalized_size.x); for (int i = 0; i < x_normalized_size_y; ++i) { _x_normalized->row_get_into_mlpp_vector(i, x_normalized_row_tmp); x_approx->row_get_into_mlpp_vector(i, x_approx_row_tmp); num += x_normalized_row_tmp->subn(x_approx_row_tmp)->norm_sq(); } num /= x_normalized_size_y; for (int i = 0; i < x_normalized_size_y; ++i) { _x_normalized->row_get_into_mlpp_vector(i, x_normalized_row_tmp); den += x_normalized_row_tmp->norm_sq(); } den /= x_normalized_size_y; if (den == 0) { den += 1e-10; // For numerical sanity as to not recieve a domain error } return 1 - num / den; } MLPPPCA::MLPPPCA(const Ref &p_input_set, int p_k) { _k = p_k; _input_set = p_input_set; _x_normalized.instance(); _u_reduce.instance(); _z.instance(); } MLPPPCA::MLPPPCA() { _k = 0; _x_normalized.instance(); _u_reduce.instance(); _z.instance(); } MLPPPCA::~MLPPPCA() { } void MLPPPCA::_bind_methods() { ClassDB::bind_method(D_METHOD("get_input_set"), &MLPPPCA::get_input_set); ClassDB::bind_method(D_METHOD("set_input_set", "val"), &MLPPPCA::set_input_set); ADD_PROPERTY(PropertyInfo(Variant::OBJECT, "get_input_set", PROPERTY_HINT_RESOURCE_TYPE, "MLPPMatrix"), "set_input_set", "get_input_set"); ClassDB::bind_method(D_METHOD("get_k"), &MLPPPCA::get_k); ClassDB::bind_method(D_METHOD("set_k", "val"), &MLPPPCA::set_k); ADD_PROPERTY(PropertyInfo(Variant::INT, "k"), "set_k", "get_k"); ClassDB::bind_method(D_METHOD("principal_components"), &MLPPPCA::principal_components); ClassDB::bind_method(D_METHOD("score"), &MLPPPCA::score); }