#pragma once #include "core/omp_config.h" #include "utils/vector.h" #include "utils/matrix.h" #include "Layer.h" #include "utils/random.h" #include "random/random.h" namespace neural_networks{ template struct Dense_Layer : Layer{ T weight_regularizer_l1 = {0}; T weight_regularizer_l2 = {0}; T bias_regularizer_l1 = {0}; T bias_regularizer_l2 = {0}; utils::Matrix _inputs; utils::Matrix weights; utils::Vector biases; utils::Matrix outputs; utils::Matrix dweights; utils::Vector dbiases; utils::Matrix dinputs; // Variables for optimizers utils::Matrix weight_momentums; utils::Vector bias_momentums; utils::Matrix weight_cache; utils::Vector bias_cache; // Default Constructor Dense_Layer() = default; // Constructor Dense_Layer(const uint64_t n_inputs, const uint64_t n_neurons, const T weight_regularizer_l1=T{0}, const T weight_regularizer_l2=T{0}, const T bias_regularizer_l1=T{0}, const T bias_regularizer_l2=T{0}){ this->weight_regularizer_l1 = weight_regularizer_l1; this->weight_regularizer_l2 = weight_regularizer_l2; this->bias_regularizer_l1 = bias_regularizer_l1; this->bias_regularizer_l2 = bias_regularizer_l2; weights = numerics::mul( rng::normal(n_inputs, n_neurons, 0.0f, 1.0f), 0.1f); //weights = numerics::random_matrix(n_inputs, n_neurons, -1, 1); biases.resize(n_neurons, T{0}); } void forward(const utils::Matrix& inputs){ _inputs = inputs; //std::cout << "HERE" << std::endl; outputs = numerics::add_rowwise(numerics::matmul(inputs, weights), biases); } void backward(const utils::Matrix& dvalues){ // Gradients on parameters dweights = numerics::matmul(numerics::transpose(_inputs), dvalues); dbiases = numerics::sum_colwise(dvalues); // Gradients on regularization // L1 on weights if(weight_regularizer_l1){ utils::Matrix dL1(weights.rows(), weights.cols(), T{1}); for (uint64_t i = 0; i < weights.rows(); ++i){ for (uint64_t j = 0; j < weights.cols(); ++j){ if (weights(i,j) < 0){ dL1(i,j) = -1; } } } dweights = numerics::add(dweights, numerics::mul(dL1, weight_regularizer_l1)); } // L2 on weights if(weight_regularizer_l2){ dweights = numerics::add(dweights, numerics::mul(numerics::mul(weights, weight_regularizer_l2),T{2})); } // L1 on biases if(bias_regularizer_l1){ utils::Vector dL1(biases.size(), T{1}); for (uint64_t i = 0; i < dL1.size(); ++i){ if (biases[i] < 0){ dL1[i] = -1; } } dbiases = numerics::add(dbiases, numerics::mul(dL1, bias_regularizer_l1)); } // L2 on biases if (bias_regularizer_l2){ dbiases = numerics::add(dbiases, numerics::mul(numerics::mul(biases, bias_regularizer_l2),T{2})); } //Gradient on values dinputs = numerics::matmul(dvalues, numerics::transpose(weights)); } }; } // end namespace neural_networks