Sync public subset from Flux

This commit is contained in:
Gitea CI
2025-10-20 12:24:21 +00:00
parent 9a69d64d79
commit a334b74935
8 changed files with 230 additions and 35 deletions

View File

@@ -11,30 +11,47 @@
#include "./numerics/matdiv.h"
namespace neural_networks{
/// Softmax activation layer.
///
/// forward() converts a matrix of raw scores into normalized values and stores
/// the result in `outputs`; backward() propagates an upstream gradient through
/// that result, row by row, into `dinputs`.
template <typename T>
struct Activation_Softmax{
    // Intermediates of the most recent forward() call. They are kept as
    // members so any caller that reads them keeps working; `outputs` carries
    // the same values as `probabilities`.
    utils::Matrix<T> exp_values;
    utils::Matrix<T> probabilities;
    // Result of the most recent forward() call; read back by backward().
    utils::Matrix<T> outputs;
    // Gradient with respect to the inputs, written by backward().
    utils::Matrix<T> dinputs;

    /// Runs the forward pass on `inputs` and stores the result in `outputs`.
    ///
    /// Each intermediate is computed exactly once and written straight into
    /// its member, instead of being recomputed into a shadowing local.
    void forward(const utils::Matrix<T>& inputs){
        // Get unnormalized probabilities.
        // NOTE(review): presumably matmax(..., "rows") yields one maximum per
        // sample and subtracting it keeps exp() from overflowing -- confirm
        // the axis semantics of the "rows"/"col" arguments in numerics/.
        exp_values = numerics::matexp(
            numerics::matsubtract(inputs, numerics::matmax(inputs, "rows"), "col"));

        // Normalize them for each sample.
        probabilities = numerics::matdiv(
            exp_values, numerics::matsum(exp_values, "col"), "col");

        outputs = probabilities;
    }

    /// Runs the backward pass, filling `dinputs` from the upstream gradient.
    ///
    /// For every row i this evaluates
    ///   dinputs(i,j) = outputs(i,j) * (dvalues(i,j) - sum_k outputs(i,k) * dvalues(i,k))
    /// which applies the softmax Jacobian of that row to the incoming gradient
    /// without building the Jacobian matrix itself.
    ///
    /// Precondition (not checked here): `outputs` must be indexable over the
    /// full rows x cols extent of `dvalues`, i.e. forward() has been called on
    /// a batch of matching shape.
    void backward(const utils::Matrix<T>& dvalues){
        const uint64_t rows = dvalues.rows();
        const uint64_t cols = dvalues.cols();

        // Only resize when the shape actually differs from the previous call.
        if ((dinputs.rows() != rows) || (dinputs.cols() != cols)){
            dinputs.resize(rows, cols);
        }

        for (uint64_t i = 0; i < rows; ++i){
            // Row-wise inner product of the softmax output and the gradient.
            T dot = T{0};
            for (uint64_t j = 0; j < cols; ++j){
                dot += outputs(i,j) * dvalues(i,j);
            }
            for (uint64_t j = 0; j < cols; ++j){
                dinputs(i,j) = outputs(i,j) * (dvalues(i,j) - dot);
            }
        }
    }
};
} // end namespace neural_networks