Deep Learning Algorithm Implementations 1.0.0
C++ implementations of fundamental deep learning algorithms
losses.cpp
#include "loss/losses.hpp"
#include <cmath>
#include <algorithm>

namespace dl::loss {

// ============================================================================
// MSE Loss Implementation
// ============================================================================

template<typename T>
Variable<T> MSELoss<T>::forward(const Variable<T>& predictions, const Variable<T>& targets) {
    // MSE loss computation:
    // 1. Compute the difference: diff = predictions - targets
    // 2. Square the difference: squared_diff = diff * diff
    // 3. Apply the reduction (mean, sum, or none)

    Variable<T> diff = predictions - targets;
    Variable<T> squared_diff = diff * diff;

    if (reduction_ == "mean") {
        return squared_diff.mean();
    } else if (reduction_ == "sum") {
        return squared_diff.sum();
    } else {
        return squared_diff;
    }
}
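
// ----------------------------------------------------------------------------
// Sketch: a minimal forward-only use of MSELoss on 1x1 Variables. Illustrative
// only and excluded from the build: it assumes MSELoss has a reduction-string
// constructor (mirroring how BCELoss is constructed below) and that the bool
// Variable argument is a requires_grad flag.
// ----------------------------------------------------------------------------
#if 0
inline void mse_usage_sketch() {
    Variable<float> prediction(Matrix<float>(1, 1, 0.8f), true);   // assumed requires_grad flag
    Variable<float> target(Matrix<float>(1, 1, 1.0f), false);
    MSELoss<float> mse("mean");                                    // assumed constructor
    Variable<float> loss = mse.forward(prediction, target);
    // With a single element, "mean" reduction yields (0.8 - 1.0)^2 = 0.04.
}
#endif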

// ============================================================================
// Cross Entropy Loss Implementation
// ============================================================================

template<typename T>
Variable<T> CrossEntropyLoss<T>::softmax(const Variable<T>& logits) {
    // TODO: Implement numerically stable softmax
    // Steps:
    // 1. Subtract the maximum for numerical stability: shifted = logits - max(logits)
    // 2. Exponentiate: exp_shifted = exp(shifted)
    // 3. Normalize: softmax = exp_shifted / sum(exp_shifted)

    // Placeholder implementation: computes the exponentials but does not yet
    // subtract the maximum or normalize, so the result is NOT a valid softmax.
    Variable<T> exp_logits = logits.exp();
    Variable<T> sum_exp = exp_logits.sum();
    (void)sum_exp;  // TODO: divide exp_logits by sum_exp once broadcasting division exists
    return exp_logits; // Placeholder
}
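
// ----------------------------------------------------------------------------
// Sketch: one possible numerically stable softmax. Illustrative only and
// excluded from the build: it assumes a hypothetical Variable<T>::max()
// reduction, broadcasting subtraction of its result, and a hypothetical
// broadcasting operator/ that the current Variable API may not provide.
// ----------------------------------------------------------------------------
#if 0
template<typename T>
Variable<T> stable_softmax_sketch(const Variable<T>& logits) {
    // Subtract the (assumed) maximum so exp() cannot overflow.
    Variable<T> shifted = logits - logits.max();          // hypothetical max()
    Variable<T> exp_shifted = shifted.exp();
    // Normalize with an (assumed) broadcasting division.
    return exp_shifted / exp_shifted.sum();               // hypothetical operator/
}
#endif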

template<typename T>
Variable<T> CrossEntropyLoss<T>::log_softmax(const Variable<T>& logits) {
    // TODO: Implement numerically stable log_softmax
    // log_softmax(x) = x - log(sum(exp(x)))
    // This is more stable than computing log(softmax(x)) directly.

    // Placeholder implementation: element-wise log of the logits,
    // which is NOT a real log-softmax.
    return logits.log(); // Placeholder
}
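
// ----------------------------------------------------------------------------
// Sketch: one possible numerically stable log_softmax, using the identity
// log_softmax(x) = (x - m) - log(sum(exp(x - m))) with m = max(x).
// Illustrative only and excluded from the build: it assumes a hypothetical
// max() reduction and that operator- broadcasts a scalar Variable against a
// matrix Variable in both operand orders.
// ----------------------------------------------------------------------------
#if 0
template<typename T>
Variable<T> stable_log_softmax_sketch(const Variable<T>& logits) {
    Variable<T> shifted = logits - logits.max();           // hypothetical max()
    Variable<T> log_sum = shifted.exp().sum().log();       // log(sum(exp(shifted)))
    return shifted - log_sum;                              // assumed broadcasting subtraction
}
#endif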

template<typename T>
Variable<T> CrossEntropyLoss<T>::forward(const Variable<T>& predictions, const Variable<T>& targets) {
    // Cross entropy loss (correct once log_softmax above is completed):
    // 1. Apply log_softmax to the predictions
    // 2. Compute the negative log likelihood: -targets * log_softmax_pred
    // 3. Apply the reduction

    Variable<T> log_probs = log_softmax(predictions);
    Variable<T> nll = targets * log_probs;
    Variable<T> loss = nll * Variable<T>(Matrix<T>(1, 1, -1.0), false); // Negate

    if (reduction_ == "mean") {
        return loss.mean();
    } else if (reduction_ == "sum") {
        return loss.sum();
    } else {
        return loss;
    }
}
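
// Note (assuming mean() averages over all elements): with one-hot targets the
// "mean" reduction above divides by batch_size * num_classes, whereas a
// PyTorch-style cross entropy averages per-sample losses over the batch only.
// A per-sample average would additionally need a row-wise sum before the mean,
// which the current Variable API may not provide.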

// ============================================================================
// Binary Cross Entropy Loss Implementation
// ============================================================================

template<typename T>
Variable<T> BCELoss<T>::forward(const Variable<T>& predictions, const Variable<T>& targets) {
    // BCE = -[y * log(p) + (1-y) * log(1-p)]
    // Steps:
    // 1. Compute log(predictions) and log(1 - predictions)
    // 2. Apply the BCE formula
    // 3. Apply the reduction

    // Small epsilon for numerical stability (unused until clamping is implemented)
    T eps = static_cast<T>(1e-7);
    Variable<T> eps_var(Matrix<T>(1, 1, eps), false);
    Variable<T> one_var(Matrix<T>(1, 1, 1.0), false);
    (void)eps_var;

    // TODO: Clamp predictions to [eps, 1 - eps] to avoid log(0)
    Variable<T> log_pred = predictions.log();
    Variable<T> log_one_minus_pred = (one_var - predictions).log();

    Variable<T> loss = targets * log_pred + (one_var - targets) * log_one_minus_pred;
    loss = loss * Variable<T>(Matrix<T>(1, 1, -1.0), false); // Negate

    if (reduction_ == "mean") {
        return loss.mean();
    } else if (reduction_ == "sum") {
        return loss.sum();
    } else {
        return loss;
    }
}
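
// ----------------------------------------------------------------------------
// Sketch: clamping the predictions into [eps, 1 - eps] before taking logs.
// Illustrative only and excluded from the build: it assumes a hypothetical
// element-wise Variable<T>::clamp(lo, hi) that the current API may lack.
// ----------------------------------------------------------------------------
#if 0
template<typename T>
Variable<T> clamp_probabilities_sketch(const Variable<T>& p, T eps = static_cast<T>(1e-7)) {
    // Keep p away from 0 and 1 so log(p) and log(1 - p) stay finite.
    return p.clamp(eps, static_cast<T>(1) - eps);   // hypothetical clamp(lo, hi)
}
#endif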

// ============================================================================
// BCE with Logits Loss Implementation
// ============================================================================

template<typename T>
Variable<T> BCEWithLogitsLoss<T>::forward(const Variable<T>& predictions, const Variable<T>& targets) {
    // TODO: Implement BCE with logits using the numerically stable identity
    //   BCE_with_logits(x, y) = max(x, 0) - x*y + log(1 + exp(-|x|))
    // which avoids computing the sigmoid explicitly.

    // Placeholder: apply sigmoid, then reuse BCELoss
    Variable<T> sigmoid_pred = predictions.sigmoid();
    BCELoss<T> bce_loss(reduction_);
    return bce_loss.forward(sigmoid_pred, targets);
}
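
// ----------------------------------------------------------------------------
// Sketch: the stable formulation max(x, 0) - x*y + log(1 + exp(-|x|)).
// Illustrative only and excluded from the build: it assumes hypothetical
// element-wise abs() and relu() operations and that operator+ broadcasts a
// scalar Variable against a matrix Variable.
// ----------------------------------------------------------------------------
#if 0
template<typename T>
Variable<T> bce_with_logits_sketch(const Variable<T>& x, const Variable<T>& y) {
    Variable<T> one(Matrix<T>(1, 1, 1.0), false);
    Variable<T> neg_abs_x = x.abs() * Variable<T>(Matrix<T>(1, 1, -1.0), false); // hypothetical abs()
    Variable<T> log_term = (one + neg_abs_x.exp()).log();      // log(1 + exp(-|x|)), assumed broadcast +
    return x.relu() - x * y + log_term;                        // hypothetical relu() = max(x, 0)
}
#endif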

// ============================================================================
// Hinge Loss Implementation
// ============================================================================

template<typename T>
Variable<T> HingeLoss<T>::forward(const Variable<T>& predictions, const Variable<T>& targets) {
    // TODO: Implement hinge loss
    // Hinge(y_pred, y_true) = max(0, 1 - y_true * y_pred)
    // Steps:
    // 1. Compute the margin: 1 - targets * predictions
    // 2. Apply max(0, margin) - this requires implementing a max operation
    // 3. Apply the reduction

    Variable<T> one_var(Matrix<T>(1, 1, 1.0), false);
    Variable<T> margin = one_var - targets * predictions;

    // TODO: Implement max(0, margin); until then the raw margin is returned,
    // so negative margins are not yet clipped to zero.
    Variable<T> loss = margin; // Placeholder

    if (reduction_ == "mean") {
        return loss.mean();
    } else if (reduction_ == "sum") {
        return loss.sum();
    } else {
        return loss;
    }
}
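
// ----------------------------------------------------------------------------
// Sketch: the complete hinge loss once the margin can be clipped at zero.
// Illustrative only and excluded from the build: it assumes a hypothetical
// element-wise relu() on Variable<T>.
// ----------------------------------------------------------------------------
#if 0
template<typename T>
Variable<T> hinge_loss_sketch(const Variable<T>& predictions, const Variable<T>& targets) {
    Variable<T> one_var(Matrix<T>(1, 1, 1.0), false);
    Variable<T> margin = one_var - targets * predictions;
    return margin.relu().mean();   // hypothetical relu(): element-wise max(0, margin)
}
#endif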

// ============================================================================
// Huber Loss Implementation
// ============================================================================

template<typename T>
Variable<T> HuberLoss<T>::forward(const Variable<T>& predictions, const Variable<T>& targets) {
    // TODO: Implement Huber loss
    // Huber(y_pred, y_true) = {
    //     0.5 * (y_pred - y_true)²                  if |y_pred - y_true| <= delta
    //     delta * |y_pred - y_true| - 0.5 * delta²  otherwise
    // }
    // Steps:
    // 1. Compute the absolute difference: |predictions - targets|
    // 2. Create a mask for |diff| <= delta
    // 3. Apply the conditional logic
    // 4. Apply the reduction

    Variable<T> diff = predictions - targets;
    Variable<T> abs_diff = diff; // TODO: Implement an abs() operation (placeholder, unused)
    (void)abs_diff;

    // Placeholder: fall back to 0.5 * squared error until the piecewise form is implemented
    Variable<T> squared_diff = diff * diff;
    Variable<T> half_var(Matrix<T>(1, 1, 0.5), false);
    Variable<T> loss = half_var * squared_diff;

    if (reduction_ == "mean") {
        return loss.mean();
    } else if (reduction_ == "sum") {
        return loss.sum();
    } else {
        return loss;
    }
}
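
// ----------------------------------------------------------------------------
// Sketch: the piecewise Huber loss built from a {0,1} mask. Illustrative only
// and excluded from the build: it assumes hypothetical element-wise abs() and
// less_equal() operations (the latter returning a 0/1-valued Variable), and
// that scalar/matrix arithmetic broadcasts in both operand orders.
// ----------------------------------------------------------------------------
#if 0
template<typename T>
Variable<T> huber_loss_sketch(const Variable<T>& predictions, const Variable<T>& targets, T delta) {
    Variable<T> diff = predictions - targets;
    Variable<T> abs_diff = diff.abs();                                   // hypothetical abs()
    Variable<T> mask = abs_diff.less_equal(delta);                       // hypothetical 0/1 mask
    Variable<T> half(Matrix<T>(1, 1, 0.5), false);
    Variable<T> delta_var(Matrix<T>(1, 1, delta), false);
    Variable<T> one(Matrix<T>(1, 1, 1.0), false);

    Variable<T> quadratic = half * diff * diff;                          // 0.5 * diff²
    Variable<T> linear = delta_var * abs_diff - half * delta_var * delta_var;
    return (mask * quadratic + (one - mask) * linear).mean();
}
#endif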

// ============================================================================
// Explicit Template Instantiations
// ============================================================================

template class MSELoss<float>;
template class MSELoss<double>;
template class CrossEntropyLoss<float>;
template class CrossEntropyLoss<double>;
template class BCELoss<float>;
template class BCELoss<double>;
template class BCEWithLogitsLoss<float>;
template class BCEWithLogitsLoss<double>;
template class HingeLoss<float>;
template class HingeLoss<double>;
template class HuberLoss<float>;
template class HuberLoss<double>;

} // namespace dl::loss