Add the cross-entropy loss. (#287)

This commit is contained in:
Laurent Mazare
2023-07-31 14:26:36 +01:00
committed by GitHub
parent ffeafbfc43
commit 1064b9b031
2 changed files with 21 additions and 1 deletion

@@ -26,3 +26,20 @@ pub fn nll(inp: &Tensor, target: &Tensor) -> Result<Tensor> {
.sum_all()?
.affine(-1f64 / b_sz as f64, 0.)
}
/// The cross-entropy loss.
///
/// Arguments
///
/// * [inp]: The input tensor of dimensions `N, C` where `N` is the batch size and `C` the number
///   of categories. This is expected to contain raw logits.
/// * [target]: The ground truth labels as a tensor of u32 of dimension `N`.
///
/// The resulting tensor is a scalar containing the average value over the batch.
pub fn cross_entropy(inp: &Tensor, target: &Tensor) -> Result<Tensor> {
if inp.rank() != 2 {
candle::bail!("cross_entropy expects an input tensor of rank 2")
}
let inp = crate::ops::log_softmax(inp, 1)?;
nll(&inp, target)
}
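
For context, here is a minimal usage sketch, not part of the commit. It assumes the function is exposed as `candle_nn::loss::cross_entropy` and uses candle's `Tensor::new` / `Device::Cpu` constructors; the loss itself is just `log_softmax` over the category dimension followed by the existing `nll` helper, so the input should be raw logits rather than probabilities.

use candle::{Device, Result, Tensor};

fn main() -> Result<()> {
    let device = Device::Cpu;
    // Raw logits for a batch of 2 samples over 3 categories (shape `N, C` = 2, 3).
    let logits = Tensor::new(&[[2.0f32, 0.5, 0.1], [0.2, 1.5, 0.3]], &device)?;
    // Ground-truth class indices as u32, one per sample (shape `N` = 2).
    let targets = Tensor::new(&[0u32, 1u32], &device)?;
    // Scalar loss averaged over the batch.
    // NB: module path is an assumption; adjust to wherever this loss lands in candle-nn.
    let loss = candle_nn::loss::cross_entropy(&logits, &targets)?;
    println!("loss: {}", loss.to_scalar::<f32>()?);
    Ok(())
}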