diff --git a/python/mxnet/gluon/loss.py b/python/mxnet/gluon/loss.py index 45c3dee08139..40fdaa51573e 100644 --- a/python/mxnet/gluon/loss.py +++ b/python/mxnet/gluon/loss.py @@ -424,7 +424,7 @@ class KLDivLoss(Loss): prob = \softmax({pred}) - L = \sum_i {label}_i * \big[\log({label}_i) - log({pred}_i)\big] + L = \sum_i {label}_i * \big[\log({label}_i) - \log({prob}_i)\big] `label` and `pred` can have arbitrary shape as long as they have the same