lightning/pytorch_lightning/metrics/functional/confusion_matrix.py

# Copyright The PyTorch Lightning team.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from typing import Optional

import torch

from pytorch_lightning.metrics.classification.helpers import _input_format_classification
from pytorch_lightning.utilities import rank_zero_warn


def _confusion_matrix_update(
    preds: torch.Tensor, target: torch.Tensor, num_classes: int, threshold: float = 0.5
) -> torch.Tensor:
    """
    Count (target, prediction) pairs into a ``(num_classes, num_classes)`` matrix.

    Both inputs are first passed through ``_input_format_classification``, which
    also reports the detected input ``mode``. For every mode other than
    ``'binary'`` and ``'multi-label'`` the class dimension (``dim=1``) of both
    tensors is collapsed with ``argmax``.
    NOTE(review): this presumes the helper returns one-hot style
    ``(N, C, ...)`` tensors for those modes -- confirm against the helper.

    Args:
        preds: predictions, forwarded unchanged to ``_input_format_classification``
        target: ground truth, forwarded unchanged to ``_input_format_classification``
        num_classes: side length of the resulting square matrix
        threshold: forwarded to ``_input_format_classification``

    Returns:
        Integer tensor of shape ``(num_classes, num_classes)`` in which entry
        ``[i, j]`` is the number of elements with target ``i`` and prediction ``j``.
    """
    preds, target, mode = _input_format_classification(preds, target, threshold)

    already_label_valued = mode in ('binary', 'multi-label')
    if not already_label_valued:
        preds, target = preds.argmax(dim=1), target.argmax(dim=1)

    flat_target = target.view(-1)
    flat_preds = preds.view(-1)
    # Encode each (target, pred) pair as one flat index into the row-major
    # num_classes x num_classes grid, so a single bincount tallies every cell.
    cell_index = (flat_target * num_classes + flat_preds).to(torch.long)
    cell_counts = torch.bincount(cell_index, minlength=num_classes**2)
    return cell_counts.reshape(num_classes, num_classes)


def _confusion_matrix_compute(confmat: torch.Tensor, normalize: Optional[str] = None) -> torch.Tensor:
    allowed_normalize = ('true', 'pred', 'all', None)
    assert normalize in allowed_normalize, \
        f"Argument average needs to one of the following: {allowed_normalize}"
    confmat = confmat.float()
    if normalize is not None:
        if normalize == 'true':
            cm = confmat / confmat.sum(axis=1, keepdim=True)
        elif normalize == 'pred':
            cm = confmat / confmat.sum(axis=0, keepdim=True)
        elif normalize == 'all':
            cm = confmat / confmat.sum()
        nan_elements = cm[torch.isnan(cm)].nelement()
        if nan_elements != 0:
            cm[torch.isnan(cm)] = 0
            rank_zero_warn(f'{nan_elements} nan values found in confusion matrix have been replaced with zeros.')
        return cm
    return confmat


def confusion_matrix(
    preds: torch.Tensor,
    target: torch.Tensor,
    num_classes: int,
    normalize: Optional[str] = None,
    threshold: float = 0.5
) -> torch.Tensor:
    """
    Computes the confusion matrix for binary, multiclass, and multilabel data.
    ``preds`` may hold model outputs (logits/probabilities) or integer class
    labels, and both ``preds`` and ``target`` may be multi-dimensional.

    When ``preds`` is a float tensor with the same shape as ``target`` (binary
    and multi-label logits), the ``threshold`` argument is used to binarize it.

    When ``preds`` carries an extra class dimension (multi-class scores), an
    argmax over ``dim=1`` selects the predicted class.

    Args:
        preds: (float or long tensor), Either a ``(N, ...)`` tensor with labels or
            ``(N, C, ...)`` where C is the number of classes, tensor with logits/probabilities
        target: (long tensor), tensor with shape ``(N, ...)`` with ground truth labels
        num_classes: Number of classes in the dataset.
        normalize: Normalization mode for confusion matrix. Choose from

            - ``None``: no normalization (default)
            - ``'true'``: normalization over the targets (most commonly used)
            - ``'pred'``: normalization over the predictions
            - ``'all'``: normalization over the whole matrix

        threshold:
            Threshold value for binary or multi-label logits. default: 0.5

    Returns:
        Float tensor of shape ``(num_classes, num_classes)``; rows correspond to
        target classes and columns to predicted classes.

    Example:

        >>> from pytorch_lightning.metrics.functional import confusion_matrix
        >>> target = torch.tensor([1, 1, 0, 0])
        >>> preds = torch.tensor([0, 1, 0, 0])
        >>> confusion_matrix(preds, target, num_classes=2)
        tensor([[2., 0.],
                [1., 1.]])
    """
    # Tally raw counts first, then cast/normalize them in a separate step.
    return _confusion_matrix_compute(
        _confusion_matrix_update(preds, target, num_classes, threshold),
        normalize,
    )
[Metrics] Confusion matrix class interface (#4348) * docs + precision + recall + f_beta + refactor Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * rebase Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * fixes Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * added missing file * docs * docs * extra import * add confusion matrix * add to docs * add test * pep8 + isort * update tests * move util function * unify functional and class * add to init * remove old implementation * update tests * pep8 * add duplicate * fix doctest * Update pytorch_lightning/metrics/classification/confusion_matrix.py Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> * changelog * bullet point args * bullet docs * bullet docs Co-authored-by: ananyahjha93 <ananya@pytorchlightning.ai> Co-authored-by: Teddy Koker <teddy.koker@gmail.com> Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> Co-authored-by: chaton <thomas@grid.ai> Co-authored-by: Roger Shieh <55400948+s-rog@users.noreply.github.com> Co-authored-by: Rohit Gupta <rohitgr1998@gmail.com> 2020-10-30 10:44:25 +00:00			`# Copyright The PyTorch Lightning team.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`
			`from typing import Optional`

			`import torch`

drop duplicated metric helper (#5366) * drop duplicated metric helper * . * fix tests Co-authored-by: Nicki Skafte <skaftenicki@gmail.com> 2021-01-06 23:49:59 +00:00			`from pytorch_lightning.metrics.classification.helpers import _input_format_classification`
[Metrics] PrecisionRecallCurve, ROC and AveragePrecision class interface (#4549) * initial changes * remove old * init files * add average precision * add precision_recall_curve * add roc * cleaning * docs * pep8 * docs * pep8 * changelog * examples prune duplicate roc * format * imports * fix * format * flake8 * duplicate * fix * flake8 * docs * docs Co-authored-by: Teddy Koker <teddy.koker@gmail.com> Co-authored-by: Nicki Skafte <nugginea@gmail.com> Co-authored-by: Jirka Borovec <Borda@users.noreply.github.com> Co-authored-by: Jirka Borovec <jirka.borovec@seznam.cz> 2020-12-04 21:42:23 +00:00			`from pytorch_lightning.utilities import rank_zero_warn`
[Metrics] Confusion matrix class interface (#4348) * docs + precision + recall + f_beta + refactor Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * rebase Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * fixes Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * added missing file * docs * docs * extra import * add confusion matrix * add to docs * add test * pep8 + isort * update tests * move util function * unify functional and class * add to init * remove old implementation * update tests * pep8 * add duplicate * fix doctest * Update pytorch_lightning/metrics/classification/confusion_matrix.py Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> * changelog * bullet point args * bullet docs * bullet docs Co-authored-by: ananyahjha93 <ananya@pytorchlightning.ai> Co-authored-by: Teddy Koker <teddy.koker@gmail.com> Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> Co-authored-by: chaton <thomas@grid.ai> Co-authored-by: Roger Shieh <55400948+s-rog@users.noreply.github.com> Co-authored-by: Rohit Gupta <rohitgr1998@gmail.com> 2020-10-30 10:44:25 +00:00

formatting 6/n: metrics (#5722) * yapf metrics * op 2021-02-01 08:24:07 +00:00			`def _confusion_matrix_update(`
			`preds: torch.Tensor, target: torch.Tensor, num_classes: int, threshold: float = 0.5`
			`) -> torch.Tensor:`
drop duplicated metric helper (#5366) * drop duplicated metric helper * . * fix tests Co-authored-by: Nicki Skafte <skaftenicki@gmail.com> 2021-01-06 23:49:59 +00:00			`preds, target, mode = _input_format_classification(preds, target, threshold)`
			`if mode not in ('binary', 'multi-label'):`
			`preds = preds.argmax(dim=1)`
			`target = target.argmax(dim=1)`
[Metrics] Confusion matrix class interface (#4348) * docs + precision + recall + f_beta + refactor Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * rebase Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * fixes Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * added missing file * docs * docs * extra import * add confusion matrix * add to docs * add test * pep8 + isort * update tests * move util function * unify functional and class * add to init * remove old implementation * update tests * pep8 * add duplicate * fix doctest * Update pytorch_lightning/metrics/classification/confusion_matrix.py Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> * changelog * bullet point args * bullet docs * bullet docs Co-authored-by: ananyahjha93 <ananya@pytorchlightning.ai> Co-authored-by: Teddy Koker <teddy.koker@gmail.com> Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> Co-authored-by: chaton <thomas@grid.ai> Co-authored-by: Roger Shieh <55400948+s-rog@users.noreply.github.com> Co-authored-by: Rohit Gupta <rohitgr1998@gmail.com> 2020-10-30 10:44:25 +00:00			`unique_mapping = (target.view(-1) * num_classes + preds.view(-1)).to(torch.long)`
formatting 6/n: metrics (#5722) * yapf metrics * op 2021-02-01 08:24:07 +00:00			`bins = torch.bincount(unique_mapping, minlength=num_classes**2)`
[Metrics] Confusion matrix class interface (#4348) * docs + precision + recall + f_beta + refactor Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * rebase Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * fixes Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * added missing file * docs * docs * extra import * add confusion matrix * add to docs * add test * pep8 + isort * update tests * move util function * unify functional and class * add to init * remove old implementation * update tests * pep8 * add duplicate * fix doctest * Update pytorch_lightning/metrics/classification/confusion_matrix.py Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> * changelog * bullet point args * bullet docs * bullet docs Co-authored-by: ananyahjha93 <ananya@pytorchlightning.ai> Co-authored-by: Teddy Koker <teddy.koker@gmail.com> Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> Co-authored-by: chaton <thomas@grid.ai> Co-authored-by: Roger Shieh <55400948+s-rog@users.noreply.github.com> Co-authored-by: Rohit Gupta <rohitgr1998@gmail.com> 2020-10-30 10:44:25 +00:00			`confmat = bins.reshape(num_classes, num_classes)`
			`return confmat`


formatting 6/n: metrics (#5722) * yapf metrics * op 2021-02-01 08:24:07 +00:00			`def _confusion_matrix_compute(confmat: torch.Tensor, normalize: Optional[str] = None) -> torch.Tensor:`
[Metrics] Confusion matrix class interface (#4348) * docs + precision + recall + f_beta + refactor Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * rebase Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * fixes Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * added missing file * docs * docs * extra import * add confusion matrix * add to docs * add test * pep8 + isort * update tests * move util function * unify functional and class * add to init * remove old implementation * update tests * pep8 * add duplicate * fix doctest * Update pytorch_lightning/metrics/classification/confusion_matrix.py Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> * changelog * bullet point args * bullet docs * bullet docs Co-authored-by: ananyahjha93 <ananya@pytorchlightning.ai> Co-authored-by: Teddy Koker <teddy.koker@gmail.com> Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> Co-authored-by: chaton <thomas@grid.ai> Co-authored-by: Roger Shieh <55400948+s-rog@users.noreply.github.com> Co-authored-by: Rohit Gupta <rohitgr1998@gmail.com> 2020-10-30 10:44:25 +00:00			`allowed_normalize = ('true', 'pred', 'all', None)`
			`assert normalize in allowed_normalize, \`
			`f"Argument average needs to one of the following: {allowed_normalize}"`
			`confmat = confmat.float()`
			`if normalize is not None:`
			`if normalize == 'true':`
			`cm = confmat / confmat.sum(axis=1, keepdim=True)`
			`elif normalize == 'pred':`
			`cm = confmat / confmat.sum(axis=0, keepdim=True)`
			`elif normalize == 'all':`
			`cm = confmat / confmat.sum()`
			`nan_elements = cm[torch.isnan(cm)].nelement()`
			`if nan_elements != 0:`
			`cm[torch.isnan(cm)] = 0`
			`rank_zero_warn(f'{nan_elements} nan values found in confusion matrix have been replaced with zeros.')`
			`return cm`
			`return confmat`


			`def confusion_matrix(`
formatting 6/n: metrics (#5722) * yapf metrics * op 2021-02-01 08:24:07 +00:00			`preds: torch.Tensor,`
			`target: torch.Tensor,`
			`num_classes: int,`
			`normalize: Optional[str] = None,`
			`threshold: float = 0.5`
[Metrics] Confusion matrix class interface (#4348) * docs + precision + recall + f_beta + refactor Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * rebase Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * fixes Co-authored-by: Teddy Koker <teddy.koker@gmail.com> * added missing file * docs * docs * extra import * add confusion matrix * add to docs * add test * pep8 + isort * update tests * move util function * unify functional and class * add to init * remove old implementation * update tests * pep8 * add duplicate * fix doctest * Update pytorch_lightning/metrics/classification/confusion_matrix.py Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> * changelog * bullet point args * bullet docs * bullet docs Co-authored-by: ananyahjha93 <ananya@pytorchlightning.ai> Co-authored-by: Teddy Koker <teddy.koker@gmail.com> Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> Co-authored-by: chaton <thomas@grid.ai> Co-authored-by: Roger Shieh <55400948+s-rog@users.noreply.github.com> Co-authored-by: Rohit Gupta <rohitgr1998@gmail.com> 2020-10-30 10:44:25 +00:00			`) -> torch.Tensor:`
			`"""`
			`Computes the confusion matrix. Works with binary, multiclass, and multilabel data.`
			`Accepts logits from a model output or integer class values in prediction.`
			`Works with multi-dimensional preds and target.`

			If preds and target are the same shape and preds is a float tensor, we use the ``self.threshold`` argument.
			`This is the case for binary and multi-label logits.`

			If preds has an extra dimension as in the case of multi-class scores we perform an argmax on ``dim=1``.

			`Args:`
			preds: (float or long tensor), Either a ``(N, ...)`` tensor with labels or
			``(N, C, ...)`` where C is the number of classes, tensor with logits/probabilities
			target: ``target`` (long tensor), tensor with shape ``(N, ...)`` with ground true labels
			`num_classes: Number of classes in the dataset.`
			`normalize: Normalization mode for confusion matrix. Choose from`

			- ``None``: no normalization (default)
			- ``'true'``: normalization over the targets (most commonly used)
			- ``'pred'``: normalization over the predictions
			- ``'all'``: normalization over the whole matrix

			`threshold:`
			`Threshold value for binary or multi-label logits. default: 0.5`

			`Example:`

			`>>> from pytorch_lightning.metrics.functional import confusion_matrix`
			`>>> target = torch.tensor([1, 1, 0, 0])`
			`>>> preds = torch.tensor([0, 1, 0, 0])`
			`>>> confusion_matrix(preds, target, num_classes=2)`
			`tensor([[2., 0.],`
			`[1., 1.]])`
			`"""`
			`confmat = _confusion_matrix_update(preds, target, num_classes, threshold)`
			`return _confusion_matrix_compute(confmat, normalize)`