# SPDX-License-Identifier: BSD-2-Clause
#
# Copyright (c) 2021, Pl@ntNet
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are met:
#
# 1. Redistributions of source code must retain the above copyright notice, this
#    list of conditions and the following disclaimer.
#
# 2. Redistributions in binary form must reproduce the above copyright notice,
#    this list of conditions and the following disclaimer in the documentation
#    and/or other materials provided with the distribution.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
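
"""Epoch runners: one full pass over the train, validation, or test set,
tracking the loss and top-1, top-k, and average-k accuracy (globally and
per class).
"""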
import torch
import torch.nn.functional as F

from collections import defaultdict

from tqdm import tqdm

from utils import (
    count_correct_topk,
    count_correct_avgk,
    update_correct_per_class,
    update_correct_per_class_topk,
    update_correct_per_class_avgk,
)


def train_epoch(
    model,
    optimizer,
    train_loader,
    criteria,
    loss_train,
    acc_train,
    topk_acc_train,
    list_k,
    n_train,
    use_gpu,
):
    """Run a single training epoch.

    At the end of the epoch, appends the epoch statistics to the lists
    loss_train, acc_train, and topk_acc_train.
    """
    model.train()
    # Initialize accumulators
    loss_epoch_train = 0
    n_correct_train = 0
    # Number of correctly classified examples (in the top-k sense) and
    # top-k accuracy, for each k in list_k
    n_correct_topk_train = defaultdict(int)
    topk_acc_epoch_train = {}

    for batch_idx, (batch_x_train, batch_y_train) in enumerate(
        tqdm(train_loader, desc="train", position=0)
    ):
        if use_gpu:
            batch_x_train, batch_y_train = batch_x_train.cuda(), batch_y_train.cuda()
        optimizer.zero_grad()
        batch_output_train = model(batch_x_train)

        loss_batch_train = criteria(batch_output_train, batch_y_train)
        loss_epoch_train += loss_batch_train.item()
        loss_batch_train.backward()
        optimizer.step()

        # Update accumulators
        with torch.no_grad():
            n_correct_train += torch.sum(
                torch.eq(batch_y_train, torch.argmax(batch_output_train, dim=-1))
            ).item()
            for k in list_k:
                n_correct_topk_train[k] += count_correct_topk(
                    scores=batch_output_train, labels=batch_y_train, k=k
                ).item()

    # At the end of the epoch, average the loss over batches and compute accuracies
    with torch.no_grad():
        # batch_idx is zero-based, so the number of batches is batch_idx + 1
        loss_epoch_train /= batch_idx + 1
        epoch_accuracy_train = n_correct_train / n_train
        for k in list_k:
            topk_acc_epoch_train[k] = n_correct_topk_train[k] / n_train

    loss_train.append(loss_epoch_train)
    acc_train.append(epoch_accuracy_train)
    topk_acc_train.append(topk_acc_epoch_train)

    return loss_epoch_train, epoch_accuracy_train, topk_acc_epoch_train

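
# A minimal sketch (added for illustration) of how train_epoch is typically
# driven from a training script; `n_epochs` and the model/loader setup are
# placeholders, not names defined in this repository:
#
#     criteria = torch.nn.CrossEntropyLoss()
#     optimizer = torch.optim.SGD(model.parameters(), lr=0.01)
#     loss_train, acc_train, topk_acc_train = [], [], []
#     for epoch in range(n_epochs):
#         train_epoch(model, optimizer, train_loader, criteria,
#                     loss_train, acc_train, topk_acc_train,
#                     list_k=[3, 5], n_train=n_train, use_gpu=use_gpu)
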
def val_epoch(
    model,
    val_loader,
    criteria,
    loss_val,
    acc_val,
    topk_acc_val,
    avgk_acc_val,
    class_acc_val,
    list_k,
    dataset_attributes,
    use_gpu,
):
    """Run a single validation epoch pass.

    At the end of the epoch, appends the epoch statistics to the lists
    loss_val, acc_val, topk_acc_val, avgk_acc_val, and class_acc_val, and
    computes the average-k thresholds lmbda_val that test_epoch reuses.
    """
    model.eval()
    with torch.no_grad():
        n_val = dataset_attributes["n_val"]
        # Initialize accumulators
        loss_epoch_val = 0
        n_correct_val = 0
        n_correct_topk_val, n_correct_avgk_val = defaultdict(int), defaultdict(int)
        topk_acc_epoch_val, avgk_acc_epoch_val = {}, {}
        # Average-k threshold for every k in list_k
        lmbda_val = {}
        # Per-class accuracy, plus per-class top-k and average-k accuracy
        # for every k in list_k
        class_acc_dict = {}
        class_acc_dict["class_acc"] = defaultdict(int)
        class_acc_dict["class_topk_acc"], class_acc_dict["class_avgk_acc"] = {}, {}
        for k in list_k:
            (
                class_acc_dict["class_topk_acc"][k],
                class_acc_dict["class_avgk_acc"][k],
            ) = defaultdict(int), defaultdict(int)
        # Estimated probabilities and labels of the whole validation set,
        # kept to compute the thresholds lambda
        list_val_proba = []
        list_val_labels = []

        for batch_idx, (batch_x_val, batch_y_val) in enumerate(
            tqdm(val_loader, desc="val", position=0)
        ):
            if use_gpu:
                batch_x_val, batch_y_val = batch_x_val.cuda(), batch_y_val.cuda()
            batch_output_val = model(batch_x_val)
            # Softmax over the class dimension (passing dim explicitly avoids
            # the PyTorch deprecation warning for implicit dim)
            batch_proba = F.softmax(batch_output_val, dim=-1)
            # Store batch probabilities and labels
            list_val_proba.append(batch_proba)
            list_val_labels.append(batch_y_val)

            loss_batch_val = criteria(batch_output_val, batch_y_val)
            loss_epoch_val += loss_batch_val.item()

            n_correct_val += torch.sum(
                torch.eq(batch_y_val, torch.argmax(batch_output_val, dim=-1))
            ).item()
            update_correct_per_class(
                batch_proba, batch_y_val, class_acc_dict["class_acc"]
            )
            # Update the global and per-class top-k counts
            for k in list_k:
                n_correct_topk_val[k] += count_correct_topk(
                    scores=batch_output_val, labels=batch_y_val, k=k
                ).item()
                update_correct_per_class_topk(
                    batch_proba, batch_y_val, class_acc_dict["class_topk_acc"][k], k
                )

        # Gather probabilities and labels for the entire validation set
        val_probas = torch.cat(list_val_proba)
        val_labels = torch.cat(list_val_labels)

        # Sort all n_val * n_classes probabilities in descending order
        flat_val_probas = torch.flatten(val_probas)
        sorted_probas, _ = torch.sort(flat_val_probas, descending=True)

        for k in list_k:
            # Compute the average-k threshold for every k, then count the
            # number of correctly classified examples in the avg-k sense
            # (globally and for each class). The threshold is the midpoint
            # between the (n_val * k)-th and (n_val * k + 1)-th largest
            # probabilities over the whole validation set.
            lmbda_val[k] = 0.5 * (
                sorted_probas[n_val * k - 1] + sorted_probas[n_val * k]
            )
            n_correct_avgk_val[k] += count_correct_avgk(
                probas=val_probas, labels=val_labels, lmbda=lmbda_val[k]
            ).item()
            update_correct_per_class_avgk(
                val_probas,
                val_labels,
                class_acc_dict["class_avgk_acc"][k],
                lmbda_val[k],
            )
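        # Worked example (illustrative, not from the original source): with
        # n_val = 4 validation images and k = 2, lmbda_val[2] sits halfway
        # between the 8th and 9th largest of the flattened probabilities, so
        # (ignoring ties) exactly n_val * k = 8 probabilities exceed it; that
        # is, the classifier predicts 2 labels per image on average, although
        # any single image may receive more or fewer.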
        # After the full pass over the validation set, average the loss over
        # batches (batch_idx is zero-based, hence the + 1) and compute accuracies
        loss_epoch_val /= batch_idx + 1
        epoch_accuracy_val = n_correct_val / n_val
        # Top-k and average-k accuracy
        for k in list_k:
            topk_acc_epoch_val[k] = n_correct_topk_val[k] / n_val
            avgk_acc_epoch_val[k] = n_correct_avgk_val[k] / n_val
        # Normalize the per-class counts into per-class accuracy, top-k
        # accuracy, and average-k accuracy
        for class_id in class_acc_dict["class_acc"].keys():
            n_class_val = dataset_attributes["class2num_instances"]["val"][class_id]

            class_acc_dict["class_acc"][class_id] = (
                class_acc_dict["class_acc"][class_id] / n_class_val
            )
            for k in list_k:
                class_acc_dict["class_topk_acc"][k][class_id] = (
                    class_acc_dict["class_topk_acc"][k][class_id] / n_class_val
                )
                class_acc_dict["class_avgk_acc"][k][class_id] = (
                    class_acc_dict["class_avgk_acc"][k][class_id] / n_class_val
                )

        # Update the history containers with the current epoch values
        loss_val.append(loss_epoch_val)
        acc_val.append(epoch_accuracy_val)
        topk_acc_val.append(topk_acc_epoch_val)
        avgk_acc_val.append(avgk_acc_epoch_val)
        class_acc_val.append(class_acc_dict)

    return (
        loss_epoch_val,
        epoch_accuracy_val,
        topk_acc_epoch_val,
        avgk_acc_epoch_val,
        lmbda_val,
    )

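
# The thresholds lmbda_val returned by val_epoch above are what test_epoch
# below consumes as `lmbda`. A minimal sketch of the handoff (the variable
# names are placeholders, not names defined in this repository):
#
#     *_, lmbda = val_epoch(model, val_loader, criteria, loss_val, acc_val,
#                           topk_acc_val, avgk_acc_val, class_acc_val,
#                           list_k, dataset_attributes, use_gpu)
#     test_stats = test_epoch(model, test_loader, criteria, list_k, lmbda,
#                             use_gpu, dataset_attributes)
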
def test_epoch(
    model, test_loader, criteria, list_k, lmbda, use_gpu, dataset_attributes
):
    """Run a single pass over the test set.

    Reuses the average-k thresholds `lmbda` estimated on the validation set;
    returns the test loss, accuracy, top-k and average-k accuracies, and the
    per-class accuracy dictionary.
    """
    # Blank line to separate the test progress bar from earlier output
    print()
    model.eval()
    with torch.no_grad():
        n_test = dataset_attributes["n_test"]

        # Initialize accumulators
        loss_epoch_test = 0
        n_correct_test = 0
        topk_acc_epoch_test, avgk_acc_epoch_test = {}, {}
        n_correct_topk_test, n_correct_avgk_test = defaultdict(int), defaultdict(int)

        class_acc_dict = {}
        class_acc_dict["class_acc"] = defaultdict(int)
        class_acc_dict["class_topk_acc"], class_acc_dict["class_avgk_acc"] = {}, {}
        for k in list_k:
            (
                class_acc_dict["class_topk_acc"][k],
                class_acc_dict["class_avgk_acc"][k],
            ) = defaultdict(int), defaultdict(int)

        for batch_idx, (batch_x_test, batch_y_test) in enumerate(
            tqdm(test_loader, desc="test", position=0)
        ):
            if use_gpu:
                batch_x_test, batch_y_test = batch_x_test.cuda(), batch_y_test.cuda()
            batch_output_test = model(batch_x_test)
            batch_proba_test = F.softmax(batch_output_test, dim=-1)
            loss_batch_test = criteria(batch_output_test, batch_y_test)
            loss_epoch_test += loss_batch_test.item()

            n_correct_test += torch.sum(
                torch.eq(batch_y_test, torch.argmax(batch_output_test, dim=-1))
            ).item()
            update_correct_per_class(
                batch_proba_test, batch_y_test, class_acc_dict["class_acc"]
            )
            for k in list_k:
                n_correct_topk_test[k] += count_correct_topk(
                    scores=batch_output_test, labels=batch_y_test, k=k
                ).item()
                n_correct_avgk_test[k] += count_correct_avgk(
                    probas=batch_proba_test, labels=batch_y_test, lmbda=lmbda[k]
                ).item()
                # Pass probabilities here, as val_epoch does; softmax is
                # monotonic, so the top-k sets and counts are unchanged
                update_correct_per_class_topk(
                    batch_proba_test,
                    batch_y_test,
                    class_acc_dict["class_topk_acc"][k],
                    k,
                )
                update_correct_per_class_avgk(
                    batch_proba_test,
                    batch_y_test,
                    class_acc_dict["class_avgk_acc"][k],
                    lmbda[k],
                )

        # After the full pass over the test set, average the loss over batches
        # (batch_idx is zero-based, hence the + 1) and compute accuracies
        loss_epoch_test /= batch_idx + 1
        acc_epoch_test = n_correct_test / n_test
        for k in list_k:
            topk_acc_epoch_test[k] = n_correct_topk_test[k] / n_test
            avgk_acc_epoch_test[k] = n_correct_avgk_test[k] / n_test

        # Normalize the per-class counts into per-class accuracies
        for class_id in class_acc_dict["class_acc"].keys():
            n_class_test = dataset_attributes["class2num_instances"]["test"][class_id]
            class_acc_dict["class_acc"][class_id] = (
                class_acc_dict["class_acc"][class_id] / n_class_test
            )
            for k in list_k:
                class_acc_dict["class_topk_acc"][k][class_id] = (
                    class_acc_dict["class_topk_acc"][k][class_id] / n_class_test
                )
                class_acc_dict["class_avgk_acc"][k][class_id] = (
                    class_acc_dict["class_avgk_acc"][k][class_id] / n_class_test
                )

    return (
        loss_epoch_test,
        acc_epoch_test,
        topk_acc_epoch_test,
        avgk_acc_epoch_test,
        class_acc_dict,
    )
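

# A runnable smoke test (added for illustration, not part of the original
# pipeline). It exercises train_epoch on synthetic data with a linear model;
# everything below is hypothetical setup except train_epoch itself and the
# utils helpers this module already imports.
if __name__ == "__main__":
    from torch.utils.data import DataLoader, TensorDataset

    torch.manual_seed(0)
    n_train, n_classes = 64, 10
    x = torch.randn(n_train, 32)
    y = torch.randint(0, n_classes, (n_train,))
    loader = DataLoader(TensorDataset(x, y), batch_size=16)

    model = torch.nn.Linear(32, n_classes)
    optimizer = torch.optim.SGD(model.parameters(), lr=0.1)
    criteria = torch.nn.CrossEntropyLoss()
    loss_train, acc_train, topk_acc_train = [], [], []

    train_epoch(
        model, optimizer, loader, criteria,
        loss_train, acc_train, topk_acc_train,
        list_k=[3, 5], n_train=n_train, use_gpu=False,
    )
    print(f"loss={loss_train[-1]:.4f} acc={acc_train[-1]:.4f} top-k={topk_acc_train[-1]}")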