# omnidet/train_distance_semantic.py

"""
Distance estimation and Semantic segmentation training for OmniDet.

# author: Varun Ravi Kumar <rvarun7777@gmail.com>

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; Authors provide no warranty with the software
and are not liable for anything.
"""

import time

import torch
from colorama import Fore, Style

from losses.mtl_losses import UncertaintyLoss
from models.semantic_decoder import SemanticDecoder
from train_distance import DistanceModelBase
from train_semantic import SemanticModel, SemanticInit


class DistanceSemanticModelBase(DistanceModelBase, SemanticInit):
    """Joint distance-estimation and semantic-segmentation trainer.

    Adds a ``SemanticDecoder`` (stored as ``self.models["semantic"]``) on top of
    the distance model and provides the combined training loop, the semantic
    validation pass and best-IoU checkpointing.

    The multi-task loss module ``self.mtl_loss`` used by
    :meth:`distance_semantic_train` is not created in this class; it has to be
    supplied by a subclass (``DistanceSemanticModel`` in this file does so).
    """

    def __init__(self, args):
        """Create the semantic decoder and register its parameters for training.

        Args:
            args: experiment configuration. This method reads
                ``semantic_num_classes`` and ``use_multiple_gpu``.
        """
        super().__init__(args)

        self.models["semantic"] = SemanticDecoder(self.encoder_channels,
                                                  n_classes=args.semantic_num_classes).to(self.device)
        # Collect the parameters before the optional DataParallel wrapping below.
        self.parameters_to_train += list(self.models["semantic"].parameters())

        if args.use_multiple_gpu:
            self.models["semantic"] = torch.nn.DataParallel(self.models["semantic"])

    def distance_semantic_train(self):
        """Trainer function for distance and semantic prediction.

        Runs ``self.args.epochs`` epochs over ``self.train_loader``. For every
        batch it computes the task losses, combines them with ``self.mtl_loss``
        and performs one optimizer step. Statistics are logged every
        ``log_frequency`` batches, semantic validation runs every
        ``val_frequency`` global steps, the LR scheduler is stepped once per
        epoch and the model is saved every ``save_frequency`` epochs.
        """

        # NOTE: the epoch counter is deliberately an attribute; it is read by
        # save_best_semantic_weights() while the loop is running.
        for self.epoch in range(self.args.epochs):
            # switch to train mode
            self.set_train()
            data_loading_time = 0
            gpu_time = 0
            before_op_time = time.time()

            # Iterate over the training batches, timing data loading and compute separately
            for batch_idx, inputs in enumerate(self.train_loader):
                data_loading_time += (time.time() - before_op_time)
                before_op_time = time.time()
                self.inputs_to_device(inputs)

                # -- DISTANCE AND SEMANTIC SEGMENTATION MODEL PREDICTIONS AND LOSS CALCULATIONS --
                _, outputs, losses = self.distance_semantic_loss_predictions(inputs)

                # -- MTL LOSS --
                losses["mtl_loss"] = self.mtl_loss(losses)

                # -- COMPUTE GRADIENT AND DO OPTIMIZER STEP --
                self.optimizer.zero_grad()
                # Reduce to a scalar before back-propagating: the MTL loss can be
                # non-scalar (e.g. values gathered from several replicas when the
                # loss module is wrapped in DataParallel), and backward() without
                # an explicit gradient only accepts single-element tensors.
                # For an already scalar loss, mean() is a no-op.
                losses["mtl_loss"].mean().backward()
                self.optimizer.step()

                duration = time.time() - before_op_time
                gpu_time += duration

                if batch_idx % self.args.log_frequency == 0:
                    self.log_time(batch_idx, duration, losses["mtl_loss"].mean().cpu().data,
                                  data_loading_time, gpu_time)
                    self.distance_statistics("train", inputs, outputs, losses)
                    SemanticModel.semantic_statistics(self, "train", inputs, outputs, losses)
                    # Timers accumulate between two log events only
                    data_loading_time = 0
                    gpu_time = 0

                if self.step % self.args.val_frequency == 0:
                    # -- SAVE SEMANTIC MODEL WITH BEST WEIGHTS BASED ON VALIDATION IoU --
                    self.save_best_semantic_weights()

                self.step += 1
                before_op_time = time.time()

            self.lr_scheduler.step()

            if (self.epoch + 1) % self.args.save_frequency == 0:
                self.save_model()

        print("Training complete!")

    def distance_semantic_loss_predictions(self, inputs):
        """Run the semantic, distance and pose predictions and compute their losses.

        Args:
            inputs: batch dictionary; this method itself reads
                ``inputs["semantic_labels", 0, 0]`` and forwards the whole
                dictionary to the prediction and loss helpers.

        Returns:
            Tuple ``(features, outputs, losses)`` where ``features`` is the second
            value returned by ``predict_distances``, ``outputs`` merges the
            semantic, distance, pose and photometric outputs, and ``losses``
            holds ``"semantic_loss"`` plus everything returned by
            ``photometric_losses``.
        """
        losses = {}
        # -- SEMANTIC SEGMENTATION --
        outputs, features = self.predict_semantic_seg(inputs)
        # -- SEMANTIC SEGMENTATION LOSS --
        losses["semantic_loss"] = self.semantic_criterion(outputs["semantic", 0],
                                                          inputs["semantic_labels", 0, 0])
        if self.args.use_multiple_gpu:
            # Add a leading dimension in the multi-GPU setting
            # (presumably so DataParallel can gather the value - TODO confirm).
            losses["semantic_loss"] = losses["semantic_loss"].unsqueeze(0)

        # -- DISTANCE ESTIMATION --
        # The encoder features computed for the semantic head are handed over to the distance head.
        distance_outputs, features = self.predict_distances(inputs, features=features)
        outputs.update(distance_outputs)
        # -- POSE ESTIMATION --
        outputs.update(self.predict_poses(inputs, features))
        # -- PHOTOMETRIC LOSSES --
        distance_losses, distance_outputs = self.photometric_losses(inputs, outputs)
        losses.update(distance_losses)
        outputs.update(distance_outputs)

        return features, outputs, losses

    def predict_semantic_seg(self, inputs):
        """Encode ``inputs["color_aug", 0, 0]`` and decode the semantic prediction.

        Args:
            inputs: batch dictionary containing the key ``("color_aug", 0, 0)``.

        Returns:
            Tuple ``(outputs, features)``: the dictionary produced by the semantic
            decoder and the raw encoder output.
        """
        outputs = {}
        features = self.models["encoder"](inputs["color_aug", 0, 0])
        if self.args.pose_model_type == "shared":
            # With a "shared" pose model only the first entry of the encoder output is decoded
            # (presumably the encoder then returns one feature set per frame - TODO confirm).
            outputs.update(self.models["semantic"](features[0]))
        else:
            outputs.update(self.models["semantic"](features))
        return outputs, features

    @torch.no_grad()
    def semantic_val(self):
        """Validate the semantic model.

        Iterates over ``self.val_loader`` in eval mode, feeds the per-pixel
        class predictions into ``self.metric`` and logs the "val" statistics.
        The model is switched back to train mode before returning.

        Returns:
            The semantic outputs of the last validation batch, extended with
            ``"class_iou"`` and ``"mean_iou"`` taken from ``self.metric.value()``.

        Note:
            ``self.val_loader`` is assumed to yield at least one batch; the code
            after the loop uses the variables bound inside it.
        """
        self.set_eval()
        losses = {}
        for inputs in self.val_loader:
            self.inputs_to_device(inputs)

            outputs, _ = self.predict_semantic_seg(inputs)
            # Overwritten on every iteration: only the last batch's loss reaches the statistics call
            losses["semantic_loss"] = self.semantic_criterion(outputs["semantic", 0],
                                                              inputs["semantic_labels", 0, 0])
            if self.args.use_multiple_gpu:
                losses["semantic_loss"] = losses["semantic_loss"].unsqueeze(0)

            # Index of the maximum along dim 1 is used as the predicted class
            _, predictions = torch.max(outputs["semantic", 0].data, 1)
            self.metric.add(predictions, inputs["semantic_labels", 0, 0])

        outputs["class_iou"], outputs["mean_iou"] = self.metric.value()
        # Compute stats for the tensorboard
        SemanticModel.semantic_statistics(self, "val", inputs, outputs, losses)
        # Clear the accumulated metric state so the next validation starts fresh
        self.metric.reset()
        del inputs, losses
        self.set_train()
        return outputs

    def save_best_semantic_weights(self):
        """Run semantic validation and checkpoint the model when the mean IoU does not regress.

        ``self.best_semantic_iou`` is updated whenever the validation mean IoU
        is greater than or equal to it. The weights themselves are only
        written once ``self.epoch`` is larger than 50.
        """
        # Semantic seg. validation (triggered by the training loop) and save model on improvements.
        val_metrics = self.semantic_val()
        print(f"{Fore.RED}epoch {self.epoch:>3} | Semantic IoU: {val_metrics['mean_iou']:.3f}{Style.RESET_ALL}")
        if val_metrics["mean_iou"] >= self.best_semantic_iou:
            # NOTE(review): this message is printed even when the epoch guard below skips the actual save.
            print(f"{Fore.RED}=> Saving semantic segmentation model weights with mean_iou of"
                  f" {val_metrics['mean_iou']:.3f} at step {self.step} on {self.epoch} epoch.{Style.RESET_ALL}")
            self.best_semantic_iou = val_metrics["mean_iou"]
            if self.epoch > 50:  # Weights are quite large! Sometimes, life is a compromise.
                self.save_model()

class DistanceSemanticModel(DistanceSemanticModelBase):
    """Concrete distance + semantic trainer that supplies the multi-task loss module."""

    def __init__(self, args):
        """Create the MTL loss, register its parameters and finish the trainer setup.

        Args:
            args: experiment configuration; ``use_multiple_gpu`` is read here and
                the task list is taken from ``self.args.train``.
        """
        super().__init__(args)

        # Build the loss module on the training device and make its parameters trainable
        mtl_criterion = UncertaintyLoss(tasks=self.args.train).to(self.device)
        self.mtl_loss = mtl_criterion
        self.parameters_to_train += list(mtl_criterion.parameters())

        # Wrap for multi-GPU use only after the parameters have been collected
        if args.use_multiple_gpu:
            self.mtl_loss = torch.nn.DataParallel(mtl_criterion)

        # Optimizer setup runs after the loss parameters were appended
        # (presumably so that the optimizer picks them up - verify in configure_optimizers).
        self.configure_optimizers()
        self.pre_init()