Source code for deepdisc.astrodet.detectron

import datetime
import json
import logging
import os
import sys
import time

import cv2
import detectron2
import numpy as np
from astropy.io import fits
from detectron2.utils.logger import setup_logger

setup_logger()
from typing import Dict, List, Optional, Tuple

import detectron2.data as data
import detectron2.data.transforms as T

import torch
from detectron2.data import build_detection_train_loader
from detectron2.data.transforms import Augmentation, Transform
from detectron2.engine import HookBase
from detectron2.engine.hooks import LRScheduler
from detectron2.layers import Conv2d, ShapeSpec, cat, get_norm, nonzero_tuple
from detectron2.modeling import ROI_HEADS_REGISTRY
from detectron2.modeling.matcher import Matcher
from detectron2.modeling.poolers import ROIPooler
from detectron2.modeling.roi_heads import CascadeROIHeads, StandardROIHeads
from detectron2.structures import Boxes, BoxMode, ImageList, Instances, pairwise_iou
from detectron2.utils import comm
from detectron2.utils.collect_env import collect_env_info
from detectron2.utils.env import seed_all_rng
from detectron2.utils.events import (
    CommonMetricPrinter,
    EventStorage,
    JSONWriter,
    TensorboardXWriter,
    get_event_storage,
)
from detectron2.utils.file_io import PathManager
from detectron2.utils.logger import log_every_n_seconds, setup_logger
from detectron2.utils.visualizer import Visualizer
from fvcore.common.param_scheduler import ParamScheduler
from fvcore.transforms.transform import Transform, TransformList
from torch import nn
from torch.distributions.beta import Beta
from torch.distributions.categorical import Categorical
from torch.distributions.independent import Independent
from torch.distributions.mixture_same_family import MixtureSameFamily
from torch.distributions.normal import Normal
from torch.nn import functional as F



[docs]
def plot_stretch_Q(
    dataset_dicts,
    astro_metadata,
    num=0,
    stretches=[0.01, 0.1, 0.5, 1],
    Qs=[1, 10, 5, 100],
    ceil_percentile=99.5,
):
    """
    Plots different normalizations of your image using the stretch, Q parameters.

    Parameters
    ----------
    dataset_dicts : dict
        detectron dataset dictionary
    num : int
        Dataset number/index to use
    stretches : array
        List of stretch params you want to permutate through to find optimal image normalization.
        Default is [0.01, 0.1, 0.5, 1]
    Qs : array
        List of Q params you want to permutate through to find optimal image normalization.
        Default is [1, 10, 5, 100]

    Code adapted from:
        https://pmelchior.github.io/scarlet/tutorials/display.html

    Returns
    -------
    fig : Figure object

    """

    d = dataset_dicts[num]

    fig, ax = plt.subplots(len(stretches), len(Qs), figsize=(9, 9))
    for i, stretch in enumerate(stretches):
        for j, Q in enumerate(Qs):
            img = read_image(
                d,
                normalize="lupton",
                stretch=stretch,
                Q=Q,
                ceil_percentile=ceil_percentile,
            )
            # Scale the RGB channels for the image
            visualizer = Visualizer(img, metadata=astro_metadata)
            out = visualizer.draw_dataset_dict(d)
            ax[i][j].imshow(out.get_image(), origin="lower")
            ax[i][j].set_title("Stretch {}, Q {}".format(stretch, Q), fontsize=10)
            ax[i][j].axis("off")

    return fig



"""Note:SaveHook is in charge of saving the trained model"""


[docs]
class SaveHook(HookBase):

    """
    This Hook saves the model during training

    Parameters
    ----------
    save_period: int
        How many iterations to run before a checkpoint is saved
    """
    

[docs]
    output_name = "model_temp"


    
    def __init__(self, save_period):

[docs]
        self._period = save_period



[docs]
    def set_output_name(self, name):
        self.output_name = name


    #def after_train(self):
    #    self.trainer.checkpointer.save(self.output_name)  # Note: Set the name of the output model here


[docs]
    def after_step(self):
        next_iter = self.trainer.iter + 1
        is_final = next_iter == self.trainer.max_iter
        if is_final or (self._period > 0 and next_iter % self._period == 0):  # or (next_iter == 1):
            print("saving", self.output_name)
            self.trainer.checkpointer.save(f'{self.output_name}_{next_iter//self._period}')
            if is_final:
                self.trainer.checkpointer.save(self.output_name)



        
#

[docs]
class LossEvalHook(HookBase):

    """
    Validation loss code adopted from https://gist.github.com/ortegatron/c0dad15e49c2b74de8bb09a5615d9f6b

    Parameters
    ----------
    eval_period: int
        How many iterations to run before validation loss is calculated
    model: torch.NN.module
        The model being trained
    data_loader: detectron2 DataLoader
        The dataloader that loads in the evaluation dataset
    """

    def __init__(self, eval_period, model, data_loader):

[docs]
        self._model = model


[docs]
        self._period = eval_period


[docs]
        self._data_loader = data_loader



[docs]
    def _do_loss_eval(self):
        # Copying inference_on_dataset from evaluator.py
        total = len(self._data_loader)
        num_warmup = min(5, total - 1)

        start_time = time.perf_counter()
        total_compute_time = 0
        losses = []
        losses_dicts =[]
        with torch.no_grad():
            for idx, inputs in enumerate(self._data_loader):
                if idx == num_warmup:
                    start_time = time.perf_counter()
                    total_compute_time = 0
                start_compute_time = time.perf_counter()
                if torch.cuda.is_available():
                    torch.cuda.synchronize()
                total_compute_time += time.perf_counter() - start_compute_time
                iters_after_start = idx + 1 - num_warmup * int(idx >= num_warmup)
                seconds_per_img = total_compute_time / iters_after_start
                if idx >= num_warmup * 2 or seconds_per_img > 5:
                    total_seconds_per_img = (time.perf_counter() - start_time) / iters_after_start
                    eta = datetime.timedelta(seconds=int(total_seconds_per_img * (total - idx - 1)))
                    log_every_n_seconds(
                        logging.INFO,
                        "Loss on Validation  done {}/{}. {:.4f} s / img. ETA={}".format(
                            idx + 1, total, seconds_per_img, str(eta)
                        ),
                        n=5,
                    )
                loss_batch, metrics_dict = self._get_loss(inputs)
                losses.append(loss_batch)
                losses_dicts.append(metrics_dict)
        mean_loss = np.mean(losses)
        averaged_losses_dict ={}
        for d in losses_dicts:
            for key, value in d.items():
                if key not in averaged_losses_dict:
                    averaged_losses_dict[key] = [0, 0]  # [sum, count]
                averaged_losses_dict[key][0] += value
                averaged_losses_dict[key][1] += 1
        averaged_losses_dict = {key: total / count for key, (total, count) in averaged_losses_dict.items()}
        # print('validation_loss', mean_loss)
        self.trainer.storage.put_scalar("validation_loss", mean_loss)
        self.trainer.add_val_loss(mean_loss)
        self.trainer.valloss = mean_loss
        
        self.trainer.add_val_loss_dict(averaged_losses_dict)
        self.trainer.vallossdict = averaged_losses_dict

        comm.synchronize()
        return losses



[docs]
    def _get_loss(self, data):
        # How loss is calculated on train_loop
        metrics_dict = self._model(data)
        metrics_dict = {
            k: v.detach().cpu().item() if isinstance(v, torch.Tensor) else float(v)
            for k, v in metrics_dict.items()
        }
        total_losses_reduced = sum(loss for loss in metrics_dict.values())
        return total_losses_reduced, metrics_dict



[docs]
    def after_step(self):
        next_iter = self.trainer.iter + 1
        is_final = next_iter == self.trainer.max_iter
        if is_final or (self._period > 0 and next_iter % self._period == 0):  # or (next_iter == 1):
            self._do_loss_eval()
        self.trainer.storage.put_scalars(timetest=12)





[docs]
class CustomLRScheduler(HookBase):
    """
    A hook which executes a torch builtin LR scheduler and summarizes the LR.
    It is executed after every iteration.

    Parameters
    ----------
    optimizer: torch optimizer
        the training optimizer
    scheduler: torch scheduler
        The learning rate scheduler

    """

    def __init__(self, optimizer=None, scheduler=None):
        """
        Args:
            optimizer (torch.optim.Optimizer):
            scheduler (torch.optim.LRScheduler or fvcore.common.param_scheduler.ParamScheduler):
                if a :class:`ParamScheduler` object, it defines the multiplier over the base LR
                in the optimizer.

        If any argument is not given, will try to obtain it from the trainer.
        """

[docs]
        self._optimizer = optimizer


[docs]
        self._scheduler = scheduler



[docs]
    def before_train(self):
        # print(self.scheduler)
        self._optimizer = self._optimizer or self.trainer.optimizer
        print(self.scheduler)
        if isinstance(self.scheduler, ParamScheduler):
            self._scheduler = LRMultiplier(
                self._optimizer,
                self.scheduler,
                self.trainer.max_iter,
                last_iter=self.trainer.iter - 1,
            )
        self._best_param_group_id = LRScheduler.get_best_param_group_id(self._optimizer)


    @staticmethod

[docs]
    def get_best_param_group_id(optimizer):
        # NOTE: some heuristics on what LR to summarize
        # summarize the param group with most parameters
        largest_group = max(len(g["params"]) for g in optimizer.param_groups)

        if largest_group == 1:
            # If all groups have one parameter,
            # then find the most common initial LR, and use it for summary
            lr_count = Counter([g["lr"] for g in optimizer.param_groups])
            lr = lr_count.most_common()[0][0]
            for i, g in enumerate(optimizer.param_groups):
                if g["lr"] == lr:
                    return i
        else:
            for i, g in enumerate(optimizer.param_groups):
                if len(g["params"]) == largest_group:
                    return i



[docs]
    def after_step(self):
        lr = self._optimizer.param_groups[self._best_param_group_id]["lr"]
        self.trainer.storage.put_scalar("lr", lr, smoothing_hint=False)
        self.scheduler.step()


    @property

[docs]
    def scheduler(self):
        return self._scheduler or self.trainer.scheduler



[docs]
    def state_dict(self):
        if isinstance(self.scheduler, _LRScheduler):
            return self.scheduler.state_dict()
        return {}



[docs]
    def load_state_dict(self, state_dict):
        if isinstance(self.scheduler, _LRScheduler):
            logger = logging.getLogger(__name__)
            logger.info("Loading scheduler from state_dict ...")
            self.scheduler.load_state_dict(state_dict)





[docs]
class GenericWrapperTransform(Transform):
    """
    Code from Deshwal on Stack Overflow
    Generic wrapper for any transform (for color transform only. You can give functionality to apply_coods, apply_segmentation too)
    """

    def __init__(self, custom_function):
        """
        Args:
            custom_function (Callable): operation to be applied to the image which takes in an ndarray and returns an ndarray.
        """
        if not callable(custom_function):
            raise ValueError("'custom_function' should be callable")

        super().__init__()
        self._set_attributes(locals())


[docs]
    def apply_image(self, img):
        """
        apply transformation to image array based on the `custom_function`
        """
        return self.custom_function(img)



[docs]
    def apply_coords(self, coords):
        """
        Apply transformations to Bounding Box Coordinates. Currently is won't do anything but we can change this based on our use case
        """
        return coords



[docs]
    def inverse(self):
        return T.NoOpTransform()



[docs]
    def apply_segmentation(self, segmentation):
        """
        Apply transformations to segmentation. currently is won't do anything but we can change this based on our use case
        """
        return segmentation





[docs]
class CustomAug(Augmentation):
    """
    Given a probability and a custom function, return a GenericWrapperTransform object whose `apply_image`
    will be called to perform augmentation
    """

    def __init__(self, custom_function, prob=1.0):
        """
        Args:
            custom_op: Operation to use. Must be a function takes an ndarray and returns an ndarray
            prob (float): probability of applying the function
        """
        super().__init__()
        self._init(locals())


[docs]
    def get_transform(self, image):
        """
        Based on probability, choose whether you want to apply the given function or not
        """
        do = self._rand_range() < self.prob
        if do:
            return GenericWrapperTransform(self.custom_function)
        else:
            return (
                T.NoOpTransform()
            )  # it returns a Transform which just returns the original Image array only


        


[docs]
class ShapeAug(Augmentation):
    """
    Given a probability and a custom function, return a GenericWrapperTransform object whose `apply_image`
    will be called to perform augmentation
    """

    def __init__(self, custom_function, prob=1.0):
        """
        Args:
            custom_op: Operation to use. Must be a function takes an ndarray and returns an ndarray
            prob (float): probability of applying the function
        """
        super().__init__()
        self._init(locals())


[docs]
    def get_transform(self, image, instances):
        """
        Based on probability, choose whether you want to apply the given function or not
        """
        do = self._rand_range() < self.prob
        if do:
            return GenericWrapperTransform(self.custom_function)
        else:
            return (
                T.NoOpTransform()
            )  # it returns a Transform which just returns the original Image array only





[docs]
class KRandomAugmentationList(Augmentation):
    """
    Select and Apply "K" augmentations in "RANDOM" order with "Every"  __call__ method invoke
    """

    def __init__(self, augs, k: int = -1, cropaug=None):
        """
        Args:
            augs: list of [Augmentation or Transform]
            k: Number of augment to use from the given list in range [1,len_augs].
            If None, use all. If it is -1, generate K randomly between [1,len_augs]
        """
        super().__init__()

[docs]
        self.max_range = len(augs)


[docs]
        self.k = k


[docs]
        self.augs = augs  # set augs to use as fixed if we have to use same augs everytime


[docs]
        self.cropaug = cropaug



[docs]
    def _setup_augs(self, augs, k: int):
        """
        Setup the argument list. Generates the list of argument to use from the given list
        args:
            augs: list of [Augmentation or Transform])
            k: Number of augment to use from the given list in range [1,len_augs].
            If False, use all. If it is -1, generate K randomly between [1,len_augs]
        """
        if k == -1:  # Generate a random number
            k = np.random.randint(1, len(augs) + 1)

        elif k is None:  # use all
            k = self.max_range

        temp = np.random.choice(augs, k, replace=False)  # get k augments randomly
        augl = [_transform_to_aug(x) for x in temp]
        if self.cropaug is None:
            pass
        else:
            augl.insert(-1, self.cropaug)

        return augl



[docs]
    def __call__(self, aug_input) -> Transform:
        tfms = []

        for x in self._setup_augs(self.augs, self.k):  # generate auguments to use randomly on the fly
            tfm = x(aug_input)
            tfms.append(tfm)
        return TransformList(tfms)



[docs]
    def __repr__(self):
        msgs = [str(x) for x in self.augs]
        return "AugmentationList[{}]".format(", ".join(msgs))



[docs]
    __str__ = __repr__




## Added for importing

[docs]
class _TransformToAug(Augmentation):
    def __init__(self, tfm: Transform):

[docs]
        self.tfm = tfm



[docs]
    def get_transform(self, *args):
        return self.tfm



[docs]
    def __repr__(self):
        return repr(self.tfm)



[docs]
    __str__ = __repr__





[docs]
def _transform_to_aug(tfm_or_aug):
    """
    Wrap Transform into Augmentation.
    Private, used internally to implement custom augmentations.
    """
    assert isinstance(tfm_or_aug, (Transform, Augmentation)), tfm_or_aug
    if isinstance(tfm_or_aug, Augmentation):
        return tfm_or_aug
    else:
        return _TransformToAug(tfm_or_aug)