# Source snapshot metadata (from the original hosting page):
# 2023-09-11 15:45:31 +08:00
# 82 lines / 3.2 KiB / Python

# -*- coding: utf-8 -*-
# @Author : LG
# from segment_anything import sam_model_registry, SamPredictor
# from segment_anything_hq import sam_model_registry, SamPredictor
# from mobile_sam import sam_model_registry, SamPredictor
import torch
import numpy as np
import timm
import os
class SegAny:
    """Thin wrapper around the Segment-Anything family of predictors.

    The backend package (``segment_anything`` / ``segment_anything_hq`` /
    ``mobile_sam``) and the model type are selected from the checkpoint
    file name, so callers only supply a path.
    """

    @staticmethod
    def _resolve_checkpoint(checkpoint):
        """Map a checkpoint path to ``(backend, model_type)``.

        ``backend`` is one of ``'mobile_sam'``, ``'sam_hq'``, ``'sam'``.
        Substring checks run in the same order as the original elif
        chains, so ambiguous names resolve identically.

        Raises:
            ValueError: if the file name matches no known checkpoint.
        """
        name = os.path.basename(checkpoint)
        if 'mobile_sam' in name:
            return 'mobile_sam', 'vit_t'
        if 'sam_hq_vit' in name:
            for model_type in ('vit_b', 'vit_l', 'vit_h', 'vit_tiny'):
                if model_type in name:
                    return 'sam_hq', model_type
        elif 'sam_vit' in name:
            for model_type in ('vit_b', 'vit_l', 'vit_h'):
                if model_type in name:
                    return 'sam', model_type
        raise ValueError('The checkpoint named {} is not supported.'.format(checkpoint))

    def __init__(self, checkpoint):
        """Load the model matching *checkpoint* onto GPU when available.

        Args:
            checkpoint: path to a SAM / SAM-HQ / MobileSAM weight file;
                the backend is inferred from its base name.
        """
        backend, self.model_type = self._resolve_checkpoint(checkpoint)
        # Import lazily: only the selected backend package needs to be installed.
        if backend == 'mobile_sam':
            from mobile_sam import sam_model_registry, SamPredictor
            print('- mobile sam!')
        elif backend == 'sam_hq':
            from segment_anything_hq import sam_model_registry, SamPredictor
            print('- sam hq!')
        else:
            from segment_anything import sam_model_registry, SamPredictor
            print('- sam!')
        torch.cuda.empty_cache()
        self.device = 'cuda' if torch.cuda.is_available() else 'cpu'
        sam = sam_model_registry[self.model_type](checkpoint=checkpoint)
        sam.to(device=self.device)
        self.predictor_with_point_prompt = SamPredictor(sam)
        # Currently-loaded image; None until set_image is called.
        self.image = None

    def set_image(self, image):
        """Cache *image* and precompute its embedding in the predictor."""
        self.image = image
        self.predictor_with_point_prompt.set_image(image)

    def reset_image(self):
        """Drop the cached image/embedding and release cached GPU memory."""
        self.predictor_with_point_prompt.reset_image()
        self.image = None
        torch.cuda.empty_cache()

    def predict_with_point_prompt(self, input_point, input_label):
        """Segment with point prompts using a two-pass refinement.

        Args:
            input_point: sequence of (x, y) prompt coordinates.
            input_label: matching sequence of labels (1 = foreground,
                0 = background, per the SAM predictor convention —
                assumed from usage, confirm against the backend docs).

        Returns:
            The mask array from the refined single-mask prediction.
        """
        input_point = np.array(input_point)
        input_label = np.array(input_label)
        masks, scores, logits = self.predictor_with_point_prompt.predict(
            point_coords=input_point,
            point_labels=input_label,
            multimask_output=True,
        )
        # Feed the best-scoring first-pass logits back as mask_input to
        # refine into a single final mask.
        mask_input = logits[np.argmax(scores), :, :]
        masks, _, _ = self.predictor_with_point_prompt.predict(
            point_coords=input_point,
            point_labels=input_label,
            mask_input=mask_input[None, :, :],
            multimask_output=False,
        )
        torch.cuda.empty_cache()
        return masks