Spaces:

JasonSmithSO
/

FooocusEnhanced

Configuration error

App Files Files Community

FooocusEnhanced / custom_controlnet_aux /sam /__init__.py

JasonSmithSO

Upload 777 files

0034848 verified 4 months ago

raw

history blame contribute delete

2.97 kB

	# Copyright (c) Meta Platforms, Inc. and affiliates.
	# All rights reserved.

	# This source code is licensed under the license found in the
	# LICENSE file in the root directory of this source tree.

	import os
	import warnings
	from typing import Union

	import cv2
	import numpy as np
	import torch
	from PIL import Image

	from custom_controlnet_aux.util import HWC3, common_input_validate, resize_image_with_pad, custom_hf_download, SAM_MODEL_NAME
	from .automatic_mask_generator import SamAutomaticMaskGenerator
	from .build_sam import sam_model_registry


	class SamDetector:
	def __init__(self, mask_generator: SamAutomaticMaskGenerator):
	self.mask_generator = mask_generator

	@classmethod
	def from_pretrained(cls, pretrained_model_or_path=SAM_MODEL_NAME, model_type="vit_t", filename="mobile_sam.pt", subfolder=None):
	"""
	Possible model_type : vit_h, vit_l, vit_b, vit_t
	download weights from https://github.com/facebookresearch/segment-anything
	"""
	model_path = custom_hf_download(pretrained_model_or_path, filename)

	sam = sam_model_registry[model_type](checkpoint=model_path)
	mask_generator = SamAutomaticMaskGenerator(sam)

	return cls(mask_generator)

	def to(self, device):
	model = self.mask_generator.predictor.model.to(device)
	model.train(False) #Update attention_bias in https://github.com/Fannovel16/comfyui_controlnet_aux/blob/main/src/custom_controlnet_aux/segment_anything/modeling/tiny_vit_sam.py#L251
	self.mask_generator = SamAutomaticMaskGenerator(model)
	return self


	def show_anns(self, anns):
	if len(anns) == 0:
	return
	sorted_anns = sorted(anns, key=(lambda x: x['area']), reverse=True)
	h, w = anns[0]['segmentation'].shape
	final_img = Image.fromarray(np.zeros((h, w, 3), dtype=np.uint8), mode="RGB")
	for ann in sorted_anns:
	m = ann['segmentation']
	img = np.empty((m.shape[0], m.shape[1], 3), dtype=np.uint8)
	for i in range(3):
	img[:,:,i] = np.random.randint(255, dtype=np.uint8)
	final_img.paste(Image.fromarray(img, mode="RGB"), (0, 0), Image.fromarray(np.uint8(m*255)))

	return np.array(final_img, dtype=np.uint8)

	def __call__(self, input_image: Union[np.ndarray, Image.Image]=None, detect_resolution=512, output_type="pil", upscale_method="INTER_CUBIC", **kwargs) -> Image.Image:
	input_image, output_type = common_input_validate(input_image, output_type, **kwargs)
	input_image, remove_pad = resize_image_with_pad(input_image, detect_resolution, upscale_method)

	# Generate Masks
	masks = self.mask_generator.generate(input_image)
	# Create map
	map = self.show_anns(masks)

	detected_map = HWC3(remove_pad(map))

	if output_type == "pil":
	detected_map = Image.fromarray(detected_map)

	return detected_map