SyncDreamer

Runtime error

App Files Files Community

liuyuan-pal committed on Sep 14, 2023

Commit

df916e6

1 Parent(s): a14768e

update

Browse files

Files changed (11) hide show

.gitattributes +1 -0
app.py +26 -4
detection_test.py +30 -9
hf_demo/examples/basket.png +0 -0
hf_demo/examples/cat.png +3 -0
hf_demo/examples/crab.png +3 -0
hf_demo/examples/elephant.png +3 -0
hf_demo/examples/flower.png +3 -0
hf_demo/examples/forest.png +3 -0
hf_demo/examples/monkey.png +0 -0
hf_demo/examples/teapot.png +3 -0

.gitattributes CHANGED Viewed

@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 ckpt/* filter=lfs diff=lfs merge=lfs -text

 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 ckpt/* filter=lfs diff=lfs merge=lfs -text
+hf_demo/examples/* filter=lfs diff=lfs merge=lfs -text

app.py CHANGED Viewed

@@ -7,7 +7,6 @@ import torch
 import os
 import fire
 from omegaconf import OmegaConf
-from rembg import remove
 from ldm.util import add_margin, instantiate_from_config
 from sam_utils import sam_init, sam_out_nosave
@@ -39,6 +38,28 @@ _USER_GUIDE3 = "Generated multiview images are shown below!"
 deployed = True
 def resize_inputs(image_input, crop_size):
     alpha_np = np.asarray(image_input)[:, :, 3]
     coords = np.stack(np.nonzero(alpha_np), 1)[:, (1, 0)]
@@ -95,9 +116,9 @@ def white_background(img):
     rgb = (rgb*255).astype(np.uint8)
     return Image.fromarray(rgb)
-def sam_predict(predictor, raw_im):
     raw_im.thumbnail([512, 512], Image.Resampling.LANCZOS)
-    image_nobg = remove(raw_im.convert('RGBA'), alpha_matting=True)
     arr = np.asarray(image_nobg)[:, :, -1]
     x_nonzero = np.nonzero(arr.sum(axis=0))
     y_nonzero = np.nonzero(arr.sum(axis=1))
@@ -140,6 +161,7 @@ def run_demo():
     # init sam model
     mask_predictor = sam_init()
     # with open('instructions_12345.md', 'r') as f:
     #     article = f.read()
@@ -192,7 +214,7 @@ def run_demo():
         output_block = gr.Image(type='pil', image_mode='RGB', label="Outputs of SyncDreamer", height=256, interactive=False)
         update_guide = lambda GUIDE_TEXT: gr.update(value=GUIDE_TEXT)
-        image_block.change(fn=partial(sam_predict, mask_predictor), inputs=[image_block], outputs=[sam_block], queue=False)\
                    .success(fn=partial(update_guide, _USER_GUIDE1), outputs=[guide_text], queue=False)
         crop_size_slider.change(fn=resize_inputs, inputs=[sam_block, crop_size_slider], outputs=[input_block], queue=False)\

 import os
 import fire
 from omegaconf import OmegaConf
 from ldm.util import add_margin, instantiate_from_config
 from sam_utils import sam_init, sam_out_nosave
 deployed = True
+class BackgroundRemoval:
+    def __init__(self, device='cuda'):
+        from carvekit.api.high import HiInterface
+        self.interface = HiInterface(
+            object_type="object",  # Can be "object" or "hairs-like".
+            batch_size_seg=5,
+            batch_size_matting=1,
+            device=device,
+            seg_mask_size=640,  # Use 640 for Tracer B7 and 320 for U2Net
+            matting_mask_size=2048,
+            trimap_prob_threshold=231,
+            trimap_dilation=30,
+            trimap_erosion_iters=5,
+            fp16=True,
+        )
+    @torch.no_grad()
+    def __call__(self, image):
+        # image: [H, W, 3] array in [0, 255].
+        image = self.interface([image])[0]
+        return image
 def resize_inputs(image_input, crop_size):
     alpha_np = np.asarray(image_input)[:, :, 3]
     coords = np.stack(np.nonzero(alpha_np), 1)[:, (1, 0)]
     rgb = (rgb*255).astype(np.uint8)
     return Image.fromarray(rgb)
+def sam_predict(predictor, removal, raw_im):
     raw_im.thumbnail([512, 512], Image.Resampling.LANCZOS)
+    image_nobg = removal(raw_im.convert('RGB'))
     arr = np.asarray(image_nobg)[:, :, -1]
     x_nonzero = np.nonzero(arr.sum(axis=0))
     y_nonzero = np.nonzero(arr.sum(axis=1))
     # init sam model
     mask_predictor = sam_init()
+    removal = BackgroundRemoval()
     # with open('instructions_12345.md', 'r') as f:
     #     article = f.read()
         output_block = gr.Image(type='pil', image_mode='RGB', label="Outputs of SyncDreamer", height=256, interactive=False)
         update_guide = lambda GUIDE_TEXT: gr.update(value=GUIDE_TEXT)
+        image_block.change(fn=partial(sam_predict, mask_predictor, removal), inputs=[image_block], outputs=[sam_block], queue=False)\
                    .success(fn=partial(update_guide, _USER_GUIDE1), outputs=[guide_text], queue=False)
         crop_size_slider.change(fn=resize_inputs, inputs=[sam_block, crop_size_slider], outputs=[input_block], queue=False)\

detection_test.py CHANGED Viewed

@@ -1,18 +1,39 @@
 import numpy as np
 from PIL import Image
 from skimage.io import imsave
-from app import white_background
-from ldm.util import add_margin
 from sam_utils import sam_out_nosave, sam_init
-from rembg import remove
-raw_im = Image.open('hf_demo/examples/basket.png')
 predictor = sam_init()
 raw_im.thumbnail([512, 512], Image.Resampling.LANCZOS)
 width, height = raw_im.size
-image_nobg = remove(raw_im.convert('RGBA'), alpha_matting=True)
 arr = np.asarray(image_nobg)[:, :, -1]
 x_nonzero = np.nonzero(arr.sum(axis=0))
 y_nonzero = np.nonzero(arr.sum(axis=1))
@@ -20,16 +41,16 @@ x_min = int(x_nonzero[0].min())
 y_min = int(y_nonzero[0].min())
 x_max = int(x_nonzero[0].max())
 y_max = int(y_nonzero[0].max())
-# image_nobg.save('./nobg.png')
 image_nobg.thumbnail([512, 512], Image.Resampling.LANCZOS)
 image_sam = sam_out_nosave(predictor, image_nobg.convert("RGB"), (x_min, y_min, x_max, y_max))
-# imsave('./mask.png', np.asarray(image_sam)[:,:,3]*255)
 image_sam = np.asarray(image_sam, np.float32) / 255
 out_mask = image_sam[:, :, 3:]
 out_rgb = image_sam[:, :, :3] * out_mask + 1 - out_mask
 out_img = (np.concatenate([out_rgb, out_mask], 2) * 255).astype(np.uint8)
 image_sam = Image.fromarray(out_img, mode='RGBA')
-# image_sam.save('./output.png')

+import torch
 import numpy as np
 from PIL import Image
 from skimage.io import imsave
 from sam_utils import sam_out_nosave, sam_init
+class BackgroundRemoval:
+    def __init__(self, device='cuda'):
+        from carvekit.api.high import HiInterface
+        self.interface = HiInterface(
+            object_type="object",  # Can be "object" or "hairs-like".
+            batch_size_seg=5,
+            batch_size_matting=1,
+            device=device,
+            seg_mask_size=640,  # Use 640 for Tracer B7 and 320 for U2Net
+            matting_mask_size=2048,
+            trimap_prob_threshold=231,
+            trimap_dilation=30,
+            trimap_erosion_iters=5,
+            fp16=True,
+        )
+    @torch.no_grad()
+    def __call__(self, image):
+        # image: [H, W, 3] array in [0, 255].
+        # image = Image.fromarray(image)
+        image = self.interface([image])[0]
+        # image = np.array(image)
+        return image
+raw_im = Image.open('hf_demo/examples/flower.png')
 predictor = sam_init()
 raw_im.thumbnail([512, 512], Image.Resampling.LANCZOS)
 width, height = raw_im.size
+image_nobg = BackgroundRemoval()(raw_im.convert('RGB'))
 arr = np.asarray(image_nobg)[:, :, -1]
 x_nonzero = np.nonzero(arr.sum(axis=0))
 y_nonzero = np.nonzero(arr.sum(axis=1))
 y_min = int(y_nonzero[0].min())
 x_max = int(x_nonzero[0].max())
 y_max = int(y_nonzero[0].max())
+image_nobg.save('./nobg.png')
 image_nobg.thumbnail([512, 512], Image.Resampling.LANCZOS)
 image_sam = sam_out_nosave(predictor, image_nobg.convert("RGB"), (x_min, y_min, x_max, y_max))
+imsave('./mask.png', np.asarray(image_sam)[:,:,3])
 image_sam = np.asarray(image_sam, np.float32) / 255
 out_mask = image_sam[:, :, 3:]
 out_rgb = image_sam[:, :, :3] * out_mask + 1 - out_mask
 out_img = (np.concatenate([out_rgb, out_mask], 2) * 255).astype(np.uint8)
 image_sam = Image.fromarray(out_img, mode='RGBA')
+image_sam.save('./output.png')