petergpt committed on
Commit 4d7e87d · verified · 1 Parent(s): 36a76ae

Update app.py

Files changed (1)
  1. app.py +52 -41
app.py CHANGED
@@ -4,12 +4,16 @@ from transformers import AutoModelForImageSegmentation
 from PIL import Image
 from torchvision import transforms
 import gradio as gr
+import gc

-# Load the model
-birefnet = AutoModelForImageSegmentation.from_pretrained('zhengpeng7/BiRefNet_lite', trust_remote_code=True)
-device = 'cuda' if torch.cuda.is_available() else 'cpu'
-birefnet.to(device)
-birefnet.eval()
+def load_model():
+    model = AutoModelForImageSegmentation.from_pretrained('zhengpeng7/BiRefNet_lite', trust_remote_code=True)
+    device = 'cuda' if torch.cuda.is_available() else 'cpu'
+    model.to(device)
+    model.eval()
+    return model, device
+
+birefnet, device = load_model()

 # Preprocessing
 image_size = (1024, 1024)
@@ -19,19 +23,20 @@ transform_image = transforms.Compose([
     transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
 ])

-def run_inference(images):
-    # Convert all images into a batch tensor
+def run_inference(images, model, device):
     inputs = []
     original_sizes = []
     for img in images:
         original_sizes.append(img.size)
         inputs.append(transform_image(img))
     input_tensor = torch.stack(inputs).to(device)
-
-    # Run inference
-    with torch.no_grad():
-        preds = birefnet(input_tensor)[-1].sigmoid().cpu()
-
+    try:
+        with torch.no_grad():
+            preds = model(input_tensor)[-1].sigmoid().cpu()
+    except torch.OutOfMemoryError:
+        del input_tensor
+        torch.cuda.empty_cache()
+        raise
     # Post-process
     results = []
     for i, img in enumerate(images):
@@ -41,43 +46,49 @@ def run_inference(images):
         result = Image.new("RGBA", original_sizes[i], (0, 0, 0, 0))
         result.paste(img, mask=mask)
         results.append(result)
+    # Cleanup
+    del input_tensor, preds
+    gc.collect()
+    torch.cuda.empty_cache()
     return results

+def binary_search_max(images):
+    # After OOM, try to find max feasible batch
+    low, high = 1, len(images)
+    best = None
+    best_count = 0
+    while low <= high:
+        mid = (low + high) // 2
+        batch = images[:mid]
+        try:
+            # Re-load model to avoid leftover memory fragmentation
+            global birefnet, device
+            birefnet, device = load_model()
+            res = run_inference(batch, birefnet, device)
+            best = res
+            best_count = mid
+            low = mid + 1
+        except torch.OutOfMemoryError:
+            high = mid - 1
+    return best, best_count
+
 def extract_objects(filepaths):
     images = [Image.open(p).convert("RGB") for p in filepaths]
     start_time = time.time()

-    # Attempt to process all at once
+    # First attempt: all images
     try:
-        results = run_inference(images)
+        results = run_inference(images, birefnet, device)
         end_time = time.time()
         total_time = end_time - start_time
         summary = f"Total request time: {total_time:.2f}s\nProcessed {len(images)} images successfully."
         return results, summary
     except torch.OutOfMemoryError:
-        # Only if we fail, do we attempt to find a feasible batch size
-        torch.cuda.empty_cache()
-
-        fail_time = time.time()
-        initial_attempt_time = fail_time - start_time
-
-        # Binary search to find max feasible batch size
-        low, high = 1, len(images)
-        best = None
-        best_count = 0
+        # OOM occurred, try to find feasible batch size now
+        oom_time = time.time()
+        initial_attempt_time = oom_time - start_time

-        while low <= high:
-            mid = (low + high) // 2
-            batch = images[:mid]
-            try:
-                res = run_inference(batch)
-                best = res
-                best_count = mid
-                low = mid + 1  # try bigger
-            except torch.OutOfMemoryError:
-                torch.cuda.empty_cache()
-                high = mid - 1  # try smaller
-
+        best, best_count = binary_search_max(images)
         end_time = time.time()
         total_time = end_time - start_time

@@ -86,14 +97,14 @@ def extract_objects(filepaths):
             summary = (
                 f"Initial attempt OOM after {initial_attempt_time:.2f}s.\n"
                 f"Could not process even a single image.\n"
-                f"Total time with fallback attempts: {total_time:.2f}s."
+                f"Total time including fallback attempts: {total_time:.2f}s."
             )
             return [], summary
         else:
             summary = (
-                f"Initial attempt OOM after {initial_attempt_time:.2f}s. "
-                f"After fallback tests, found that {best_count} images can be processed.\n"
-                f"Total time including fallback: {total_time:.2f}s.\n"
+                f"Initial attempt OOM after {initial_attempt_time:.2f}s.\n"
+                f"Found that {best_count} images can be processed without OOM.\n"
+                f"Total time including fallback attempts: {total_time:.2f}s.\n"
                 f"Next time, try using up to {best_count} images."
             )
             return best, summary
@@ -103,7 +114,7 @@ iface = gr.Interface(
     inputs=gr.Files(label="Upload Multiple Images", type="filepath", file_count="multiple"),
     outputs=[gr.Gallery(label="Processed Images"), gr.Textbox(label="Timing Info")],
     title="BiRefNet Bulk Background Removal with On-Demand Fallback",
-    description="Upload as many images as you want. If OOM occurs, a quick fallback will find the max feasible number of images without adding overhead unless needed."
+    description="Upload as many images as you want. If OOM occurs, a fallback will find the max feasible number. Extra cleanup steps and reinitialization for more consistent results."
 )

 iface.launch()
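
A quick way to sanity-check the new fallback path without a GPU is to exercise the binary-search logic against a stand-in for run_inference. The sketch below is illustrative only: fake_process, find_max_batch, and MAX_FITTING are hypothetical stand-ins for the real inference call and the actual memory limit, and it assumes a PyTorch build recent enough to expose torch.OutOfMemoryError, which app.py itself relies on.

import torch

MAX_FITTING = 5  # hypothetical limit: pretend only 5 images fit in memory at once

def fake_process(batch):
    # Stand-in for run_inference: raises the same exception app.py catches.
    if len(batch) > MAX_FITTING:
        raise torch.OutOfMemoryError("simulated OOM")
    return [f"processed:{item}" for item in batch]

def find_max_batch(items, process):
    # Same halving logic as binary_search_max in app.py, minus the model re-load.
    low, high = 1, len(items)
    best, best_count = None, 0
    while low <= high:
        mid = (low + high) // 2
        try:
            best = process(items[:mid])
            best_count = mid
            low = mid + 1   # this size fits, try a bigger one
        except torch.OutOfMemoryError:
            high = mid - 1  # too big, shrink the window
    return best, best_count

results, count = find_max_batch(list(range(12)), fake_process)
print(count)         # 5
print(len(results))  # 5

Because the search only re-runs inference on prefixes of the upload, the fallback adds at most O(log n) extra attempts on top of the failed first pass, which is what the "fallback attempts" wording in the summary refers to.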