Spaces:

jebin2
/

comic-panel-extractor

Running

App Files Community

jebin2 committed on Jul 20

Commit

e05ccab

1 Parent(s): 5ada1b3

made thin border

Browse files

Files changed (6) hide show

.gitignore +4 -1
comic_panel_extractor/cli.py +0 -2
comic_panel_extractor/image_processor.py +32 -1
comic_panel_extractor/main.py +6 -4
comic_panel_extractor/panel_extractor.py +2 -2
requirements.txt +2 -1

.gitignore CHANGED Viewed

@@ -205,4 +205,7 @@ cython_debug/
 marimo/_static/
 marimo/_lsp/
 __marimo__/
-temp_dir

 marimo/_static/
 marimo/_lsp/
 __marimo__/
+temp_dir
+input.jpg
+comic_panel_extractor/api_outputs/
+temp.py

comic_panel_extractor/cli.py CHANGED Viewed

@@ -68,8 +68,6 @@ Examples:
 					for key, value in config_data.items():
 						if hasattr(config, key):
 							setattr(config, key, value)
-				if args.verbose:
-					print(f"📄 Loaded configuration from: {args.config}")
 			except Exception as e:
 				print(f"⚠️  Warning: Could not load config file: {e}", file=sys.stderr)

 					for key, value in config_data.items():
 						if hasattr(config, key):
 							setattr(config, key, value)
 			except Exception as e:
 				print(f"⚠️  Warning: Could not load config file: {e}", file=sys.stderr)

comic_panel_extractor/image_processor.py CHANGED Viewed

@@ -50,9 +50,40 @@ class ImageProcessor:
         cv2.imwrite(str(dilated_path), dilated)
         return str(gray_path), str(binary_path), str(dilated_path)
     def clean_dilated_image(self, dilated_path: str,
-                           output_filename: str = "5_dilated_cleaned.jpg",
                            max_neighbors: int = 2) -> str:
         """Clean dilated image by thinning thick borders."""
         dilated = cv2.imread(dilated_path, cv2.IMREAD_GRAYSCALE)

         cv2.imwrite(str(dilated_path), dilated)
         return str(gray_path), str(binary_path), str(dilated_path)
+    def thin_image_borders(self, processed_image_path: str, output_filename: str = "5_thin_border.jpg") -> str:  # returns the path of the image written under self.config.output_folder
+        """
+        Clean dilated image by thinning thick borders and removing hanging clusters.
+        """
+        from skimage.morphology import skeletonize, remove_small_objects  # imported locally, so scikit-image is only needed when this method runs
+        from skimage.measure import label
+        # Load the input as a single-channel grayscale image
+        img = cv2.imread(processed_image_path, cv2.IMREAD_GRAYSCALE)  # NOTE(review): cv2.imread yields None for an unreadable path; no check is made here
+        _, binary = cv2.threshold(img, 128, 1, cv2.THRESH_BINARY_INV)  # invert, binary mask (0,1): pixels <= 128 become 1, brighter pixels become 0
+        # Skeletonize the 0/1 mask and cast the result back to uint8
+        skeleton = skeletonize(binary).astype(np.uint8)
+        # Remove small hanging clusters: label connected components, then drop the small ones
+        labeled = label(skeleton, connectivity=2)  # connectivity=2 also joins diagonally adjacent pixels (per skimage docs)
+        cleaned = remove_small_objects(labeled, min_size=150)  # Adjust min_size for more/less pruning; 150 is a hard-coded size threshold
+        # Convert back to 0–255 uint8 image: any surviving label (> 0) becomes 255
+        final = (cleaned > 0).astype(np.uint8) * 255
+        # Invert back so kept skeleton pixels are 0 and everything else is 255
+        result = 255 - final
+        # Save under the configured output folder using the given file name
+        output_path = f'{self.config.output_folder}/{output_filename}'
+        cv2.imwrite(output_path, result)  # NOTE(review): the return value of imwrite is ignored, so a failed write is not detected
+        print(f"✅ Cleaned and thinned image saved to: {output_path}")
+        return str(output_path)  # output_path is already a str; str() leaves it unchanged
     def clean_dilated_image(self, dilated_path: str,
+                           output_filename: str = "6_dilated_cleaned.jpg",
                            max_neighbors: int = 2) -> str:
         """Clean dilated image by thinning thick borders."""
         dilated = cv2.imread(dilated_path, cv2.IMREAD_GRAYSCALE)

comic_panel_extractor/main.py CHANGED Viewed

@@ -32,14 +32,16 @@ class ComicPanelExtractor:
         masked_image_path = self.image_processor.mask_text_regions([bubble["bbox"] for bubble in text_bubbles])
         # Step 2: Preprocess image
-        _, _, dilated_path = self.image_processor.preprocess_image(masked_image_path)
         # Step 3: Clean dilated image
-        cleaned_path = self.image_processor.clean_dilated_image(dilated_path)
         # Step 4: Extract panels
         panel_images, panel_data, all_panel_path = self.panel_extractor.extract_panels(
-            cleaned_path, min_width_ratio=0.1
         )
         return panel_images, panel_data, all_panel_path

         masked_image_path = self.image_processor.mask_text_regions([bubble["bbox"] for bubble in text_bubbles])
         # Step 2: Preprocess image
+        _, _, processed_image_path = self.image_processor.preprocess_image(masked_image_path)
+        # Step 3: Thin border line
+        processed_image_path = self.image_processor.thin_image_borders(processed_image_path)
         # Step 3: Clean dilated image
+        # processed_image_path = self.image_processor.clean_dilated_image(processed_image_path)
         # Step 4: Extract panels
         panel_images, panel_data, all_panel_path = self.panel_extractor.extract_panels(
+            processed_image_path, min_width_ratio=0.1
         )
         return panel_images, panel_data, all_panel_path

comic_panel_extractor/panel_extractor.py CHANGED Viewed

@@ -102,7 +102,7 @@ class PanelExtractor:
         width = dilated.shape[1]
         row_slice = dilated[y1:y2, :]
         col_black_percentage = np.sum(row_slice == 0, axis=0) / (y2 - y1) * 100
         # Find column gutters
         col_gutters = []
         in_gutter = False
@@ -169,7 +169,7 @@ class PanelExtractor:
             panel_data.append(panel_info)
             # Save panel image
-            panel_path = f'{self.config.output_folder}/panel_{idx}.jpg'
             cv2.imwrite(str(panel_path), panel_img)
             all_panel_path.append(panel_path)

         width = dilated.shape[1]
         row_slice = dilated[y1:y2, :]
         col_black_percentage = np.sum(row_slice == 0, axis=0) / (y2 - y1) * 100
         # Find column gutters
         col_gutters = []
         in_gutter = False
             panel_data.append(panel_info)
             # Save panel image
+            panel_path = f'{self.config.output_folder}/panel_{idx}_{(x1, y1, x2, y2)}.jpg'
             cv2.imwrite(str(panel_path), panel_img)
             all_panel_path.append(panel_path)

requirements.txt CHANGED Viewed

@@ -5,4 +5,5 @@ easyocr
 fastapi
 uvicorn
 python-multipart
-jinja2

 fastapi
 uvicorn
 python-multipart
+jinja2
+scikit-image