Spaces · Realcat committed
Commit aebdae7 · 1 Parent(s): 7dc6568

add: ray dashboard port and serve port

Files changed:
- README.md +1 -1
- api/__init__.py +42 -0
- api/client.py +4 -11
- api/config/api.yaml +51 -0
- api/server.py +116 -145
- api/types.py +0 -16
- requirements.txt +3 -0
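The commit title refers to the ports wired up across these files; as a quick reference, here is where each value lands (collected from the diffs below, nothing beyond what they contain):

```python
# Port map after this commit (values copied from api/config/api.yaml,
# api/server.py, and api/client.py in the diffs below).
SERVE_HTTP_PORT = 8000        # Ray Serve HTTP proxy; client ENDPOINT now targets it
SERVE_GRPC_PORT = 9000        # Ray Serve gRPC proxy (no servicer functions registered yet)
RAY_DASHBOARD_PORT = 8265     # ray.init(dashboard_port=8265)
UVICORN_FALLBACK_PORT = 8001  # default port of ImageMatchingService.run()
```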
README.md CHANGED

````diff
@@ -107,7 +107,7 @@ docker run -it -p 7860:7860 vincentqin/image-matching-webui:latest python app.py
 
 ### Run demo
 ``` bash
-python3
+python3 app.py
 ```
 then open http://localhost:7860 in your browser.
 
````
api/__init__.py CHANGED

```diff
@@ -0,0 +1,42 @@
+import sys
+from typing import List
+from pydantic import BaseModel
+import base64
+import io
+import numpy as np
+from fastapi.exceptions import HTTPException
+from PIL import Image
+from pathlib import Path
+
+sys.path.append(str(Path(__file__).parents[1]))
+from hloc import logger
+
+
+class ImagesInput(BaseModel):
+    data: List[str] = []
+    max_keypoints: List[int] = []
+    timestamps: List[str] = []
+    grayscale: bool = False
+    image_hw: List[List[int]] = [[], []]
+    feature_type: int = 0
+    rotates: List[float] = []
+    scales: List[float] = []
+    reference_points: List[List[float]] = []
+    binarize: bool = False
+
+
+def decode_base64_to_image(encoding):
+    if encoding.startswith("data:image/"):
+        encoding = encoding.split(";")[1].split(",")[1]
+    try:
+        image = Image.open(io.BytesIO(base64.b64decode(encoding)))
+        return image
+    except Exception as e:
+        logger.warning(f"API cannot decode image: {e}")
+        raise HTTPException(
+            status_code=500, detail="Invalid encoded image"
+        ) from e
+
+
+def to_base64_nparray(encoding: str) -> np.ndarray:
+    return np.array(decode_base64_to_image(encoding)).astype("uint8")
```
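These helpers are the decoding half of the pipeline; `api/client.py`'s `read_image` produces the matching base64 strings. A minimal round-trip sketch, assuming the repo root is importable and using a hypothetical local test image `demo.jpg`:

```python
# Round-trip sketch for the helpers exported from api/__init__.py.
import base64

import cv2

from api import to_base64_nparray

# Encode the way api/client.py's read_image does: JPEG bytes -> base64 string.
img = cv2.imread("demo.jpg")  # "demo.jpg" is a placeholder test image
ok, buf = cv2.imencode(".jpg", img)
assert ok, "JPEG encoding failed"
encoded = base64.b64encode(buf.tobytes()).decode("utf-8")

# Decode back into a uint8 array via the new helper.
decoded = to_base64_nparray(encoded)
print(decoded.shape, decoded.dtype)  # (H, W, 3) uint8; note PIL decodes to RGB order
```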
api/client.py CHANGED

```diff
@@ -9,7 +9,7 @@ import cv2
 import numpy as np
 import requests
 
-ENDPOINT = "http://127.0.0.1:
+ENDPOINT = "http://127.0.0.1:8000"
 if "REMOTE_URL_RAILWAY" in os.environ:
     ENDPOINT = os.environ["REMOTE_URL_RAILWAY"]
 
@@ -23,10 +23,8 @@ API_URL_EXTRACT = f"{ENDPOINT}/v1/extract"
 def read_image(path: str) -> str:
     """
     Read an image from a file, encode it as a JPEG and then as a base64 string.
-
     Args:
         path (str): The path to the image to read.
-
     Returns:
         str: The base64 encoded image.
     """
@@ -45,12 +43,10 @@ def read_image(path: str) -> str:
 def do_api_requests(url=API_URL_EXTRACT, **kwargs):
     """
     Helper function to send an API request to the image matching service.
-
     Args:
         url (str): The URL of the API endpoint to use. Defaults to the
             feature extraction endpoint.
         **kwargs: Additional keyword arguments to pass to the API.
-
     Returns:
         List[Dict[str, np.ndarray]]: A list of dictionaries containing the
         extracted features. The keys are "keypoints", "descriptors", and
@@ -99,11 +95,9 @@ def do_api_requests(url=API_URL_EXTRACT, **kwargs):
 def send_request_match(path0: str, path1: str) -> Dict[str, np.ndarray]:
     """
     Send a request to the API to generate a match between two images.
-
     Args:
         path0 (str): The path to the first image.
         path1 (str): The path to the second image.
-
     Returns:
         Dict[str, np.ndarray]: A dictionary containing the generated matches.
         The keys are "keypoints0", "keypoints1", "matches0", and "matches1",
@@ -134,10 +128,8 @@ def send_request_extract(
 ) -> List[Dict[str, np.ndarray]]:
     """
     Send a request to the API to extract features from an image.
-
     Args:
         input_images (str): The path to the image.
-
     Returns:
         List[Dict[str, np.ndarray]]: A list of dictionaries containing the
         extracted features. The keys are "keypoints", "descriptors", and
@@ -152,7 +144,8 @@ def send_request_extract(
         url=API_URL_EXTRACT,
         **inputs,
     )
-
+    # breakpoint()
+    # print("Keypoints detected: {}".format(len(response[0]["keypoints"])))
 
     # draw matching, debug only
     if viz:
@@ -214,7 +207,7 @@ if __name__ == "__main__":
     # )
 
     # request extract
-    for i in range(
+    for i in range(1000):
         t1 = time.time()
         preds = send_request_extract(args.image0)
         t2 = time.time()
```
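The payload that `do_api_requests` ultimately posts follows the `ImagesInput` schema from `api/__init__.py`; for reference, a hand-rolled request against the new port might look like the sketch below (assuming the server is up on 8000, with `demo.jpg` again a placeholder):

```python
# Hypothetical direct call to /v1/extract, bypassing the client helpers.
import base64

import requests

with open("demo.jpg", "rb") as f:  # placeholder test image
    encoded = base64.b64encode(f.read()).decode("utf-8")

payload = {
    "data": [encoded],        # one base64-encoded image
    "max_keypoints": [1024],  # one entry per image (indexed per-image by the server)
    "binarize": False,
}
r = requests.post("http://127.0.0.1:8000/v1/extract", json=payload)
r.raise_for_status()
preds = r.json()  # list with one feature dict per input image
print(preds[0].keys())  # expect "keypoints", "descriptors", ...
```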
api/config/api.yaml ADDED

```diff
@@ -0,0 +1,51 @@
+# This file was generated using the `serve build` command on Ray v2.38.0.
+
+proxy_location: EveryNode
+http_options:
+  host: 0.0.0.0
+  port: 8000
+
+grpc_options:
+  port: 9000
+  grpc_servicer_functions: []
+
+logging_config:
+  encoding: TEXT
+  log_level: INFO
+  logs_dir: null
+  enable_access_log: true
+
+applications:
+- name: app1
+  route_prefix: /
+  import_path: api.server:service
+  runtime_env: {}
+  deployments:
+  - name: ImageMatchingService
+    num_replicas: 4
+    ray_actor_options:
+      num_cpus: 2.0
+      num_gpus: 1.0
+
+api:
+  feature:
+    output: feats-superpoint-n4096-rmax1600
+    model:
+      name: superpoint
+      nms_radius: 3
+      max_keypoints: 4096
+      keypoint_threshold: 0.005
+    preprocessing:
+      grayscale: True
+      force_resize: True
+      resize_max: 1600
+      width: 640
+      height: 480
+      dfactor: 8
+  matcher:
+    output: matches-NN-mutual
+    model:
+      name: nearest_neighbor
+      do_mutual_check: True
+      match_threshold: 0.2
+  dense: False
```
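Per the trailing comments in api/server.py below, this file is meant for the `serve build` / `serve run` workflow. A rough programmatic equivalent, sketched from those comments and not verified against this exact Ray version:

```python
# Sketch: deploy the bound service without the YAML file, mirroring
# `serve run api/config/api.yaml`. Assumes Ray 2.x with Serve installed
# and this repo's root on the import path.
import ray
from ray import serve

from api.server import service  # the ImageMatchingService.bind(...) handle

ray.init(dashboard_port=8265, ignore_reinit_error=True)      # dashboard port
serve.start(http_options={"host": "0.0.0.0", "port": 8000})  # serve HTTP port
serve.run(service, route_prefix="/")  # as in the commented-out line in server.py
```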
api/server.py CHANGED

```diff
@@ -1,24 +1,21 @@
 # server.py
-import base64
-import io
-import sys
 import warnings
 from pathlib import Path
 from typing import Any, Dict, Optional, Union
+import yaml
+
+import ray
+from ray import serve
 
 import cv2
 import matplotlib.pyplot as plt
 import numpy as np
 import torch
-import uvicorn
 from fastapi import FastAPI, File, UploadFile
-from fastapi.exceptions import HTTPException
 from fastapi.responses import JSONResponse
 from PIL import Image
 
-
-
-from api.types import ImagesInput
+from api import ImagesInput, to_base64_nparray
 from hloc import DEVICE, extract_features, logger, match_dense, match_features
 from hloc.utils.viz import add_text, plot_keypoints
 from ui import get_version
@@ -26,23 +23,16 @@ from ui.utils import filter_matches, get_feature_model, get_model
 from ui.viz import display_matches, fig2im, plot_images
 
 warnings.simplefilter("ignore")
-
-
-def decode_base64_to_image(encoding):
-    if encoding.startswith("data:image/"):
-        encoding = encoding.split(";")[1].split(",")[1]
-    try:
-        image = Image.open(io.BytesIO(base64.b64decode(encoding)))
-        return image
-    except Exception as e:
-        logger.warning(f"API cannot decode image: {e}")
-        raise HTTPException(
-            status_code=500, detail="Invalid encoded image"
-        ) from e
-
-
-def to_base64_nparray(encoding: str) -> np.ndarray:
-    return np.array(decode_base64_to_image(encoding)).astype("uint8")
+app = FastAPI()
+if ray.is_initialized():
+    ray.shutdown()
+ray.init(
+    dashboard_port=8265,
+    ignore_reinit_error=True,
+)
+serve.start(
+    http_options={"host": "0.0.0.0", "port": 8000},
+)
 
 
 class ImageMatchingAPI(torch.nn.Module):
@@ -68,14 +58,12 @@
     ) -> None:
         """
         Initializes an instance of the ImageMatchingAPI class.
-
         Args:
             conf (dict): A dictionary containing the configuration parameters.
             device (str, optional): The device to use for computation. Defaults to "cpu".
             detect_threshold (float, optional): The threshold for detecting keypoints. Defaults to 0.015.
             max_keypoints (int, optional): The maximum number of keypoints to extract. Defaults to 1024.
             match_threshold (float, optional): The threshold for matching keypoints. Defaults to 0.2.
-
         Returns:
             None
         """
@@ -170,13 +158,22 @@
         pred = match_features.match_images(self.matcher, pred0, pred1)
         return pred
 
+    def _convert_pred(self, pred):
+        ret = {
+            k: v.cpu().detach()[0].numpy() if isinstance(v, torch.Tensor) else v
+            for k, v in pred.items()
+        }
+        ret = {
+            k: v[0].cpu().detach().numpy() if isinstance(v, list) else v
+            for k, v in ret.items()
+        }
+        return ret
+
     @torch.inference_mode()
     def extract(self, img0: np.ndarray, **kwargs) -> Dict[str, np.ndarray]:
         """Extract features from a single image.
-
         Args:
             img0 (np.ndarray): image
-
         Returns:
             Dict[str, np.ndarray]: feature dict
         """
@@ -190,17 +187,13 @@
         pred = extract_features.extract(
             self.extractor, img0, self.extract_conf["preprocessing"]
         )
-        pred = {
-            k: v.cpu().detach()[0].numpy() if isinstance(v, torch.Tensor) else v
-            for k, v in pred.items()
-        }
+        pred = self._convert_pred(pred)
         # back to origin scale
         s0 = pred["original_size"] / pred["size"]
         pred["keypoints_orig"] = (
             match_features.scale_keypoints(pred["keypoints"] + 0.5, s0) - 0.5
         )
         # TODO: rotate back
-
         binarize = kwargs.get("binarize", False)
         if binarize:
             assert "descriptors" in pred
@@ -216,13 +209,11 @@
     ) -> Dict[str, np.ndarray]:
         """
         Forward pass of the image matching API.
-
         Args:
             img0: A 3D NumPy array of shape (H, W, C) representing the first image.
                   Values are in the range [0, 1] and are in RGB mode.
             img1: A 3D NumPy array of shape (H, W, C) representing the second image.
                   Values are in the range [0, 1] and are in RGB mode.
-
         Returns:
             A dictionary containing the following keys:
             - image0_orig: The original image 0.
@@ -252,11 +243,9 @@
         Filter matches using RANSAC. If keypoints are available, filter by keypoints.
         If lines are available, filter by lines. If both keypoints and lines are
         available, filter by keypoints.
-
         Args:
             pred (Dict[str, Any]): dict of matches, including original keypoints.
                 See :func:`filter_matches` for the expected keys.
-
         Returns:
             Dict[str, Any]: filtered matches
         """
@@ -275,10 +264,8 @@
     ) -> None:
         """
         Visualize the matches.
-
         Args:
             log_path (Path, optional): The directory to save the images. Defaults to None.
-
         Returns:
             None
         """
@@ -349,96 +336,95 @@
         plt.close("all")
 
 
+@serve.deployment(
+    num_replicas=4,
+    ray_actor_options={"num_cpus": 2, "num_gpus": 1}
+)
+@serve.ingress(app)
 class ImageMatchingService:
     def __init__(self, conf: dict, device: str):
         self.conf = conf
         self.api = ImageMatchingAPI(conf=conf, device=device)
-        self.app = FastAPI()
-        self.register_routes()
 
-    def register_routes(self):
-        @self.app.get("/version")
-        async def version():
-            return {"version": get_version()}
+    @app.get("/")
+    def root(self):
+        return "Hello, world!"
 
-        @self.app.post("/v1/match")
-        async def match(
-            image0: UploadFile = File(...), image1: UploadFile = File(...)
-        ):
-            """
-            Handle the image matching request and return the processed result.
-
-            Args:
-                image0 (UploadFile): The first image file for matching.
-                image1 (UploadFile): The second image file for matching.
-
-            Returns:
-                JSONResponse: A JSON response containing the filtered match results
-                or an error message in case of failure.
-            """
-            try:
-                # Load the images from the uploaded files
-                image0_array = self.load_image(image0)
-                image1_array = self.load_image(image1)
-
-                # Perform image matching using the API
-                output = self.api(image0_array, image1_array)
-
-                # Keys to skip in the output
-                skip_keys = ["image0_orig", "image1_orig"]
-
-                # Postprocess the output to filter unwanted data
-                pred = self.postprocess(output, skip_keys)
-
-                # Return the filtered prediction as a JSON response
-                return JSONResponse(content=pred)
-            except Exception as e:
-                # Return an error message with status code 500 in case of exception
-                return JSONResponse(content={"error": str(e)}, status_code=500)
-
-        @self.app.post("/v1/extract")
-        async def extract(input_info: ImagesInput):
-            """
-            Extract keypoints and descriptors from images.
-
-            Args:
-                input_info: An object containing the image data and options.
-
-            Returns:
-                A list of dictionaries containing the keypoints and descriptors.
-            """
-            try:
-                preds = []
-                for i, input_image in enumerate(input_info.data):
-                    # Load the image from the input data
-                    image_array = to_base64_nparray(input_image)
-                    # Extract keypoints and descriptors
-                    output = self.api.extract(
-                        image_array,
-                        max_keypoints=input_info.max_keypoints[i],
-                        binarize=input_info.binarize,
-                    )
-                    # Do not return the original image and image_orig
-                    # skip_keys = ["image", "image_orig"]
-                    skip_keys = []
-
-                    # Postprocess the output
-                    pred = self.postprocess(output, skip_keys)
-                    preds.append(pred)
-                # Return the list of extracted features
-                return JSONResponse(content=preds)
-            except Exception as e:
-                # Return an error message if an exception occurs
-                return JSONResponse(content={"error": str(e)}, status_code=500)
+    @app.get("/version")
+    async def version(self):
+        return {"version": get_version()}
+
+    @app.post("/v1/match")
+    async def match(
+        self, image0: UploadFile = File(...), image1: UploadFile = File(...)
+    ):
+        """
+        Handle the image matching request and return the processed result.
+        Args:
+            image0 (UploadFile): The first image file for matching.
+            image1 (UploadFile): The second image file for matching.
+        Returns:
+            JSONResponse: A JSON response containing the filtered match results
+            or an error message in case of failure.
+        """
+        try:
+            # Load the images from the uploaded files
+            image0_array = self.load_image(image0)
+            image1_array = self.load_image(image1)
 
+            # Perform image matching using the API
+            output = self.api(image0_array, image1_array)
 
+            # Keys to skip in the output
+            skip_keys = ["image0_orig", "image1_orig"]
+
+            # Postprocess the output to filter unwanted data
+            pred = self.postprocess(output, skip_keys)
+
+            # Return the filtered prediction as a JSON response
+            return JSONResponse(content=pred)
+        except Exception as e:
+            # Return an error message with status code 500 in case of exception
+            return JSONResponse(content={"error": str(e)}, status_code=500)
+
+    @app.post("/v1/extract")
+    async def extract(self, input_info: ImagesInput):
+        """
+        Extract keypoints and descriptors from images.
+        Args:
+            input_info: An object containing the image data and options.
+        Returns:
+            A list of dictionaries containing the keypoints and descriptors.
+        """
+        try:
+            preds = []
+            for i, input_image in enumerate(input_info.data):
+                # Load the image from the input data
+                image_array = to_base64_nparray(input_image)
+                # Extract keypoints and descriptors
+                output = self.api.extract(
+                    image_array,
+                    max_keypoints=input_info.max_keypoints[i],
+                    binarize=input_info.binarize,
+                )
+                # Do not return the original image and image_orig
+                # skip_keys = ["image", "image_orig"]
+                skip_keys = []
+
+                # Postprocess the output
+                pred = self.postprocess(output, skip_keys)
+                preds.append(pred)
+            # Return the list of extracted features
+            return JSONResponse(content=preds)
+        except Exception as e:
+            # Return an error message if an exception occurs
+            return JSONResponse(content={"error": str(e)}, status_code=500)
 
     def load_image(self, file_path: Union[str, UploadFile]) -> np.ndarray:
         """
         Reads an image from a file path or an UploadFile object.
-
         Args:
             file_path: A file path or an UploadFile object.
-
         Returns:
             A numpy array representing the image.
         """
@@ -462,38 +448,23 @@ class ImageMatchingService:
         return pred
 
     def run(self, host: str = "0.0.0.0", port: int = 8001):
-        uvicorn.run(self.app, host=host, port=port)
-
-
-if __name__ == "__main__":
-    conf = {
-        "feature": {
-            "output": "feats-superpoint-n4096-rmax1600",
-            "model": {
-                "name": "superpoint",
-                "nms_radius": 3,
-                "max_keypoints": 4096,
-                "keypoint_threshold": 0.005,
-            },
-            "preprocessing": {
-                "grayscale": True,
-                "force_resize": True,
-                "resize_max": 1600,
-                "width": 640,
-                "height": 480,
-                "dfactor": 8,
-            },
-        },
-        "matcher": {
-            "output": "matches-NN-mutual",
-            "model": {
-                "name": "nearest_neighbor",
-                "do_mutual_check": True,
-                "match_threshold": 0.2,
-            },
-        },
-        "dense": False,
-    }
+        import uvicorn
+        uvicorn.run(app, host=host, port=port)
+
+
+def read_config(config_path: Path) -> dict:
+    with open(config_path, "r") as f:
+        conf = yaml.safe_load(f)
+    return conf
+
+
+# api server
+conf = read_config(Path(__file__).parent / "config/api.yaml")
+service = ImageMatchingService.bind(conf=conf["api"], device=DEVICE)
+
+# handle = serve.run(service, route_prefix="/")
+# serve run api.server_ray:service
 
-    service = ImageMatchingService(conf=conf, device=DEVICE)
-    service.run()
+# build to generate config file
+# serve build api.server_ray:service -o api/config/ray.yaml
+# serve run api/config/ray.yaml
```
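With `@serve.ingress(app)`, the FastAPI routes above are served by the Ray Serve HTTP proxy on port 8000, and the dashboard from `ray.init(dashboard_port=8265)` sits at http://127.0.0.1:8265. A minimal smoke test for the `/v1/match` route, assuming two hypothetical local test images:

```python
# Smoke test for the Ray-served /v1/match endpoint (multipart upload).
import requests

with open("img0.jpg", "rb") as f0, open("img1.jpg", "rb") as f1:  # placeholder images
    r = requests.post(
        "http://127.0.0.1:8000/v1/match",
        files={"image0": f0, "image1": f1},
    )
r.raise_for_status()
pred = r.json()  # filtered matches; image0_orig/image1_orig are skipped by the server
print(sorted(pred.keys()))
```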
api/types.py DELETED

```diff
@@ -1,16 +0,0 @@
-from typing import List
-
-from pydantic import BaseModel
-
-
-class ImagesInput(BaseModel):
-    data: List[str] = []
-    max_keypoints: List[int] = []
-    timestamps: List[str] = []
-    grayscale: bool = False
-    image_hw: List[List[int]] = [[], []]
-    feature_type: int = 0
-    rotates: List[float] = []
-    scales: List[float] = []
-    reference_points: List[List[float]] = []
-    binarize: bool = False
```
requirements.txt CHANGED

```diff
@@ -36,3 +36,6 @@ roma #dust3r
 tqdm
 yacs
 fastapi
+uvicorn
+ray
+ray[serve]
```