Spaces:

adirathor07
/

AutoEval

Runtime error

App Files Files Community

adirathor07 committed on Jul 11, 2024

Commit

153628e

1 Parent(s): 6e88fde

added doctr folder

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

doctr/__init__.py +3 -0
doctr/__pycache__/__init__.cpython-310.pyc +0 -0
doctr/__pycache__/__init__.cpython-311.pyc +0 -0
doctr/__pycache__/__init__.cpython-38.pyc +0 -0
doctr/__pycache__/file_utils.cpython-310.pyc +0 -0
doctr/__pycache__/file_utils.cpython-311.pyc +0 -0
doctr/__pycache__/file_utils.cpython-38.pyc +0 -0
doctr/__pycache__/version.cpython-311.pyc +0 -0
doctr/__pycache__/version.cpython-38.pyc +0 -0
doctr/contrib/__init__.py +0 -0
doctr/contrib/__pycache__/__init__.cpython-311.pyc +0 -0
doctr/contrib/__pycache__/__init__.cpython-38.pyc +0 -0
doctr/contrib/artefacts.py +131 -0
doctr/contrib/base.py +105 -0
doctr/datasets/__init__.py +26 -0
doctr/datasets/__pycache__/__init__.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/__init__.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/cord.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/cord.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/detection.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/detection.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/doc_artefacts.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/doc_artefacts.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/funsd.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/funsd.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/ic03.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/ic03.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/ic13.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/ic13.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/iiit5k.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/iiit5k.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/iiithws.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/iiithws.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/imgur5k.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/imgur5k.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/loader.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/loader.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/mjsynth.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/mjsynth.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/ocr.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/ocr.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/orientation.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/orientation.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/recognition.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/recognition.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/sroie.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/sroie.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/svhn.cpython-311.pyc +0 -0
doctr/datasets/__pycache__/svhn.cpython-38.pyc +0 -0
doctr/datasets/__pycache__/svt.cpython-311.pyc +0 -0

doctr/__init__.py ADDED Viewed

	@@ -0,0 +1,3 @@

+from . import io, models, datasets, contrib, transforms, utils
+from .file_utils import is_tf_available, is_torch_available
+from .version import __version__  # noqa: F401

doctr/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (382 Bytes). View file

doctr/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (499 Bytes). View file

doctr/__pycache__/__init__.cpython-38.pyc ADDED Viewed

Binary file (399 Bytes). View file

doctr/__pycache__/file_utils.cpython-310.pyc ADDED Viewed

Binary file (2.56 kB). View file

doctr/__pycache__/file_utils.cpython-311.pyc ADDED Viewed

Binary file (4.23 kB). View file

doctr/__pycache__/file_utils.cpython-38.pyc ADDED Viewed

Binary file (2.59 kB). View file

doctr/__pycache__/version.cpython-311.pyc ADDED Viewed

Binary file (198 Bytes). View file

doctr/__pycache__/version.cpython-38.pyc ADDED Viewed

Binary file (181 Bytes). View file

doctr/contrib/__init__.py ADDED Viewed

File without changes

doctr/contrib/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (185 Bytes). View file

doctr/contrib/__pycache__/__init__.cpython-38.pyc ADDED Viewed

Binary file (167 Bytes). View file

doctr/contrib/artefacts.py ADDED Viewed

	@@ -0,0 +1,131 @@

+# Copyright (C) 2021-2024, Mindee.
+# This program is licensed under the Apache License 2.0.
+# See LICENSE or go to <https://opensource.org/licenses/Apache-2.0> for full license details.
+from typing import Any, Dict, List, Optional, Tuple
+import cv2
+import numpy as np
+from doctr.file_utils import requires_package
+from .base import _BasePredictor
+# Names exported by `from doctr.contrib.artefacts import *`
+__all__ = ["ArtefactDetector"]
+# Default settings per architecture name. `ArtefactDetector.__init__` looks up the entry matching its
+# `arch` argument and reads the "url", "labels" and "input_shape" keys from it.
+default_cfgs: Dict[str, Dict[str, Any]] = {
+    "yolov8_artefact": {
+        # `preprocess` resizes with (input_shape[2], input_shape[1]), so this is presumably
+        # (channels, height, width) -- TODO confirm against the exported model
+        "input_shape": (3, 1024, 1024),
+        # Position in this list is the class id selected by argmax in `postprocess`
+        "labels": ["bar_code", "qr_code", "logo", "photo"],
+        # Location the ONNX model is downloaded from when no `model_path` is given
+        "url": "https://doctr-static.mindee.com/models?id=v0.8.1/yolo_artefact-f9d66f14.onnx&src=0",
+    },
+}
+class ArtefactDetector(_BasePredictor):
+    """
+    A class to detect artefacts in images
+    >>> from doctr.io import DocumentFile
+    >>> from doctr.contrib.artefacts import ArtefactDetector
+    >>> doc = DocumentFile.from_images(["path/to/image.jpg"])
+    >>> detector = ArtefactDetector()
+    >>> results = detector(doc)
+    Args:
+    ----
+        arch: the architecture to use, must be a key of `default_cfgs`
+        batch_size: the batch size to use
+        model_path: the path to the model to use
+        labels: the labels to use, defaults to the labels configured for `arch`
+        input_shape: the input shape to use, defaults to the input shape configured for `arch`
+        conf_threshold: the confidence threshold to use
+        iou_threshold: the intersection over union threshold to use
+        **kwargs: additional arguments to be passed to `download_from_url`
+    """
+    def __init__(
+        self,
+        arch: str = "yolov8_artefact",
+        batch_size: int = 2,
+        model_path: Optional[str] = None,
+        labels: Optional[List[str]] = None,
+        input_shape: Optional[Tuple[int, int, int]] = None,
+        conf_threshold: float = 0.5,
+        iou_threshold: float = 0.5,
+        **kwargs: Any,
+    ) -> None:
+        super().__init__(batch_size=batch_size, url=default_cfgs[arch]["url"], model_path=model_path, **kwargs)
+        self.labels = labels or default_cfgs[arch]["labels"]
+        self.input_shape = input_shape or default_cfgs[arch]["input_shape"]
+        self.conf_threshold = conf_threshold
+        self.iou_threshold = iou_threshold
+    def preprocess(self, img: np.ndarray) -> np.ndarray:
+        """
+        Resize an image to the model input size, move its last axis first and divide it by 255
+        Args:
+        ----
+            img: the input image to preprocess
+        Returns:
+        -------
+            np.ndarray: the preprocessed image
+        """
+        # cv2.resize takes its target size as (width, height)
+        resized = cv2.resize(img, (self.input_shape[2], self.input_shape[1]))
+        return np.transpose(resized, (2, 0, 1)) / np.array(255.0)
+    def _decode_sample(self, res: np.ndarray, img: np.ndarray) -> List[Dict[str, Any]]:
+        """Decode the raw prediction of one image into detections and drop the overlapping ones"""
+        org_height, org_width = img.shape[:2]
+        width_scale = org_width / self.input_shape[2]
+        height_scale = org_height / self.input_shape[1]
+        candidates: List[Dict[str, Any]] = []
+        # Once transposed, each row reads (x_center, y_center, width, height, *class_scores)
+        for row in np.transpose(np.squeeze(res)):
+            classes_scores = row[4:]
+            max_score = np.amax(classes_scores)
+            if max_score < self.conf_threshold:
+                continue
+            x, y, w, h = row[0], row[1], row[2], row[3]
+            candidates.append({
+                "label": self.labels[int(np.argmax(classes_scores))],
+                "confidence": float(max_score),
+                # rescaled xmin, ymin, xmax, ymax in the coordinates of the original image
+                "box": [
+                    int((x - w / 2) * width_scale),
+                    int((y - h / 2) * height_scale),
+                    int((x + w / 2) * width_scale),
+                    int((y + h / 2) * height_scale),
+                ],
+            })
+        if not candidates:
+            return []
+        # cv2.dnn.NMSBoxes expects (x, y, width, height) rectangles, not corner coordinates
+        nms_boxes = [[xmin, ymin, xmax - xmin, ymax - ymin] for xmin, ymin, xmax, ymax in (c["box"] for c in candidates)]
+        scores = [c["confidence"] for c in candidates]
+        keep_indices = cv2.dnn.NMSBoxes(nms_boxes, scores, self.conf_threshold, self.iou_threshold)  # type: ignore[arg-type]
+        # Flatten: depending on the OpenCV version the indices come back as shape (N,) or (N, 1)
+        return [candidates[int(i)] for i in np.asarray(keep_indices).reshape(-1)]
+    def postprocess(self, output: List[np.ndarray], input_images: List[List[np.ndarray]]) -> List[List[Dict[str, Any]]]:
+        """
+        Turn the raw model outputs into one list of detections per image
+        Args:
+        ----
+            output: the model output to postprocess, one entry per batch
+            input_images: the input images used to generate the output, grouped in the same batches
+        Returns:
+        -------
+            List[List[Dict[str, Any]]]: for each image, the kept detections as dicts with the keys
+            "label", "confidence" and "box" (xmin, ymin, xmax, ymax)
+        """
+        results: List[List[Dict[str, Any]]] = []
+        for batch_outputs, batch_images in zip(output, input_images):
+            for out in batch_outputs:
+                # Iterating `out` yields one prediction per sample of the batch: pair each one with its
+                # own image so boxes are rescaled with that image's size instead of the first image's.
+                for res, img in zip(out, batch_images):
+                    results.append(self._decode_sample(res, img))
+        self._results = results
+        return results
+    def show(self, **kwargs: Any) -> None:
+        """
+        Display the results
+        Args:
+        ----
+            **kwargs: additional keyword arguments to be passed to `plt.show`
+        """
+        requires_package("matplotlib", "`.show()` requires matplotlib installed")
+        import matplotlib.pyplot as plt
+        from matplotlib.patches import Rectangle
+        # nothing to draw until the detector has been called on some inputs
+        if not (self._results and self._inputs):
+            return
+        # one figure per input image, with every detection drawn as a labelled red box
+        for img, res in zip(self._inputs, self._results):
+            plt.figure(figsize=(10, 10))
+            plt.imshow(img)
+            for obj in res:
+                xmin, ymin, xmax, ymax = obj["box"]
+                label = obj["label"]
+                plt.text(xmin, ymin, f"{label} {obj['confidence']:.2f}", color="red")
+                plt.gca().add_patch(
+                    Rectangle((xmin, ymin), xmax - xmin, ymax - ymin, fill=False, edgecolor="red", linewidth=2)
+                )
+            plt.show(**kwargs)

doctr/contrib/base.py ADDED Viewed

	@@ -0,0 +1,105 @@

+# Copyright (C) 2021-2024, Mindee.
+# This program is licensed under the Apache License 2.0.
+# See LICENSE or go to <https://opensource.org/licenses/Apache-2.0> for full license details.
+from typing import Any, List, Optional
+import numpy as np
+from doctr.file_utils import requires_package
+from doctr.utils.data import download_from_url
+class _BasePredictor:
+    """
+    Shared scaffolding for the predictors: holds the inference session and drives the
+    batch / preprocess / run / postprocess sequence
+    Args:
+    ----
+        batch_size: how many inputs are sent to the model per run
+        url: where to download the model from when no `model_path` is given
+        model_path: the path to the model to use
+        **kwargs: additional arguments to be passed to `download_from_url`
+    """
+    def __init__(self, batch_size: int, url: Optional[str] = None, model_path: Optional[str] = None, **kwargs) -> None:
+        self.batch_size = batch_size
+        self.session = self._init_model(url, model_path, **kwargs)
+        # Last inputs and results, kept on the instance after each call
+        self._inputs: List[np.ndarray] = []
+        self._results: List[Any] = []
+    def _init_model(self, url: Optional[str] = None, model_path: Optional[str] = None, **kwargs: Any) -> Any:
+        """
+        Build the inference session, downloading the model first when no local path is given
+        Args:
+        ----
+            url: the url to download the model from
+            model_path: the path to the model to use, takes precedence over `url`
+            **kwargs: additional arguments to be passed to `download_from_url`
+        Returns:
+        -------
+            Any: the ONNX loaded model
+        """
+        requires_package("onnxruntime", "`.contrib` module requires `onnxruntime` to be installed.")
+        import onnxruntime as ort
+        if not (url or model_path):
+            raise ValueError("You must provide either a url or a model_path")
+        if model_path:
+            onnx_model_path = model_path
+        else:
+            onnx_model_path = str(download_from_url(url, cache_subdir="models", **kwargs))  # type: ignore[arg-type]
+        execution_providers = ["CUDAExecutionProvider", "CPUExecutionProvider"]
+        return ort.InferenceSession(onnx_model_path, providers=execution_providers)
+    def preprocess(self, img: np.ndarray) -> np.ndarray:
+        """
+        Prepare a single image for the model, to be implemented by subclasses
+        Args:
+        ----
+            img: the input image to preprocess
+        Returns:
+        -------
+            np.ndarray: the preprocessed image
+        """
+        raise NotImplementedError
+    def postprocess(self, output: List[np.ndarray], input_images: List[List[np.ndarray]]) -> Any:
+        """
+        Convert the raw model output into results, to be implemented by subclasses
+        Args:
+        ----
+            output: the model output to postprocess
+            input_images: the input images used to generate the output
+        Returns:
+        -------
+            Any: the postprocessed output
+        """
+        raise NotImplementedError
+    def __call__(self, inputs: List[np.ndarray]) -> Any:
+        """
+        Run the model on the given inputs, batch by batch
+        Args:
+        ----
+            inputs: the inputs to use
+        Returns:
+        -------
+            Any: the postprocessed output
+        """
+        self._inputs = inputs
+        model_inputs = self.session.get_inputs()
+        # Slice the inputs into consecutive groups of at most `batch_size` items
+        batched_inputs = []
+        for start in range(0, len(inputs), self.batch_size):
+            batched_inputs.append(inputs[start : start + self.batch_size])
+        # Preprocess every batch before the first model run
+        processed_batches = []
+        for group in batched_inputs:
+            prepared = [self.preprocess(sample) for sample in group]
+            processed_batches.append(np.array(prepared, dtype=np.float32))
+        # Each batch is fed to the first declared input of the model
+        outputs = []
+        for tensor in processed_batches:
+            outputs.append(self.session.run(None, {model_inputs[0].name: tensor}))
+        return self.postprocess(outputs, batched_inputs)

doctr/datasets/__init__.py ADDED Viewed

	@@ -0,0 +1,26 @@

+from doctr.file_utils import is_tf_available
+from .generator import *
+from .cord import *
+from .detection import *
+from .doc_artefacts import *
+from .funsd import *
+from .ic03 import *
+from .ic13 import *
+from .iiit5k import *
+from .iiithws import *
+from .imgur5k import *
+from .mjsynth import *
+from .ocr import *
+from .recognition import *
+from .orientation import *
+from .sroie import *
+from .svhn import *
+from .svt import *
+from .synthtext import *
+from .utils import *
+from .vocabs import *
+from .wildreceipt import *
+if is_tf_available():
+    from .loader import *

doctr/datasets/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (949 Bytes). View file

doctr/datasets/__pycache__/__init__.cpython-38.pyc ADDED Viewed

Binary file (655 Bytes). View file

doctr/datasets/__pycache__/cord.cpython-311.pyc ADDED Viewed

Binary file (6.39 kB). View file

doctr/datasets/__pycache__/cord.cpython-38.pyc ADDED Viewed

Binary file (3.5 kB). View file

doctr/datasets/__pycache__/detection.cpython-311.pyc ADDED Viewed

Binary file (6.35 kB). View file

doctr/datasets/__pycache__/detection.cpython-38.pyc ADDED Viewed

Binary file (3.75 kB). View file

doctr/datasets/__pycache__/doc_artefacts.cpython-311.pyc ADDED Viewed

Binary file (5.45 kB). View file

doctr/datasets/__pycache__/doc_artefacts.cpython-38.pyc ADDED Viewed

Binary file (3.12 kB). View file

doctr/datasets/__pycache__/funsd.cpython-311.pyc ADDED Viewed

Binary file (6.27 kB). View file

doctr/datasets/__pycache__/funsd.cpython-38.pyc ADDED Viewed

Binary file (3.63 kB). View file

doctr/datasets/__pycache__/ic03.cpython-311.pyc ADDED Viewed

Binary file (7.13 kB). View file

doctr/datasets/__pycache__/ic03.cpython-38.pyc ADDED Viewed

Binary file (3.93 kB). View file

doctr/datasets/__pycache__/ic13.cpython-311.pyc ADDED Viewed

Binary file (6.18 kB). View file

doctr/datasets/__pycache__/ic13.cpython-38.pyc ADDED Viewed

Binary file (3.78 kB). View file

doctr/datasets/__pycache__/iiit5k.cpython-311.pyc ADDED Viewed

Binary file (5.34 kB). View file

doctr/datasets/__pycache__/iiit5k.cpython-38.pyc ADDED Viewed

Binary file (3.36 kB). View file

doctr/datasets/__pycache__/iiithws.cpython-311.pyc ADDED Viewed

Binary file (4.14 kB). View file

doctr/datasets/__pycache__/iiithws.cpython-38.pyc ADDED Viewed

Binary file (2.67 kB). View file

doctr/datasets/__pycache__/imgur5k.cpython-311.pyc ADDED Viewed

Binary file (10.5 kB). View file

doctr/datasets/__pycache__/imgur5k.cpython-38.pyc ADDED Viewed

Binary file (5.51 kB). View file

doctr/datasets/__pycache__/loader.cpython-311.pyc ADDED Viewed

Binary file (4.77 kB). View file

doctr/datasets/__pycache__/loader.cpython-38.pyc ADDED Viewed

Binary file (3.18 kB). View file

doctr/datasets/__pycache__/mjsynth.cpython-311.pyc ADDED Viewed

Binary file (5.16 kB). View file

doctr/datasets/__pycache__/mjsynth.cpython-38.pyc ADDED Viewed

Binary file (3.81 kB). View file

doctr/datasets/__pycache__/ocr.cpython-311.pyc ADDED Viewed

Binary file (4.35 kB). View file

doctr/datasets/__pycache__/ocr.cpython-38.pyc ADDED Viewed

Binary file (2.47 kB). View file

doctr/datasets/__pycache__/orientation.cpython-311.pyc ADDED Viewed

Binary file (1.9 kB). View file

doctr/datasets/__pycache__/orientation.cpython-38.pyc ADDED Viewed

Binary file (1.4 kB). View file

doctr/datasets/__pycache__/recognition.cpython-311.pyc ADDED Viewed

Binary file (3.64 kB). View file

doctr/datasets/__pycache__/recognition.cpython-38.pyc ADDED Viewed

Binary file (2.14 kB). View file

doctr/datasets/__pycache__/sroie.cpython-311.pyc ADDED Viewed

Binary file (6.43 kB). View file

doctr/datasets/__pycache__/sroie.cpython-38.pyc ADDED Viewed

Binary file (3.73 kB). View file

doctr/datasets/__pycache__/svhn.cpython-311.pyc ADDED Viewed

Binary file (7.8 kB). View file

doctr/datasets/__pycache__/svhn.cpython-38.pyc ADDED Viewed

Binary file (4.23 kB). View file

doctr/datasets/__pycache__/svt.cpython-311.pyc ADDED Viewed

Binary file (6.8 kB). View file