Spaces:

uartimcs
/

donut-booking-gradio

Running

App Files Files Community

uartimcs committed on Nov 20, 2024

Commit

550991a

verified ·

1 Parent(s): c2511af

Delete synthdog

Browse files

Files changed (42) hide show

synthdog/README.md +0 -63
synthdog/config_en.yaml +0 -119
synthdog/config_ja.yaml +0 -119
synthdog/config_ko.yaml +0 -119
synthdog/config_zh.yaml +0 -119
synthdog/elements/__init__.py +0 -12
synthdog/elements/background.py +0 -24
synthdog/elements/content.py +0 -118
synthdog/elements/document.py +0 -65
synthdog/elements/paper.py +0 -17
synthdog/elements/textbox.py +0 -43
synthdog/layouts/__init__.py +0 -9
synthdog/layouts/grid.py +0 -68
synthdog/layouts/grid_stack.py +0 -74
synthdog/resources/background/bedroom_83.jpg +0 -0
synthdog/resources/background/bob+dylan_83.jpg +0 -0
synthdog/resources/background/coffee_122.jpg +0 -0
synthdog/resources/background/coffee_18.jpeg +0 -3
synthdog/resources/background/crater_141.jpg +0 -3
synthdog/resources/background/cream_124.jpg +0 -3
synthdog/resources/background/eagle_110.jpg +0 -0
synthdog/resources/background/farm_25.jpg +0 -0
synthdog/resources/background/hiking_18.jpg +0 -0
synthdog/resources/corpus/enwiki.txt +0 -0
synthdog/resources/corpus/jawiki.txt +0 -0
synthdog/resources/corpus/kowiki.txt +0 -0
synthdog/resources/corpus/zhwiki.txt +0 -0
synthdog/resources/font/en/NotoSans-Regular.ttf +0 -0
synthdog/resources/font/en/NotoSerif-Regular.ttf +0 -0
synthdog/resources/font/ja/NotoSansJP-Regular.otf +0 -3
synthdog/resources/font/ja/NotoSerifJP-Regular.otf +0 -3
synthdog/resources/font/ko/NotoSansKR-Regular.otf +0 -3
synthdog/resources/font/ko/NotoSerifKR-Regular.otf +0 -3
synthdog/resources/font/zh/NotoSansSC-Regular.otf +0 -3
synthdog/resources/font/zh/NotoSerifSC-Regular.otf +0 -3
synthdog/resources/paper/paper_1.jpg +0 -3
synthdog/resources/paper/paper_2.jpg +0 -3
synthdog/resources/paper/paper_3.jpg +0 -3
synthdog/resources/paper/paper_4.jpg +0 -3
synthdog/resources/paper/paper_5.jpg +0 -3
synthdog/resources/paper/paper_6.jpg +0 -3
synthdog/template.py +0 -130

synthdog/README.md DELETED Viewed

@@ -1,63 +0,0 @@
-# SynthDoG 🐶: Synthetic Document Generator
-SynthDoG is a synthetic document generator for visual document understanding (VDU).
-![image](../misc/sample_synthdog.png)
-## Prerequisites
-- python>=3.6
-- [synthtiger](https://github.com/clovaai/synthtiger) (`pip install synthtiger`)
-## Usage
-```bash
-# Set environment variable (for macOS)
-$ export OBJC_DISABLE_INITIALIZE_FORK_SAFETY=YES
-synthtiger -o ./outputs/SynthDoG_en -c 50 -w 4 -v template.py SynthDoG config_en.yaml
-{'config': 'config_en.yaml',
- 'count': 50,
- 'name': 'SynthDoG',
- 'output': './outputs/SynthDoG_en',
- 'script': 'template.py',
- 'verbose': True,
- 'worker': 4}
-{'aspect_ratio': [1, 2],
-     .
-     .
- 'quality': [50, 95],
- 'short_size': [720, 1024]}
-Generated 1 data (task 3)
-Generated 2 data (task 0)
-Generated 3 data (task 1)
-     .
-     .
-Generated 49 data (task 48)
-Generated 50 data (task 49)
-46.32 seconds elapsed
-```
-Some important arguments:
-- `-o` : directory path to save data.
-- `-c` : number of data to generate.
-- `-w` : number of workers.
-- `-s` : random seed.
-- `-v` : print error messages.
-To generate ECJK (English, Chinese, Japanese, Korean) samples:
-```bash
-# english
-synthtiger -o {dataset_path} -c {num_of_data} -w {num_of_workers} -v template.py SynthDoG config_en.yaml
-# chinese
-synthtiger -o {dataset_path} -c {num_of_data} -w {num_of_workers} -v template.py SynthDoG config_zh.yaml
-# japanese
-synthtiger -o {dataset_path} -c {num_of_data} -w {num_of_workers} -v template.py SynthDoG config_ja.yaml
-# korean
-synthtiger -o {dataset_path} -c {num_of_data} -w {num_of_workers} -v template.py SynthDoG config_ko.yaml
-```

synthdog/config_en.yaml DELETED Viewed

@@ -1,119 +0,0 @@
-quality: [50, 95]
-landscape: 0.5
-short_size: [720, 1024]
-aspect_ratio: [1, 2]
-background:
-  image:
-    paths: [resources/background]
-    weights: [1]
-  effect:
-    args:
-      # gaussian blur
-      - prob: 1
-        args:
-          sigma: [0, 10]
-document:
-  fullscreen: 0.5
-  landscape: 0.5
-  short_size: [480, 1024]
-  aspect_ratio: [1, 2]
-  paper:
-    image:
-      paths: [resources/paper]
-      weights: [1]
-      alpha: [0, 0.2]
-      grayscale: 1
-      crop: 1
-  content:
-    margin: [0, 0.1]
-    text:
-      path: resources/corpus/enwiki.txt
-    font:
-      paths: [resources/font/en]
-      weights: [1]
-      bold: 0
-    layout:
-      text_scale: [0.0334, 0.1]
-      max_row: 10
-      max_col: 3
-      fill: [0.5, 1]
-      full: 0.1
-      align: [left, right, center]
-      stack_spacing: [0.0334, 0.0334]
-      stack_fill: [0.5, 1]
-      stack_full: 0.1
-    textbox:
-      fill: [0.5, 1]
-    textbox_color:
-      prob: 0.2
-      args:
-        gray: [0, 64]
-        colorize: 1
-    content_color:
-      prob: 0.2
-      args:
-        gray: [0, 64]
-        colorize: 1
-  effect:
-    args:
-      # elastic distortion
-      - prob: 1
-        args:
-          alpha: [0, 1]
-          sigma: [0, 0.5]
-      # gaussian noise
-      - prob: 1
-        args:
-          scale: [0, 8]
-          per_channel: 0
-      # perspective
-      - prob: 1
-        args:
-          weights: [750, 50, 50, 25, 25, 25, 25, 50]
-          args:
-            - percents: [[0.75, 1], [0.75, 1], [0.75, 1], [0.75, 1]]
-            - percents: [[0.75, 1], [1, 1], [0.75, 1], [1, 1]]
-            - percents: [[1, 1], [0.75, 1], [1, 1], [0.75, 1]]
-            - percents: [[0.75, 1], [1, 1], [1, 1], [1, 1]]
-            - percents: [[1, 1], [0.75, 1], [1, 1], [1, 1]]
-            - percents: [[1, 1], [1, 1], [0.75, 1], [1, 1]]
-            - percents: [[1, 1], [1, 1], [1, 1], [0.75, 1]]
-            - percents: [[1, 1], [1, 1], [1, 1], [1, 1]]
-effect:
-  args:
-    # color
-    - prob: 0.2
-      args:
-        rgb: [[0, 255], [0, 255], [0, 255]]
-        alpha: [0, 0.2]
-    # shadow
-    - prob: 1
-      args:
-        intensity: [0, 160]
-        amount: [0, 1]
-        smoothing: [0.5, 1]
-        bidirectional: 0
-    # contrast
-    - prob: 1
-      args:
-        alpha: [1, 1.5]
-    # brightness
-    - prob: 1
-      args:
-        beta: [-48, 0]
-    # motion blur
-    - prob: 0.5
-      args:
-        k: [3, 5]
-        angle: [0, 360]
-    # gaussian blur
-    - prob: 1
-      args:
-        sigma: [0, 1.5]

synthdog/config_ja.yaml DELETED Viewed

@@ -1,119 +0,0 @@
-quality: [50, 95]
-landscape: 0.5
-short_size: [720, 1024]
-aspect_ratio: [1, 2]
-background:
-  image:
-    paths: [resources/background]
-    weights: [1]
-  effect:
-    args:
-      # gaussian blur
-      - prob: 1
-        args:
-          sigma: [0, 10]
-document:
-  fullscreen: 0.5
-  landscape: 0.5
-  short_size: [480, 1024]
-  aspect_ratio: [1, 2]
-  paper:
-    image:
-      paths: [resources/paper]
-      weights: [1]
-      alpha: [0, 0.2]
-      grayscale: 1
-      crop: 1
-  content:
-    margin: [0, 0.1]
-    text:
-      path: resources/corpus/jawiki.txt
-    font:
-      paths: [resources/font/ja]
-      weights: [1]
-      bold: 0
-    layout:
-      text_scale: [0.0334, 0.1]
-      max_row: 10
-      max_col: 3
-      fill: [0.5, 1]
-      full: 0.1
-      align: [left, right, center]
-      stack_spacing: [0.0334, 0.0334]
-      stack_fill: [0.5, 1]
-      stack_full: 0.1
-    textbox:
-      fill: [0.5, 1]
-    textbox_color:
-      prob: 0.2
-      args:
-        gray: [0, 64]
-        colorize: 1
-    content_color:
-      prob: 0.2
-      args:
-        gray: [0, 64]
-        colorize: 1
-  effect:
-    args:
-      # elastic distortion
-      - prob: 1
-        args:
-          alpha: [0, 1]
-          sigma: [0, 0.5]
-      # gaussian noise
-      - prob: 1
-        args:
-          scale: [0, 8]
-          per_channel: 0
-      # perspective
-      - prob: 1
-        args:
-          weights: [750, 50, 50, 25, 25, 25, 25, 50]
-          args:
-            - percents: [[0.75, 1], [0.75, 1], [0.75, 1], [0.75, 1]]
-            - percents: [[0.75, 1], [1, 1], [0.75, 1], [1, 1]]
-            - percents: [[1, 1], [0.75, 1], [1, 1], [0.75, 1]]
-            - percents: [[0.75, 1], [1, 1], [1, 1], [1, 1]]
-            - percents: [[1, 1], [0.75, 1], [1, 1], [1, 1]]
-            - percents: [[1, 1], [1, 1], [0.75, 1], [1, 1]]
-            - percents: [[1, 1], [1, 1], [1, 1], [0.75, 1]]
-            - percents: [[1, 1], [1, 1], [1, 1], [1, 1]]
-effect:
-  args:
-    # color
-    - prob: 0.2
-      args:
-        rgb: [[0, 255], [0, 255], [0, 255]]
-        alpha: [0, 0.2]
-    # shadow
-    - prob: 1
-      args:
-        intensity: [0, 160]
-        amount: [0, 1]
-        smoothing: [0.5, 1]
-        bidirectional: 0
-    # contrast
-    - prob: 1
-      args:
-        alpha: [1, 1.5]
-    # brightness
-    - prob: 1
-      args:
-        beta: [-48, 0]
-    # motion blur
-    - prob: 0.5
-      args:
-        k: [3, 5]
-        angle: [0, 360]
-    # gaussian blur
-    - prob: 1
-      args:
-        sigma: [0, 1.5]

synthdog/config_ko.yaml DELETED Viewed

@@ -1,119 +0,0 @@
-quality: [50, 95]
-landscape: 0.5
-short_size: [720, 1024]
-aspect_ratio: [1, 2]
-background:
-  image:
-    paths: [resources/background]
-    weights: [1]
-  effect:
-    args:
-      # gaussian blur
-      - prob: 1
-        args:
-          sigma: [0, 10]
-document:
-  fullscreen: 0.5
-  landscape: 0.5
-  short_size: [480, 1024]
-  aspect_ratio: [1, 2]
-  paper:
-    image:
-      paths: [resources/paper]
-      weights: [1]
-      alpha: [0, 0.2]
-      grayscale: 1
-      crop: 1
-  content:
-    margin: [0, 0.1]
-    text:
-      path: resources/corpus/kowiki.txt
-    font:
-      paths: [resources/font/ko]
-      weights: [1]
-      bold: 0
-    layout:
-      text_scale: [0.0334, 0.1]
-      max_row: 10
-      max_col: 3
-      fill: [0.5, 1]
-      full: 0.1
-      align: [left, right, center]
-      stack_spacing: [0.0334, 0.0334]
-      stack_fill: [0.5, 1]
-      stack_full: 0.1
-    textbox:
-      fill: [0.5, 1]
-    textbox_color:
-      prob: 0.2
-      args:
-        gray: [0, 64]
-        colorize: 1
-    content_color:
-      prob: 0.2
-      args:
-        gray: [0, 64]
-        colorize: 1
-  effect:
-    args:
-      # elastic distortion
-      - prob: 1
-        args:
-          alpha: [0, 1]
-          sigma: [0, 0.5]
-      # gaussian noise
-      - prob: 1
-        args:
-          scale: [0, 8]
-          per_channel: 0
-      # perspective
-      - prob: 1
-        args:
-          weights: [750, 50, 50, 25, 25, 25, 25, 50]
-          args:
-            - percents: [[0.75, 1], [0.75, 1], [0.75, 1], [0.75, 1]]
-            - percents: [[0.75, 1], [1, 1], [0.75, 1], [1, 1]]
-            - percents: [[1, 1], [0.75, 1], [1, 1], [0.75, 1]]
-            - percents: [[0.75, 1], [1, 1], [1, 1], [1, 1]]
-            - percents: [[1, 1], [0.75, 1], [1, 1], [1, 1]]
-            - percents: [[1, 1], [1, 1], [0.75, 1], [1, 1]]
-            - percents: [[1, 1], [1, 1], [1, 1], [0.75, 1]]
-            - percents: [[1, 1], [1, 1], [1, 1], [1, 1]]
-effect:
-  args:
-    # color
-    - prob: 0.2
-      args:
-        rgb: [[0, 255], [0, 255], [0, 255]]
-        alpha: [0, 0.2]
-    # shadow
-    - prob: 1
-      args:
-        intensity: [0, 160]
-        amount: [0, 1]
-        smoothing: [0.5, 1]
-        bidirectional: 0
-    # contrast
-    - prob: 1
-      args:
-        alpha: [1, 1.5]
-    # brightness
-    - prob: 1
-      args:
-        beta: [-48, 0]
-    # motion blur
-    - prob: 0.5
-      args:
-        k: [3, 5]
-        angle: [0, 360]
-    # gaussian blur
-    - prob: 1
-      args:
-        sigma: [0, 1.5]

synthdog/config_zh.yaml DELETED Viewed

@@ -1,119 +0,0 @@
-quality: [50, 95]
-landscape: 0.5
-short_size: [720, 1024]
-aspect_ratio: [1, 2]
-background:
-  image:
-    paths: [resources/background]
-    weights: [1]
-  effect:
-    args:
-      # gaussian blur
-      - prob: 1
-        args:
-          sigma: [0, 10]
-document:
-  fullscreen: 0.5
-  landscape: 0.5
-  short_size: [480, 1024]
-  aspect_ratio: [1, 2]
-  paper:
-    image:
-      paths: [resources/paper]
-      weights: [1]
-      alpha: [0, 0.2]
-      grayscale: 1
-      crop: 1
-  content:
-    margin: [0, 0.1]
-    text:
-      path: resources/corpus/zhwiki.txt
-    font:
-      paths: [resources/font/zh]
-      weights: [1]
-      bold: 0
-    layout:
-      text_scale: [0.0334, 0.1]
-      max_row: 10
-      max_col: 3
-      fill: [0.5, 1]
-      full: 0.1
-      align: [left, right, center]
-      stack_spacing: [0.0334, 0.0334]
-      stack_fill: [0.5, 1]
-      stack_full: 0.1
-    textbox:
-      fill: [0.5, 1]
-    textbox_color:
-      prob: 0.2
-      args:
-        gray: [0, 64]
-        colorize: 1
-    content_color:
-      prob: 0.2
-      args:
-        gray: [0, 64]
-        colorize: 1
-  effect:
-    args:
-      # elastic distortion
-      - prob: 1
-        args:
-          alpha: [0, 1]
-          sigma: [0, 0.5]
-      # gaussian noise
-      - prob: 1
-        args:
-          scale: [0, 8]
-          per_channel: 0
-      # perspective
-      - prob: 1
-        args:
-          weights: [750, 50, 50, 25, 25, 25, 25, 50]
-          args:
-            - percents: [[0.75, 1], [0.75, 1], [0.75, 1], [0.75, 1]]
-            - percents: [[0.75, 1], [1, 1], [0.75, 1], [1, 1]]
-            - percents: [[1, 1], [0.75, 1], [1, 1], [0.75, 1]]
-            - percents: [[0.75, 1], [1, 1], [1, 1], [1, 1]]
-            - percents: [[1, 1], [0.75, 1], [1, 1], [1, 1]]
-            - percents: [[1, 1], [1, 1], [0.75, 1], [1, 1]]
-            - percents: [[1, 1], [1, 1], [1, 1], [0.75, 1]]
-            - percents: [[1, 1], [1, 1], [1, 1], [1, 1]]
-effect:
-  args:
-    # color
-    - prob: 0.2
-      args:
-        rgb: [[0, 255], [0, 255], [0, 255]]
-        alpha: [0, 0.2]
-    # shadow
-    - prob: 1
-      args:
-        intensity: [0, 160]
-        amount: [0, 1]
-        smoothing: [0.5, 1]
-        bidirectional: 0
-    # contrast
-    - prob: 1
-      args:
-        alpha: [1, 1.5]
-    # brightness
-    - prob: 1
-      args:
-        beta: [-48, 0]
-    # motion blur
-    - prob: 0.5
-      args:
-        k: [3, 5]
-        angle: [0, 360]
-    # gaussian blur
-    - prob: 1
-      args:
-        sigma: [0, 1.5]

synthdog/elements/__init__.py DELETED Viewed

@@ -1,12 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-from elements.background import Background
-from elements.content import Content
-from elements.document import Document
-from elements.paper import Paper
-from elements.textbox import TextBox
-__all__ = ["Background", "Content", "Document", "Paper", "TextBox"]

synthdog/elements/background.py DELETED Viewed

@@ -1,24 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-from synthtiger import components, layers
-class Background:
-    def __init__(self, config):
-        self.image = components.BaseTexture(**config.get("image", {}))
-        self.effect = components.Iterator(
-            [
-                components.Switch(components.GaussianBlur()),
-            ],
-            **config.get("effect", {})
-        )
-    def generate(self, size):
-        bg_layer = layers.RectLayer(size, (255, 255, 255, 255))
-        self.image.apply([bg_layer])
-        self.effect.apply([bg_layer])
-        return bg_layer

synthdog/elements/content.py DELETED Viewed

@@ -1,118 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-from collections import OrderedDict
-import numpy as np
-from synthtiger import components
-from elements.textbox import TextBox
-from layouts import GridStack
-class TextReader:
-    def __init__(self, path, cache_size=2 ** 28, block_size=2 ** 20):
-        self.fp = open(path, "r", encoding="utf-8")
-        self.length = 0
-        self.offsets = [0]
-        self.cache = OrderedDict()
-        self.cache_size = cache_size
-        self.block_size = block_size
-        self.bucket_size = cache_size // block_size
-        self.idx = 0
-        while True:
-            text = self.fp.read(self.block_size)
-            if not text:
-                break
-            self.length += len(text)
-            self.offsets.append(self.fp.tell())
-    def __len__(self):
-        return self.length
-    def __iter__(self):
-        return self
-    def __next__(self):
-        char = self.get()
-        self.next()
-        return char
-    def move(self, idx):
-        self.idx = idx
-    def next(self):
-        self.idx = (self.idx + 1) % self.length
-    def prev(self):
-        self.idx = (self.idx - 1) % self.length
-    def get(self):
-        key = self.idx // self.block_size
-        if key in self.cache:
-            text = self.cache[key]
-        else:
-            if len(self.cache) >= self.bucket_size:
-                self.cache.popitem(last=False)
-            offset = self.offsets[key]
-            self.fp.seek(offset, 0)
-            text = self.fp.read(self.block_size)
-            self.cache[key] = text
-        self.cache.move_to_end(key)
-        char = text[self.idx % self.block_size]
-        return char
-class Content:
-    def __init__(self, config):
-        self.margin = config.get("margin", [0, 0.1])
-        self.reader = TextReader(**config.get("text", {}))
-        self.font = components.BaseFont(**config.get("font", {}))
-        self.layout = GridStack(config.get("layout", {}))
-        self.textbox = TextBox(config.get("textbox", {}))
-        self.textbox_color = components.Switch(components.Gray(), **config.get("textbox_color", {}))
-        self.content_color = components.Switch(components.Gray(), **config.get("content_color", {}))
-    def generate(self, size):
-        width, height = size
-        layout_left = width * np.random.uniform(self.margin[0], self.margin[1])
-        layout_top = height * np.random.uniform(self.margin[0], self.margin[1])
-        layout_width = max(width - layout_left * 2, 0)
-        layout_height = max(height - layout_top * 2, 0)
-        layout_bbox = [layout_left, layout_top, layout_width, layout_height]
-        text_layers, texts = [], []
-        layouts = self.layout.generate(layout_bbox)
-        self.reader.move(np.random.randint(len(self.reader)))
-        for layout in layouts:
-            font = self.font.sample()
-            for bbox, align in layout:
-                x, y, w, h = bbox
-                text_layer, text = self.textbox.generate((w, h), self.reader, font)
-                self.reader.prev()
-                if text_layer is None:
-                    continue
-                text_layer.center = (x + w / 2, y + h / 2)
-                if align == "left":
-                    text_layer.left = x
-                if align == "right":
-                    text_layer.right = x + w
-                self.textbox_color.apply([text_layer])
-                text_layers.append(text_layer)
-                texts.append(text)
-        self.content_color.apply(text_layers)
-        return text_layers, texts

synthdog/elements/document.py DELETED Viewed

@@ -1,65 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-import numpy as np
-from synthtiger import components
-from elements.content import Content
-from elements.paper import Paper
-class Document:
-    def __init__(self, config):
-        self.fullscreen = config.get("fullscreen", 0.5)
-        self.landscape = config.get("landscape", 0.5)
-        self.short_size = config.get("short_size", [480, 1024])
-        self.aspect_ratio = config.get("aspect_ratio", [1, 2])
-        self.paper = Paper(config.get("paper", {}))
-        self.content = Content(config.get("content", {}))
-        self.effect = components.Iterator(
-            [
-                components.Switch(components.ElasticDistortion()),
-                components.Switch(components.AdditiveGaussianNoise()),
-                components.Switch(
-                    components.Selector(
-                        [
-                            components.Perspective(),
-                            components.Perspective(),
-                            components.Perspective(),
-                            components.Perspective(),
-                            components.Perspective(),
-                            components.Perspective(),
-                            components.Perspective(),
-                            components.Perspective(),
-                        ]
-                    )
-                ),
-            ],
-            **config.get("effect", {}),
-        )
-    def generate(self, size):
-        width, height = size
-        fullscreen = np.random.rand() < self.fullscreen
-        if not fullscreen:
-            landscape = np.random.rand() < self.landscape
-            max_size = width if landscape else height
-            short_size = np.random.randint(
-                min(width, height, self.short_size[0]),
-                min(width, height, self.short_size[1]) + 1,
-            )
-            aspect_ratio = np.random.uniform(
-                min(max_size / short_size, self.aspect_ratio[0]),
-                min(max_size / short_size, self.aspect_ratio[1]),
-            )
-            long_size = int(short_size * aspect_ratio)
-            size = (long_size, short_size) if landscape else (short_size, long_size)
-        text_layers, texts = self.content.generate(size)
-        paper_layer = self.paper.generate(size)
-        self.effect.apply([*text_layers, paper_layer])
-        return paper_layer, text_layers, texts

synthdog/elements/paper.py DELETED Viewed

@@ -1,17 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-from synthtiger import components, layers
-class Paper:
-    def __init__(self, config):
-        self.image = components.BaseTexture(**config.get("image", {}))
-    def generate(self, size):
-        paper_layer = layers.RectLayer(size, (255, 255, 255, 255))
-        self.image.apply([paper_layer])
-        return paper_layer

synthdog/elements/textbox.py DELETED Viewed

@@ -1,43 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-import numpy as np
-from synthtiger import layers
-class TextBox:
-    def __init__(self, config):
-        self.fill = config.get("fill", [1, 1])
-    def generate(self, size, text, font):
-        width, height = size
-        char_layers, chars = [], []
-        fill = np.random.uniform(self.fill[0], self.fill[1])
-        width = np.clip(width * fill, height, width)
-        font = {**font, "size": int(height)}
-        left, top = 0, 0
-        for char in text:
-            if char in "\r\n":
-                continue
-            char_layer = layers.TextLayer(char, **font)
-            char_scale = height / char_layer.height
-            char_layer.bbox = [left, top, *(char_layer.size * char_scale)]
-            if char_layer.right > width:
-                break
-            char_layers.append(char_layer)
-            chars.append(char)
-            left = char_layer.right
-        text = "".join(chars).strip()
-        if len(char_layers) == 0 or len(text) == 0:
-            return None, None
-        text_layer = layers.Group(char_layers).merge()
-        return text_layer, text

synthdog/layouts/__init__.py DELETED Viewed

@@ -1,9 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-from layouts.grid import Grid
-from layouts.grid_stack import GridStack
-__all__ = ["Grid", "GridStack"]

synthdog/layouts/grid.py DELETED Viewed

@@ -1,68 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-import numpy as np
-class Grid:
-    def __init__(self, config):
-        self.text_scale = config.get("text_scale", [0.05, 0.1])
-        self.max_row = config.get("max_row", 5)
-        self.max_col = config.get("max_col", 3)
-        self.fill = config.get("fill", [0, 1])
-        self.full = config.get("full", 0)
-        self.align = config.get("align", ["left", "right", "center"])
-    def generate(self, bbox):
-        left, top, width, height = bbox
-        text_scale = np.random.uniform(self.text_scale[0], self.text_scale[1])
-        text_size = min(width, height) * text_scale
-        grids = np.random.permutation(self.max_row * self.max_col)
-        for grid in grids:
-            row = grid // self.max_col + 1
-            col = grid % self.max_col + 1
-            if text_size * (col * 2 - 1) <= width and text_size * row <= height:
-                break
-        else:
-            return None
-        bound = max(1 - text_size / width * (col - 1), 0)
-        full = np.random.rand() < self.full
-        fill = np.random.uniform(self.fill[0], self.fill[1])
-        fill = 1 if full else fill
-        fill = np.clip(fill, 0, bound)
-        padding = np.random.randint(4) if col > 1 else np.random.randint(1, 4)
-        padding = (bool(padding // 2), bool(padding % 2))
-        weights = np.zeros(col * 2 + 1)
-        weights[1:-1] = text_size / width
-        probs = 1 - np.random.rand(col * 2 + 1)
-        probs[0] = 0 if not padding[0] else probs[0]
-        probs[-1] = 0 if not padding[-1] else probs[-1]
-        probs[1::2] *= max(fill - sum(weights[1::2]), 0) / sum(probs[1::2])
-        probs[::2] *= max(1 - fill - sum(weights[::2]), 0) / sum(probs[::2])
-        weights += probs
-        widths = [width * weights[c] for c in range(col * 2 + 1)]
-        heights = [text_size for _ in range(row)]
-        xs = np.cumsum([0] + widths)
-        ys = np.cumsum([0] + heights)
-        layout = []
-        for c in range(col):
-            align = self.align[np.random.randint(len(self.align))]
-            for r in range(row):
-                x, y = xs[c * 2 + 1], ys[r]
-                w, h = xs[c * 2 + 2] - x, ys[r + 1] - y
-                bbox = [left + x, top + y, w, h]
-                layout.append((bbox, align))
-        return layout

synthdog/layouts/grid_stack.py DELETED Viewed

@@ -1,74 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-import numpy as np
-from layouts import Grid
-class GridStack:
-    def __init__(self, config):
-        self.text_scale = config.get("text_scale", [0.05, 0.1])
-        self.max_row = config.get("max_row", 5)
-        self.max_col = config.get("max_col", 3)
-        self.fill = config.get("fill", [0, 1])
-        self.full = config.get("full", 0)
-        self.align = config.get("align", ["left", "right", "center"])
-        self.stack_spacing = config.get("stack_spacing", [0, 0.05])
-        self.stack_fill = config.get("stack_fill", [1, 1])
-        self.stack_full = config.get("stack_full", 0)
-        self._grid = Grid(
-            {
-                "text_scale": self.text_scale,
-                "max_row": self.max_row,
-                "max_col": self.max_col,
-                "align": self.align,
-            }
-        )
-    def generate(self, bbox):
-        left, top, width, height = bbox
-        stack_spacing = np.random.uniform(self.stack_spacing[0], self.stack_spacing[1])
-        stack_spacing *= min(width, height)
-        stack_full = np.random.rand() < self.stack_full
-        stack_fill = np.random.uniform(self.stack_fill[0], self.stack_fill[1])
-        stack_fill = 1 if stack_full else stack_fill
-        full = np.random.rand() < self.full
-        fill = np.random.uniform(self.fill[0], self.fill[1])
-        fill = 1 if full else fill
-        self._grid.fill = [fill, fill]
-        layouts = []
-        line = 0
-        while True:
-            grid_size = (width, height * stack_fill - line)
-            text_scale = np.random.uniform(self.text_scale[0], self.text_scale[1])
-            text_size = min(width, height) * text_scale
-            text_scale = text_size / min(grid_size)
-            self._grid.text_scale = [text_scale, text_scale]
-            layout = self._grid.generate([left, top + line, *grid_size])
-            if layout is None:
-                break
-            line = max(y + h - top for (_, y, _, h), _ in layout) + stack_spacing
-            layouts.append(layout)
-        line = max(line - stack_spacing, 0)
-        space = max(height - line, 0)
-        spaces = np.random.rand(len(layouts) + 1)
-        spaces *= space / sum(spaces) if sum(spaces) > 0 else 0
-        spaces = np.cumsum(spaces)
-        for layout, space in zip(layouts, spaces):
-            for bbox, _ in layout:
-                x, y, w, h = bbox
-                bbox[:] = [x, y + space, w, h]
-        return layouts

synthdog/resources/background/bedroom_83.jpg DELETED Viewed

Binary file (71.6 kB)

synthdog/resources/background/bob+dylan_83.jpg DELETED Viewed

Binary file (418 kB)

synthdog/resources/background/coffee_122.jpg DELETED Viewed

Binary file (58.3 kB)

synthdog/resources/background/coffee_18.jpeg DELETED Viewed

Git LFS Details

SHA256: 3be69b618a13243f755bb686b14cc5ded952d328f3fd06ed0932599aa993e27c
Pointer size: 132 Bytes
Size of remote file: 1.78 MB

synthdog/resources/background/crater_141.jpg DELETED Viewed

Git LFS Details

SHA256: 8993258d37d02a95c3d4de7a25c81af44c86281086631fdd3edfdf8b94f0844b
Pointer size: 132 Bytes
Size of remote file: 1.82 MB

synthdog/resources/background/cream_124.jpg DELETED Viewed

Git LFS Details

SHA256: a12e36c3edbb8eae45ceada56b3e38963398e85618fc582a9910fbdb63156ff9
Pointer size: 132 Bytes
Size of remote file: 2.24 MB

synthdog/resources/background/eagle_110.jpg DELETED Viewed

Binary file (221 kB)

synthdog/resources/background/farm_25.jpg DELETED Viewed

Binary file (704 kB)

synthdog/resources/background/hiking_18.jpg DELETED Viewed

Binary file (515 kB)

synthdog/resources/corpus/enwiki.txt DELETED Viewed

The diff for this file is too large to render. See raw diff

synthdog/resources/corpus/jawiki.txt DELETED Viewed

The diff for this file is too large to render. See raw diff

synthdog/resources/corpus/kowiki.txt DELETED Viewed

The diff for this file is too large to render. See raw diff

synthdog/resources/corpus/zhwiki.txt DELETED Viewed

The diff for this file is too large to render. See raw diff

synthdog/resources/font/en/NotoSans-Regular.ttf DELETED Viewed

Binary file (399 kB)

synthdog/resources/font/en/NotoSerif-Regular.ttf DELETED Viewed

Binary file (375 kB)

synthdog/resources/font/ja/NotoSansJP-Regular.otf DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:47c29251c03bd7731461efd9aff279d04058025c24fc08ed49552aeec20adc6d
-size 4548148

synthdog/resources/font/ja/NotoSerifJP-Regular.otf DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:9a0f0ab1c97dc9b1bb857f3259f5de23c6caa224c14d12878575b0a84676db8f
-size 6169384

synthdog/resources/font/ko/NotoSansKR-Regular.otf DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:2f62e282b5ff3694c09af182d0dfc29d46ce6b85303c0da74f159c098e75991b
-size 4744644

synthdog/resources/font/ko/NotoSerifKR-Regular.otf DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:13196f84ee798b18eddd80077051e5d88ff869696c43200dc54c66807884f74e
-size 7437596

synthdog/resources/font/zh/NotoSansSC-Regular.otf DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:63fdadb47c21197170f3cda6c60e98e481b8a1eb28e5f44102da51bec17d123b
-size 8481960

synthdog/resources/font/zh/NotoSerifSC-Regular.otf DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:66080541a111a7a31179700496013aac4b64a53cc41f570bd21c2628c75e4628
-size 11214568

synthdog/resources/paper/paper_1.jpg DELETED Viewed

Git LFS Details

SHA256: 6be25c214d7772f44cf2406db54de5b75dd085b98c0bbe003f56ae1231a788af
Pointer size: 132 Bytes
Size of remote file: 2.39 MB

synthdog/resources/paper/paper_2.jpg DELETED Viewed

Git LFS Details

SHA256: 323283e8e6210a73223798274949ce083d97c6162860bf13b3bbbf6821796e0d
Pointer size: 132 Bytes
Size of remote file: 1.88 MB

synthdog/resources/paper/paper_3.jpg DELETED Viewed

Git LFS Details

SHA256: 189bda5655f2ef2b63ed07d28a511f716a2e2e7bcdc8efb0def77e80330cb356
Pointer size: 132 Bytes
Size of remote file: 2.52 MB

synthdog/resources/paper/paper_4.jpg DELETED Viewed

Git LFS Details

SHA256: b92e05d77aa06569d9f515205f911df9b48350202a1f4ea8c59a25bd25550f48
Pointer size: 132 Bytes
Size of remote file: 1.92 MB

synthdog/resources/paper/paper_5.jpg DELETED Viewed

Git LFS Details

SHA256: 04235c5a60d58bf27dd1435132bae141adc20439cf5802b6e3348513d1707a6b
Pointer size: 132 Bytes
Size of remote file: 3.35 MB

synthdog/resources/paper/paper_6.jpg DELETED Viewed

Git LFS Details

SHA256: 224b7e7782954e6e23fd1dcde419ead910a09501cd61cdcfb02e40310deda315
Pointer size: 132 Bytes
Size of remote file: 1.69 MB

synthdog/template.py DELETED Viewed

@@ -1,130 +0,0 @@
-"""
-Donut
-Copyright (c) 2022-present NAVER Corp.
-MIT License
-"""
-import json
-import os
-import re
-from typing import Any, List
-import numpy as np
-from elements import Background, Document
-from PIL import Image
-from synthtiger import components, layers, templates
-class SynthDoG(templates.Template):
-    """
-    Template that generates synthetic document images together with their text.
-    ``generate`` composes a background, a paper layer and text layers into one
-    image; ``save`` writes the image as JPEG and appends a ground-truth record to
-    a per-split ``metadata.jsonl`` file (splits: train / validation / test).
-    Args:
-        config: Optional dict. Keys read here (with defaults): "quality"
-            ([50, 95]), "landscape" (0.5), "short_size" ([720, 1024]),
-            "aspect_ratio" ([1, 2]), "background" ({}), "document" ({}),
-            "effect" ({}).
-        split_ratio: Probabilities of assigning a sample to the train,
-            validation and test split, in that order.
-    """
-    def __init__(self, config=None, split_ratio: List[float] = [0.8, 0.1, 0.1]):
-        super().__init__(config)
-        if config is None:
-            config = {}
-        # [min, max] ranges below are sampled inclusively in generate().
-        self.quality = config.get("quality", [50, 95])
-        # Probability that a generated image is landscape-oriented.
-        self.landscape = config.get("landscape", 0.5)
-        self.short_size = config.get("short_size", [720, 1024])
-        self.aspect_ratio = config.get("aspect_ratio", [1, 2])
-        self.background = Background(config.get("background", {}))
-        self.document = Document(config.get("document", {}))
-        # Image-level effects applied to the merged layer; how Iterator/Switch
-        # select among them is defined by synthtiger and the "effect" config.
-        self.effect = components.Iterator(
-            [
-                components.Switch(components.RGB()),
-                components.Switch(components.Shadow()),
-                components.Switch(components.Contrast()),
-                components.Switch(components.Brightness()),
-                components.Switch(components.MotionBlur()),
-                components.Switch(components.GaussianBlur()),
-            ],
-            **config.get("effect", {}),
-        )
-        # config for splits
-        self.splits = ["train", "validation", "test"]
-        # Store a copy so the shared default list (or the caller's list) is never
-        # aliased by instance state.
-        self.split_ratio = list(split_ratio)
-        # Pre-drawn table of split assignments; save() looks a sample up with
-        # idx modulo the table length.
-        self.split_indexes = np.random.choice(3, size=10000, p=self.split_ratio)
-    def generate(self):
-        """
-        Generate one synthetic sample.
-        Returns:
-            dict with keys "image" (rendered output of the merged layer),
-            "label" (all texts joined, whitespace-normalised), "quality"
-            (JPEG quality drawn from ``self.quality``) and "roi" (the paper
-            layer's quad as an integer array).
-        """
-        # NOTE: the order of the np.random calls is kept as-is so that seeded
-        # runs keep producing the same samples.
-        landscape = np.random.rand() < self.landscape
-        short_size = np.random.randint(self.short_size[0], self.short_size[1] + 1)
-        aspect_ratio = np.random.uniform(self.aspect_ratio[0], self.aspect_ratio[1])
-        long_size = int(short_size * aspect_ratio)
-        size = (long_size, short_size) if landscape else (short_size, long_size)
-        bg_layer = self.background.generate(size)
-        paper_layer, text_layers, texts = self.document.generate(size)
-        document_group = layers.Group([*text_layers, paper_layer])
-        # Free space left around the document, clamped at zero; the document is
-        # placed at a random offset inside it.
-        # NOTE(review): relies on document_group.size being array-like so that
-        # ``tuple - size`` broadcasts -- confirm against synthtiger.
-        document_space = np.clip(size - document_group.size, 0, None)
-        document_group.left = np.random.randint(document_space[0] + 1)
-        document_group.top = np.random.randint(document_space[1] + 1)
-        roi = np.array(paper_layer.quad, dtype=int)
-        layer = layers.Group([*document_group.layers, bg_layer]).merge()
-        self.effect.apply([layer])
-        image = layer.output(bbox=[0, 0, *size])
-        # Collapse every run of whitespace into a single space.
-        label = " ".join(texts)
-        label = label.strip()
-        label = re.sub(r"\s+", " ", label)
-        quality = np.random.randint(self.quality[0], self.quality[1] + 1)
-        data = {
-            "image": image,
-            "label": label,
-            "quality": quality,
-            "roi": roi,
-        }
-        return data
-    def init_save(self, root):
-        """Create the output root directory if it does not exist yet."""
-        os.makedirs(root, exist_ok=True)
-    def save(self, root, data, idx):
-        """
-        Write one generated sample to disk.
-        The image goes to ``<root>/<split>/image_<idx>.jpg`` and one JSON line
-        is appended to ``<root>/<split>/metadata.jsonl``.
-        Args:
-            root: Output root directory.
-            data: Sample dict as returned by ``generate``.
-            idx: Sample index; selects the split and names the image file.
-        """
-        image = data["image"]
-        label = data["label"]
-        quality = data["quality"]
-        # split
-        split_idx = self.split_indexes[idx % len(self.split_indexes)]
-        output_dirpath = os.path.join(root, self.splits[split_idx])
-        # Image and metadata share this directory, so create it once.
-        os.makedirs(output_dirpath, exist_ok=True)
-        # save image
-        image_filename = f"image_{idx}.jpg"
-        image_filepath = os.path.join(output_dirpath, image_filename)
-        # Keep only the first three channels before encoding as JPEG.
-        image = Image.fromarray(image[..., :3].astype(np.uint8))
-        image.save(image_filepath, quality=quality)
-        # save metadata (gt_json)
-        metadata_filename = "metadata.jsonl"
-        metadata_filepath = os.path.join(output_dirpath, metadata_filename)
-        metadata = self.format_metadata(image_filename=image_filename, keys=["text_sequence"], values=[label])
-        # ensure_ascii=False emits raw non-ASCII text, so the file encoding must
-        # be pinned to UTF-8 instead of depending on the platform locale.
-        with open(metadata_filepath, "a", encoding="utf-8") as fp:
-            json.dump(metadata, fp, ensure_ascii=False)
-            fp.write("\n")
-    def end_save(self, root):
-        """No-op; nothing needs finalising after the last sample."""
-        pass
-    def format_metadata(self, image_filename: str, keys: List[str], values: List[Any]):
-        """
-        Fit gt_parse contents to huggingface dataset's format
-        keys and values, whose lengths are equal, are used to construct 'gt_parse' field in 'ground_truth' field
-        Args:
-            image_filename: File name stored under "file_name"
-            keys: List of task_name
-            values: List of actual gt data corresponding to each task_name
-        Returns:
-            dict with "file_name" and "ground_truth", the latter being the JSON
-            string of {"gt_parse": {key: value, ...}}
-        """
-        assert len(keys) == len(values), f"Length does not match: keys({len(keys)}), values({len(values)})"
-        gt_parse = {"gt_parse": dict(zip(keys, values))}
-        gt_parse_str = json.dumps(gt_parse, ensure_ascii=False)
-        metadata = {"file_name": image_filename, "ground_truth": gt_parse_str}
-        return metadata