PDF-Data_Extractor / src /configuration.py
Wasim
Sync: robust vehicle parser + full project
2e237ce
raw
history blame
1.11 kB
import logging
import os
from pathlib import Path
# Directory that contains this module. The path is made absolute *before*
# taking the parent: with a bare relative ``__file__`` (e.g. "configuration.py")
# ``.parent`` is "." and the parent of "." is still ".", which would silently
# drop a directory level.
SRC_PATH = Path(__file__).absolute().parent
# Parent directory of SRC_PATH; the other path constants in this module are
# built relative to it.
ROOT_PATH = SRC_PATH.parent
# Logging setup: drop whatever handlers are currently attached to the root
# logger, then configure it at INFO level with a single stream handler.
handlers = [logging.StreamHandler()]
logging.getLogger().handlers = []
logging.basicConfig(
    handlers=handlers,
    format="%(asctime)s [%(levelname)s] %(message)s",
    level=logging.INFO,
)
# Logger named after this module.
service_logger = logging.getLogger(__name__)
# Boolean flag read from the RESTART_IF_NO_GPU environment variable. It is True
# only when the value, lower-cased and stripped of surrounding whitespace, is
# exactly "true"; an unset variable defaults to "false".
RESTART_IF_NO_GPU = (
    os.getenv("RESTART_IF_NO_GPU", "false").lower().strip() == "true"
)
# Directories and files located under ROOT_PATH.
IMAGES_ROOT_PATH = ROOT_PATH / "images"
WORD_GRIDS_PATH = ROOT_PATH / "word_grids"
JSONS_ROOT_PATH = ROOT_PATH / "jsons"

# OCR working directories, all under ROOT_PATH/ocr.
OCR_SOURCE = ROOT_PATH.joinpath("ocr", "source")
OCR_OUTPUT = ROOT_PATH.joinpath("ocr", "output")
OCR_FAILED = ROOT_PATH.joinpath("ocr", "failed")

# JSON file named "test.json" inside the jsons directory.
JSON_TEST_FILE_PATH = JSONS_ROOT_PATH / "test.json"

MODELS_PATH = ROOT_PATH / "models"
XMLS_PATH = ROOT_PATH / "xmls"
# Maps integer category IDs (1-11) to layout type names.
# NOTE(review): the names appear to follow the DocLayNet dataset's layout
# categories -- confirm against the model/dataset that produces these IDs.
DOCLAYNET_TYPE_BY_ID = dict(
    enumerate(
        (
            "Caption",
            "Footnote",
            "Formula",
            "List_Item",
            "Page_Footer",
            "Page_Header",
            "Picture",
            "Section_Header",
            "Table",
            "Text",
            "Title",
        ),
        start=1,
    )
)