landify-cccd-ocr

Sleeping

App Files Community

anh-khoa-nguyen committed on Sep 14, 2025

Commit

8bf9be8

1 Parent(s): 481efa8

hotfix...

Browse files

Files changed (14) hide show

.gitattributes +2 -0
app.py +104 -73
core/extractor.py +9 -4
models/cls/ch_ppocr_mobile_v2.0_cls_infer/._inference.pdmodel +3 -0
models/cls/ch_ppocr_mobile_v2.0_cls_infer/inference.pdiparams +3 -0
models/cls/ch_ppocr_mobile_v2.0_cls_infer/inference.pdiparams.info +0 -0
models/cls/ch_ppocr_mobile_v2.0_cls_infer/inference.pdmodel +3 -0
models/det/en_PP-OCRv3_det_infer/inference.pdiparams +3 -0
models/det/en_PP-OCRv3_det_infer/inference.pdiparams.info +0 -0
models/det/en_PP-OCRv3_det_infer/inference.pdmodel +3 -0
models/rec/en_PP-OCRv3_rec_infer.tar +3 -0
models/rec/en_PP-OCRv3_rec_infer/inference.pdiparams +3 -0
models/rec/en_PP-OCRv3_rec_infer/inference.pdiparams.info +0 -0
models/rec/en_PP-OCRv3_rec_infer/inference.pdmodel +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.pdiparams filter=lfs diff=lfs merge=lfs -text
+*.pdmodel filter=lfs diff=lfs merge=lfs -text

app.py CHANGED Viewed

@@ -1,49 +1,73 @@
 import base64
-import datetime
 import os
 import re
 import time
 import uuid
 import cv2
 from fastapi import FastAPI, File, UploadFile, HTTPException
 from pydantic import BaseModel
-from typing import Optional
-# Import lớp Extractor từ thư mục core
-from core.extractor import Extractor
-# --- Khởi tạo ---
-# Khởi tạo ứng dụng FastAPI
 app = FastAPI(
-    title="CCCD Extraction API",
-    description="Một microservice để trích xuất thông tin từ Căn cước công dân Việt Nam.",
-    version="1.0.0"
 )
-# Đường dẫn để lưu trữ file upload
-UPLOAD_DIR = "uploads"
-os.makedirs(UPLOAD_DIR, exist_ok=True)
-# Khởi tạo một lần duy nhất đối tượng Extractor để tái sử dụng
-# Điều này giúp load model một lần và tăng tốc độ xử lý cho các request sau
-try:
-    idcard_extractor = Extractor()
-    print("CCCD Extractor loaded successfully.")
-except Exception as e:
-    print(f"Error loading CCCD Extractor: {e}")
-    idcard_extractor = None
-# --- Định nghĩa Model cho Request và Response ---
-# Model cho request nếu gửi ảnh dạng base64
-class ImageRequest(BaseModel):
-    image_base64: str
-# Model cho response trả về
 class ExtractionResponse(BaseModel):
     ID_number: Optional[str] = None
     Name: Optional[str] = None
@@ -52,91 +76,98 @@ class ExtractionResponse(BaseModel):
     Nationality: Optional[str] = None
     Place_of_origin: Optional[str] = None
     Place_of_residence: Optional[str] = None
     elapsed: float
-# --- Xây dựng API Endpoint ---
 @app.get("/")
 def read_root():
-    return {"message": "Welcome to the CCCD Extraction API. Use the /extract/ endpoint to process an image."}
 @app.post("/extract/", response_model=ExtractionResponse, tags=["CCCD Extraction"])
 async def extract_id_card_info(file: UploadFile = File(...)):
     """
-    Nhận một file ảnh CCCD, trích xuất thông tin và trả về.
     """
-    if not idcard_extractor:
-        raise HTTPException(status_code=500, detail="OCR Extractor is not available.")
-    # --- 1. Lưu file ảnh được upload ---
-    # Tạo tên file ngẫu nhiên và an toàn để tránh trùng lặp
-    file_extension = os.path.splitext(file.filename)[1]
-    random_filename = f"{uuid.uuid4()}{file_extension}"
-    file_path = os.path.join(UPLOAD_DIR, random_filename)
     try:
-        # Đọc nội dung file và lưu lại
         with open(file_path, "wb") as buffer:
             buffer.write(await file.read())
-    except Exception as e:
-        raise HTTPException(status_code=500, detail=f"Could not save uploaded file: {e}")
-    # --- 2. Xử lý ảnh và trích xuất thông tin (logic từ Django view) ---
-    start_time = time.time()
-    try:
         frame = cv2.imread(file_path)
         if frame is None:
             raise HTTPException(status_code=400, detail="Invalid image file.")
-        # Bước 1: Dùng PaddleOCR để phát hiện các vùng văn bản
         annotations = idcard_extractor.Detection(frame)
         info = {}
-        # Tìm số CCCD trước tiên
         for box in annotations:
             text_detected = box[1][0]
-            if re.search(r'\d{9,12}', text_detected):
-                # Tách số ra khỏi chuỗi nhiễu
-                id_number = re.search(r'\d{9,12}', text_detected).group(0)
-                info['ID_number'] = id_number
                 info['ID_number_box'] = box[0]
                 break
         if 'ID_number' not in info:
-            raise HTTPException(status_code=400, detail="Could not detect an ID number in the image.")
-        # Bước 2: Dùng VietOCR để nhận dạng các trường thông tin còn lại
         extracted_result = []
         for box in annotations:
-            # Bỏ qua vùng chứa số ID đã xử lý
-            if re.search(r'\d{9,12}', box[1][0]):
-                continue
-            top_left = (int(box[0][0][0]), int(box[0][0][1]))
-            top_right = (int(box[0][1][0]), int(box[0][1][1]))
-            bottom_right = (int(box[0][2][0]), int(box[0][2][1]))
-            bottom_left = (int(box[0][3][0]), int(box[0][3][1]))
-            # Warp và nhận dạng
             result_text, _ = idcard_extractor.WarpAndRec(frame, top_left, top_right, bottom_right, bottom_left)
-            extracted_result.append((result_text, box[0]))  # Lưu cả text và bounding box
-        # Bước 3: Tổng hợp thông tin
         final_info = idcard_extractor.GetInformationAndSave(extracted_result, info['ID_number'], info['ID_number_box'])
         elapsed = time.time() - start_time
         final_info["elapsed"] = round(elapsed, 2)
-        # Xóa file tạm sau khi xử lý xong
-        os.remove(file_path)
         return final_info
     except Exception as e:
-        # Nếu có lỗi, cũng xóa file tạm
         if os.path.exists(file_path):
-            os.remove(file_path)
-        raise HTTPException(status_code=500, detail=f"An error occurred during processing: {str(e)}")

+# app.py
 import base64
 import os
 import re
 import time
 import uuid
+import threading
+from typing import Optional
 import cv2
+import numpy as np
 from fastapi import FastAPI, File, UploadFile, HTTPException
 from pydantic import BaseModel
+# --- KHỞI TẠO ỨNG DỤNG VÀ CÁC BIẾN TOÀN CỤC ---
 app = FastAPI(
+    title="Vietnamese Citizen ID OCR & Face Extraction API",
+    description="Một microservice để trích xuất thông tin và cắt ảnh chân dung từ CCCD. Sử dụng Lazy Loading cho model.",
+    version="1.3.0-lazyload-packaged"
 )
+# Khởi tạo các biến model toàn cục là None. Chúng sẽ được tải sau.
+idcard_extractor = None
+face_cascade = None
+model_lock = threading.Lock()  # Lock để đảm bảo model chỉ được tải 1 lần trong môi trường đa luồng
+# --- HÀM TẢI MODEL (LAZY LOADING) ---
+def load_models():
+    """
+    Hàm này chỉ được gọi một lần duy nhất khi có request đầu tiên.
+    Nó tải tất cả các model AI nặng vào bộ nhớ.
+    """
+    global idcard_extractor, face_cascade
+    # Sử dụng lock để ngăn chặn nhiều request cùng lúc cố gắng tải model (race condition)
+    with model_lock:
+        # Kiểm tra lại một lần nữa bên trong lock, nếu một luồng khác đã tải xong thì bỏ qua.
+        if idcard_extractor is None:
+            print("--- LAZY LOADING MODELS (FIRST REQUEST) ---")
+            try:
+                # Import Extractor ngay tại đây, không import ở đầu file
+                from core.extractor import Extractor
+                # 1. Tải model OCR (sẽ đọc từ các file cục bộ trong thư mục /models)
+                print("Loading OCR models...")
+                idcard_extractor = Extractor()
+                print("CCCD Text Extractor loaded successfully.")
+                # 2. Tải model nhận diện khuôn mặt
+                print("Loading face detection model...")
+                face_cascade_path = os.path.join(cv2.data.haarcascades, 'haarcascade_frontalface_default.xml')
+                if not os.path.exists(face_cascade_path):
+                    raise FileNotFoundError("Không tìm thấy file haarcascade.")
+                face_cascade = cv2.CascadeClassifier(face_cascade_path)
+                print("Face cascade classifier loaded successfully.")
+            except Exception as e:
+                print(f"FATAL: Error during model loading: {e}")
+                # Đặt lại thành None để các request sau biết rằng model đã tải thất bại
+                idcard_extractor = None
+                face_cascade = None
+            print("--- MODEL LOADING COMPLETE ---")
+# --- ĐỊNH NGHĨA MODEL CHO RESPONSE ---
 class ExtractionResponse(BaseModel):
     ID_number: Optional[str] = None
     Name: Optional[str] = None
     Nationality: Optional[str] = None
     Place_of_origin: Optional[str] = None
     Place_of_residence: Optional[str] = None
+    portrait_image_base64: Optional[str] = None
     elapsed: float
+# --- API ENDPOINT ---
 @app.get("/")
 def read_root():
+    return {"message": "Welcome to the CCCD Extraction API. POST to /extract/ to process an image."}
 @app.post("/extract/", response_model=ExtractionResponse, tags=["CCCD Extraction"])
 async def extract_id_card_info(file: UploadFile = File(...)):
     """
+    Nhận ảnh CCCD, trích xuất thông tin và cắt ảnh chân dung.
+    Tải các model AI nếu đây là request đầu tiên.
     """
+    # Bước 1: Tải model nếu chưa có
+    # Nếu model đã được tải, hàm này sẽ bỏ qua rất nhanh.
+    load_models()
+    # Kiểm tra xem model đã được tải thành công chưa
+    if not idcard_extractor or not face_cascade:
+        raise HTTPException(status_code=503,
+                            detail="Server is starting or models failed to load. Please try again in a moment.")
+    # Bước 2: Tạo thư mục upload tạm thời trong /tmp và xác định đường dẫn file
+    upload_dir = "/tmp/uploads"
+    os.makedirs(upload_dir, exist_ok=True)
+    file_path = os.path.join(upload_dir, f"{uuid.uuid4()}{os.path.splitext(file.filename)[1]}")
+    start_time = time.time()
     try:
+        # Bước 3: Lưu file ảnh được upload
         with open(file_path, "wb") as buffer:
             buffer.write(await file.read())
         frame = cv2.imread(file_path)
         if frame is None:
             raise HTTPException(status_code=400, detail="Invalid image file.")
+        # Bước 4: Nhận diện và cắt ảnh chân dung
+        gray_image = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+        gray_image = cv2.equalizeHist(gray_image)
+        faces = face_cascade.detectMultiScale(gray_image, scaleFactor=1.1, minNeighbors=5, minSize=(80, 80))
+        portrait_base64 = None
+        if len(faces) > 0:
+            faces = sorted(faces, key=lambda f: f[2] * f[3], reverse=True)
+            (x, y, w, h) = faces[0]
+            padding_y, padding_x = int(h * 0.2), int(w * 0.2)
+            portrait_img = frame[max(0, y - padding_y):min(frame.shape[0], y + h + padding_y),
+                           max(0, x - padding_x):min(frame.shape[1], x + w + padding_x)]
+            _, buffer = cv2.imencode('.jpg', portrait_img)
+            portrait_base64 = base64.b64encode(buffer).decode('utf-8')
+        # Bước 5: Trích xuất thông tin văn bản
         annotations = idcard_extractor.Detection(frame)
         info = {}
         for box in annotations:
             text_detected = box[1][0]
+            id_match = re.search(r'\d{9,12}', text_detected)
+            if id_match:
+                info['ID_number'] = id_match.group(0)
                 info['ID_number_box'] = box[0]
                 break
         if 'ID_number' not in info:
+            raise HTTPException(status_code=400, detail="Could not detect ID number.")
         extracted_result = []
         for box in annotations:
+            if re.search(r'\d{9,12}', box[1][0]): continue
+            top_left, top_right, bottom_right, bottom_left = (
+            tuple(map(int, box[0][0])), tuple(map(int, box[0][1])), tuple(map(int, box[0][2])),
+            tuple(map(int, box[0][3])))
             result_text, _ = idcard_extractor.WarpAndRec(frame, top_left, top_right, bottom_right, bottom_left)
+            extracted_result.append((result_text, box[0]))
+        # Bước 6: Tổng hợp kết quả và trả về
         final_info = idcard_extractor.GetInformationAndSave(extracted_result, info['ID_number'], info['ID_number_box'])
         elapsed = time.time() - start_time
         final_info["elapsed"] = round(elapsed, 2)
+        final_info["portrait_image_base64"] = portrait_base64
         return final_info
     except Exception as e:
+        # Ghi lại lỗi chi tiết vào log của server để gỡ lỗi
+        print(f"Error during extraction: {e}")
+        raise HTTPException(status_code=500, detail=f"An error occurred during processing: {str(e)}")
+    finally:
+        # Bước 7: Dọn dẹp file tạm sau khi xử lý xong
         if os.path.exists(file_path):
+            os.remove(file_path)

core/extractor.py CHANGED Viewed

@@ -26,10 +26,15 @@ class Extractor:
         self.config['cnn']['pretrained'] = False
         self.config['device'] = 'cpu'
-        if (ocr == None):
-            self.ocr = PaddleOCR(lang='en', use_gpu=False, ocr_version='PP-OCRv3', det_model_dir='/tmp/.paddleocr/det', rec_model_dir='/tmp/.paddleocr/rec', cls_model_dir='/tmp/.paddleocr/cls')
-        else:
-            self.ocr = ocr
         if (detector == None):
             self.detector = Predictor(self.config)
         else:

         self.config['cnn']['pretrained'] = False
         self.config['device'] = 'cpu'
+        self.ocr = PaddleOCR(
+            lang='en',
+            use_gpu=False,
+            ocr_version='PP-OCRv3',
+            det_model_dir='./models/det/en_PP-OCRv3_det_infer/',
+            rec_model_dir='./models/rec/en_PP-OCRv3_rec_infer/',
+            cls_model_dir='./models/cls/ch_ppocr_mobile_v2.0_cls_infer/'
+        )
         if (detector == None):
             self.detector = Predictor(self.config)
         else:

models/cls/ch_ppocr_mobile_v2.0_cls_infer/._inference.pdmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d86f5afbfb8cd933a1d0dbbfd8ff2b93ca3eacc6c45f4590a4a2ee107047f6d2
+size 176

models/cls/ch_ppocr_mobile_v2.0_cls_infer/inference.pdiparams ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d1efda1b80e174b4fcb168a035ac96c1af4938892bd86a55f300a6027105d08c
+size 539978

models/cls/ch_ppocr_mobile_v2.0_cls_infer/inference.pdiparams.info ADDED Viewed

Binary file (18.5 kB). View file

models/cls/ch_ppocr_mobile_v2.0_cls_infer/inference.pdmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3c4337ec61722a20b1dca2e5bfaffc313c0592bc89ad6e0d45168224186f6683
+size 1624487

models/det/en_PP-OCRv3_det_infer/inference.pdiparams ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:83676ec730627ab4502f401410a4b6a3ce1c0bb98fa249b71db055b6bddae051
+size 2377917

models/det/en_PP-OCRv3_det_infer/inference.pdiparams.info ADDED Viewed

Binary file (26.4 kB). View file

models/det/en_PP-OCRv3_det_infer/inference.pdmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4bfb1b05d9d1d5a760801eaf6d20180ef7e47bcc675fb17d1f3a89da5fef427
+size 1590133

models/rec/en_PP-OCRv3_rec_infer.tar ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94402088520ae3938c51eb8782da1cd7c1bc46d5531766de99f77ee9c2f23343
+size 9963520

models/rec/en_PP-OCRv3_rec_infer/inference.pdiparams ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2cea2de604d8a75fd9151b54ea2dd027659fb8cb777cde377224581110dbff13
+size 8916816

models/rec/en_PP-OCRv3_rec_infer/inference.pdiparams.info ADDED Viewed

Binary file (22 kB). View file

models/rec/en_PP-OCRv3_rec_infer/inference.pdmodel ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f0288362f754e815030929477f7b1f96fe2e913e197537288a01bd43f768d0ab
+size 1020915