Spaces:
Runtime error
Runtime error
DerrylNessie
committed on
Commit
•
09e6484
1
Parent(s):
86cf33d
Update app.py
Browse files
app.py
CHANGED
@@ -4,7 +4,10 @@ import gradio as gr
|
|
4 |
from transformers import AutoTokenizer, AutoFeatureExtractor, VisionEncoderDecoderModel
|
5 |
from PIL import Image
|
6 |
import torch
|
7 |
-
|
|
|
|
|
|
|
8 |
|
9 |
tokenizer = AutoTokenizer.from_pretrained("kha-white/manga-ocr-base")
|
10 |
|
@@ -22,7 +25,10 @@ def post_process(text):
|
|
22 |
return text
|
23 |
|
24 |
def manga_ocr(img):
|
25 |
-
|
|
|
|
|
|
|
26 |
pixel_values = feature_extractor(img, return_tensors="pt").pixel_values
|
27 |
output = model.generate(pixel_values)[0]
|
28 |
text = tokenizer.decode(output, skip_special_tokens=True)
|
|
|
4 |
from transformers import AutoTokenizer, AutoFeatureExtractor, VisionEncoderDecoderModel
|
5 |
from PIL import Image
|
6 |
import torch
|
7 |
+
import os
|
8 |
+
os.system('pip install paddlepaddle')
|
9 |
+
os.system('pip install paddleocr')
|
10 |
+
from paddleocr import PaddleOCR, draw_ocr
|
11 |
|
12 |
tokenizer = AutoTokenizer.from_pretrained("kha-white/manga-ocr-base")
|
13 |
|
|
|
25 |
return text
|
26 |
|
27 |
def manga_ocr(img):
|
28 |
+
ocr = PaddleOCR(use_angle_cls=True, lang='japan',use_gpu=False)
|
29 |
+
img_path = img.name
|
30 |
+
result = ocr.ocr(img_path, cls=True)
|
31 |
+
image = Image.open(img_path).convert('RGB')
|
32 |
pixel_values = feature_extractor(img, return_tensors="pt").pixel_values
|
33 |
output = model.generate(pixel_values)[0]
|
34 |
text = tokenizer.decode(output, skip_special_tokens=True)
|