Update app.py
Browse files
app.py
CHANGED
@@ -4,7 +4,7 @@ import gradio as gr
|
|
4 |
from transformers import AutoTokenizer, AutoFeatureExtractor, VisionEncoderDecoderModel
|
5 |
from PIL import Image
|
6 |
import torch
|
7 |
-
import spaces
|
8 |
|
9 |
tokenizer = AutoTokenizer.from_pretrained("kha-white/manga-ocr-base")
|
10 |
|
@@ -26,7 +26,9 @@ def post_process(text):
|
|
26 |
def manga_ocr(img):
|
27 |
img = img.convert('L').convert('RGB')
|
28 |
pixel_values = feature_extractor(img, return_tensors="pt").pixel_values.to("cuda")
|
|
|
29 |
output = model.generate(pixel_values)[0]
|
|
|
30 |
text = tokenizer.decode(output, skip_special_tokens=True)
|
31 |
text = post_process(text)
|
32 |
return text
|
|
|
4 |
from transformers import AutoTokenizer, AutoFeatureExtractor, VisionEncoderDecoderModel
|
5 |
from PIL import Image
|
6 |
import torch
|
7 |
+
import spaces, time
|
8 |
|
9 |
tokenizer = AutoTokenizer.from_pretrained("kha-white/manga-ocr-base")
|
10 |
|
|
|
26 |
def manga_ocr(img):
|
27 |
img = img.convert('L').convert('RGB')
|
28 |
pixel_values = feature_extractor(img, return_tensors="pt").pixel_values.to("cuda")
|
29 |
+
start_time = time.time()
|
30 |
output = model.generate(pixel_values)[0]
|
31 |
+
print("Time taken for OCR:", time.time() - start_time)
|
32 |
text = tokenizer.decode(output, skip_special_tokens=True)
|
33 |
text = post_process(text)
|
34 |
return text
|