DerrylNessie committed on
Commit
09e6484
1 Parent(s): 86cf33d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -2
app.py CHANGED
@@ -4,7 +4,10 @@ import gradio as gr
4
  from transformers import AutoTokenizer, AutoFeatureExtractor, VisionEncoderDecoderModel
5
  from PIL import Image
6
  import torch
7
-
 
 
 
8
 
9
  tokenizer = AutoTokenizer.from_pretrained("kha-white/manga-ocr-base")
10
 
@@ -22,7 +25,10 @@ def post_process(text):
22
  return text
23
 
24
  def manga_ocr(img):
25
- img = img.convert('L').convert('RGB')
 
 
 
26
  pixel_values = feature_extractor(img, return_tensors="pt").pixel_values
27
  output = model.generate(pixel_values)[0]
28
  text = tokenizer.decode(output, skip_special_tokens=True)
 
4
  from transformers import AutoTokenizer, AutoFeatureExtractor, VisionEncoderDecoderModel
5
  from PIL import Image
6
  import torch
7
+ import os
8
+ os.system('pip install paddlepaddle')
9
+ os.system('pip install paddleocr')
10
+ from paddleocr import PaddleOCR, draw_ocr
11
 
12
  tokenizer = AutoTokenizer.from_pretrained("kha-white/manga-ocr-base")
13
 
 
25
  return text
26
 
27
  def manga_ocr(img):
28
+ ocr = PaddleOCR(use_angle_cls=True, lang='japan',use_gpu=False)
29
+ img_path = img.name
30
+ result = ocr.ocr(img_path, cls=True)
31
+ image = Image.open(img_path).convert('RGB')
32
  pixel_values = feature_extractor(img, return_tensors="pt").pixel_values
33
  output = model.generate(pixel_values)[0]
34
  text = tokenizer.decode(output, skip_special_tokens=True)