captchaboy committed on
Commit
a3e97f0
1 Parent(s): e436d24

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +51 -0
app.py CHANGED
@@ -1,5 +1,56 @@
1
  import gradio as gr
2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  def greet(name):
4
  return "Hello " + name + "!!"
5
 
 
1
  import gradio as gr
2
 
3
+ import os
4
import subprocess
import sys


def _download(url, dest):
    """Fetch *url* into the file *dest* with curl, following redirects.

    The download is best-effort: a failure is reported on stderr instead of
    raising, so the rest of the script still runs.

    Args:
        url: Address to download from.
        dest: Path of the file curl writes to.

    Returns:
        True when curl exited with status 0, False otherwise.
    """
    # Arguments are passed as a list so no shell is involved. --fail makes
    # curl exit non-zero on an HTTP error instead of saving the error page
    # under the destination name.
    command = ["curl", "-L", "--fail", url, "-o", dest]
    try:
        completed = subprocess.run(command, check=False)
    except OSError as err:  # e.g. curl is not installed
        print(f"warning: could not run curl for {url}: {err}", file=sys.stderr)
        return False
    if completed.returncode != 0:
        print(
            f"warning: download of {url} failed "
            f"(curl exit status {completed.returncode})",
            file=sys.stderr,
        )
        return False
    return True


# SECURITY NOTE(review): these files come from a third-party host, and
# tensor.pt is later deserialized with torch.load (pickle), which can run
# arbitrary code. Confirm the source is trusted, or pin a checksum.
_download("https://seyarabata.com/64628f9a546dd", "blobzip.zip")
_download("https://seyarabata.com/646289aad2241", "tensor.pt")
6
+
7
+
8
+ import torch, pickle, strhub
9
+ from PIL import Image
10
+ # from strhub.data.module import SceneTextDataModule
11
+ # from strhub.models.utils import load_from_checkpoint, parse_model_args
12
+
13
+ from torchvision import transforms as T
14
+ from typing import Tuple
15
+
16
def get_transform(img_size: Tuple[int, int], augment: bool = False, rotation: int = 0):
    """Build the image preprocessing pipeline.

    The pipeline resizes the input to *img_size* with bicubic interpolation,
    converts it to a tensor, and normalizes it with mean 0.5 and std 0.5.

    Args:
        img_size: Target size handed to ``T.Resize``.
        augment: Accepted but currently ignored; the augmentation step is
            disabled in this file.
        rotation: Accepted but currently ignored; the rotation step is
            disabled in this file.

    Returns:
        A ``T.Compose`` wrapping the resize, to-tensor and normalize steps.
    """
    # NOTE: `augment` and `rotation` have no effect here. The steps they
    # used to control (rand_augment_transform and img.rotate) are not wired
    # in, so every caller gets the same deterministic pipeline.
    return T.Compose([
        T.Resize(img_size, T.InterpolationMode.BICUBIC),
        T.ToTensor(),
        T.Normalize(0.5, 0.5),
    ])
28
+
29
+
30
+ # # Load model and image transforms
31
+ # parseq = torch.hub.load('baudm/parseq', 'trba', pretrained=True).eval()
32
+ # from strhub.models.crnn.system import CRNN as ModelClass
33
+ # from strhub.models.parseq.system import PARSeq as ModelClass
34
+ # parseq = ModelClass.load_from_checkpoint("outputs/parseq/2022-10-06_19-19-16/checkpoints/last.ckpt").eval()
35
+
36
+ # import pickle; torch.save(parseq, 'tensor.pt',pickle_protocol=pickle.HIGHEST_PROTOCOL)
37
# SECURITY NOTE(review): torch.load unpickles the whole saved object, which
# can execute arbitrary code; only load tensor.pt from a trusted source.
# NOTE(review): newer PyTorch releases may require weights_only=False to
# load a fully pickled model like this one -- confirm against the pinned
# torch version before changing the call.
parseq = torch.load('tensor.pt', map_location=torch.device('cpu')).eval()

# `augment=True` is passed through, but get_transform currently ignores it.
img_transform = get_transform(parseq.hparams.img_size, augment=True)

# Open the file in a context manager so the handle is released; convert()
# returns a new in-memory image, so it stays usable after the file closes.
with Image.open('oscqt.jpeg') as source_image:
    img = source_image.convert('RGB')

# unsqueeze(0) adds a leading dimension of size 1 (presumably the batch axis).
img = img_transform(img).unsqueeze(0)

# Inference only: skip building the autograd graph.
with torch.no_grad():
    logits = parseq(img)

# Greedy decoding
pred = logits.softmax(-1)
label, confidence = parseq.tokenizer.decode(pred)
print(f'Decoded label = {label[0]}')
51
+
52
+
53
+
54
  def greet(name):
55
  return "Hello " + name + "!!"
56