Update app.py
Browse files
app.py
CHANGED
@@ -80,21 +80,21 @@ processortext2 = CustomOCRProcessor(image_processor,tokenizer)
|
|
80 |
import os
|
81 |
huggingface_token = os.environ.get("HUGGINGFACE_TOKEN")
|
82 |
model = {}
|
83 |
-
model['single-urdu'] =
|
84 |
-
model['multi-urdu'] =
|
85 |
-
model['medical'] =
|
86 |
-
model['chinese'] =
|
87 |
|
88 |
st.title("Image OCR with musadac/vilanocr")
|
89 |
model_name = st.selectbox("Choose an OCR model", ["single-urdu", "multi-urdu", "medical","chinese" ])
|
90 |
uploaded_file = st.file_uploader("Choose an image", type=["jpg", "jpeg", "png"])
|
91 |
if uploaded_file is not None:
|
92 |
-
|
93 |
img = Image.open(uploaded_file).convert("RGB")
|
94 |
pixel_values = processortext2(img.convert("RGB"), return_tensors="pt").pixel_values
|
95 |
|
96 |
with torch.no_grad():
|
97 |
-
generated_ids =
|
98 |
|
99 |
result = processortext2.batch_decode(generated_ids, skip_special_tokens=True)[0]
|
100 |
st.write("OCR Result:")
|
|
|
80 |
import os
|
81 |
huggingface_token = os.environ.get("HUGGINGFACE_TOKEN")
|
82 |
model = {}
|
83 |
+
model['single-urdu'] = "musadac/vilanocr-single-urdu"
|
84 |
+
model['multi-urdu'] = "musadac/ViLanOCR"
|
85 |
+
model['medical'] = "musadac/vilanocr-multi-medical"
|
86 |
+
model['chinese'] = "musadac/vilanocr-single-chinese"
|
87 |
|
88 |
st.title("Image OCR with musadac/vilanocr")
|
89 |
model_name = st.selectbox("Choose an OCR model", ["single-urdu", "multi-urdu", "medical","chinese" ])
|
90 |
uploaded_file = st.file_uploader("Choose an image", type=["jpg", "jpeg", "png"])
|
91 |
if uploaded_file is not None:
|
92 |
+
model2 = VisionEncoderDecoderModel.from_pretrained(model[model_name], use_auth_token=huggingface_token)
|
93 |
img = Image.open(uploaded_file).convert("RGB")
|
94 |
pixel_values = processortext2(img.convert("RGB"), return_tensors="pt").pixel_values
|
95 |
|
96 |
with torch.no_grad():
|
97 |
+
generated_ids = model2.generate(pixel_values)
|
98 |
|
99 |
result = processortext2.batch_decode(generated_ids, skip_special_tokens=True)[0]
|
100 |
st.write("OCR Result:")
|