Video-to-Multilingual-OCR

Runtime error

App Files Community

stupidog04 committed on Apr 16, 2023

Commit

97a7e85

•

1 Parent(s): e72880c

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -9

app.py CHANGED Viewed

@@ -10,11 +10,7 @@ import cv2
 import pandas as pd
 from transformers import TrOCRProcessor, VisionEncoderDecoderModel
 import matplotlib.pyplot as plt
-#torch.hub.download_url_to_file('https://github.com/AaronCWacker/Yggdrasil/blob/main/images/BeautyIsTruthTruthisBeauty.JPG', 'BeautyIsTruthTruthisBeauty.JPG')
-#torch.hub.download_url_to_file('https://github.com/AaronCWacker/Yggdrasil/blob/main/images/PleaseRepeatLouder.jpg', 'PleaseRepeatLouder.jpg')
-#torch.hub.download_url_to_file('https://github.com/AaronCWacker/Yggdrasil/blob/main/images/ProhibitedInWhiteHouse.JPG', 'ProhibitedInWhiteHouse.JPG')
 torch.hub.download_url_to_file('https://raw.githubusercontent.com/AaronCWacker/Yggdrasil/master/images/20-Books.jpg','20-Books.jpg')
 torch.hub.download_url_to_file('https://github.com/JaidedAI/EasyOCR/raw/master/examples/english.png', 'COVID.png')
@@ -199,9 +195,26 @@ def inference(video, lang, full_scan, number_filter, use_trocr, time_step, perio
         df_list.append({"Box": f"", "Time (s)": "", "Text": ""})
     df = pd.concat([pd.DataFrame(df_list)])
-    # generate the plot of temporal profile
     plot_fig = plot_temporal_profile(temporal_profiles)
-    return output, im, plot_fig, df
 title = '🖼️Video to Multilingual OCR👁️Gradio'
@@ -240,8 +253,9 @@ gr.Interface(
     [
         gr.outputs.Video(label='Output Video'),
         gr.outputs.Image(label='Output Preview', type='numpy'),
-        gr.Plot(label='Temporal Profile'),
-        gr.outputs.Dataframe(headers=['Box', 'Time (s)', 'Text'], type='pandas',  max_rows=15)
     ],
     title=title,
     description=description,

 import pandas as pd
 from transformers import TrOCRProcessor, VisionEncoderDecoderModel
 import matplotlib.pyplot as plt
+import io
 torch.hub.download_url_to_file('https://raw.githubusercontent.com/AaronCWacker/Yggdrasil/master/images/20-Books.jpg','20-Books.jpg')
 torch.hub.download_url_to_file('https://github.com/JaidedAI/EasyOCR/raw/master/examples/english.png', 'COVID.png')
         df_list.append({"Box": f"", "Time (s)": "", "Text": ""})
     df = pd.concat([pd.DataFrame(df_list)])
+    # Convert the Matplotlib plot to a NumPy array
     plot_fig = plot_temporal_profile(temporal_profiles)
+    buf = io.BytesIO()
+    plot_fig.savefig(buf, format='png')
+    buf.seek(0)
+    plot_image = PIL.Image.open(buf)
+    # Resize the image to fit the width of the returned image
+    im_width, im_height = im.size
+    plot_width, plot_height = plot_image.size
+    new_plot_height = int(plot_height * im_width / plot_width)
+    resized_plot_image = plot_image.resize((im_width, new_plot_height), PIL.Image.ANTIALIAS)
+    # Convert the resized image to a NumPy array
+    plot_np = np.array(resized_plot_image)
+    # Close the buffer
+    buf.close()
+    return output, im, plot_np, df  # Change this line
 title = '🖼️Video to Multilingual OCR👁️Gradio'
     [
         gr.outputs.Video(label='Output Video'),
         gr.outputs.Image(label='Output Preview', type='numpy'),
+        # gr.Plot(label='Temporal Profile'),
+        gr.outputs.Image(label='Temporal Profile', type='numpy'),
+        gr.outputs.Dataframe(headers=['Box', 'Time (s)', 'Text'], type='pandas')
     ],
     title=title,
     description=description,