Spaces:

pirahansiah
/

ComputerVision

Build error

App Files Files Community

pirahansiah committed on Aug 5, 2023

Commit

598166e

1 Parent(s): 349bd07

update thresholding methods

Browse files

Files changed (8) hide show

.vscode/launch.json +16 -0
__pycache__/Thresholding_interface.cpython-310.pyc +0 -0
__pycache__/threshold.cpython-310.pyc +0 -0
__pycache__/threshold_methods.cpython-310.pyc +0 -0
app.py +23 -43
huggingface.png +0 -0
image_0.png +0 -0
threshold_methods.py +303 -0

.vscode/launch.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+    // Use IntelliSense to learn about possible attributes.
+    // Hover to view descriptions of existing attributes.
+    // For more information, visit: https://go.microsoft.com/fwlink/?linkid=830387
+    "version": "0.2.0",
+    "configurations": [
+        {
+            "name": "Python: Current File",
+            "type": "python",
+            "request": "launch",
+            "program": "${file}",
+            "console": "integratedTerminal",
+            "justMyCode": true
+        }
+    ]
+}

__pycache__/Thresholding_interface.cpython-310.pyc ADDED Viewed

Binary file (5.82 kB). View file

__pycache__/threshold.cpython-310.pyc ADDED Viewed

Binary file (5.81 kB). View file

__pycache__/threshold_methods.cpython-310.pyc ADDED Viewed

Binary file (3.36 kB). View file

app.py CHANGED Viewed

@@ -1,50 +1,30 @@
 import gradio as gr
 import cv2
-import requests
-import os
-#pirahansiah/ComputerVision
-from ultralytics import YOLO
-file_urls = [
-    'https://onedrive.live.com/embed?resid=CEE9ECC964C491B8%2123411&authkey=%21AFboK-sTQYxPuQo'
 ]
-def download_file(url, save_name):
-    url = url
-    if not os.path.exists(save_name):
-        file = requests.get(url)
-        open(save_name, 'wb').write(file.content)
-for i, url in enumerate(file_urls):
-    download_file(
-        file_urls[i],
-        f"image_{i}.png"
-    )
-path  = [['image_0.png']]
-def show_preds_image(image_path):
-    image = cv2.imread(image_path,0)
-    return image #cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
-inputs_image = [
-    gr.components.Image(type="filepath", label="Input Image"),
-]
-outputs_image = [
-    gr.components.Image(type="numpy", label="Output Image"),
-]
-interface_image = gr.Interface(
-    fn=show_preds_image,
-    inputs=inputs_image,
-    outputs=outputs_image,
-    title="Computer Vision and Deep Learning by Farshid PirahanSiah",
-    examples=path,
-    cache_examples=False,
 )
 gr.TabbedInterface(
-    [interface_image],
-    tab_names=['Image Processing']
-).queue().launch(share=True)

 import gradio as gr
+from threshold_methods import threshold_methods
 import cv2
+new_outputs = [
+gr.outputs.Image(type="numpy", label="Output Image")
 ]
+def show_image():
+    img = cv2.imread('huggingface.png')
+    return img
+HuggingFace = gr.Interface(
+    fn=show_image,
+    live=True,
+    inputs=[],
+    outputs=new_outputs,
+    hide_controls=True,
+    hide_inputs=True,
+    show_submit_buttom=False,
+    show_clear=False,
+    show_generate=False,
+    allow_flagging=False,
+    title="https://huggingface.co/spaces/pirahansiah/ComputerVision",
 )
+# Combine the banner interface and the thresholding interface into one
+# tabbed app (tab_names are listed in the same order as the interfaces),
+# enable the request queue, then start the server.
 gr.TabbedInterface(
+    [HuggingFace,threshold_methods],
+    tab_names=['HuggingFace','Thresholding Image Segmentation']
+).queue().launch()

huggingface.png ADDED Viewed

image_0.png ADDED Viewed

threshold_methods.py ADDED Viewed

	@@ -0,0 +1,303 @@

+import cv2
+import numpy as np
+import gradio as gr
+def pirahansiah_threshold_method_find_threshold_values_2(grayImg):
+    #http://www.jatit.org/volumes/Vol95No21/1Vol95No21.pdf
+    #https://pdfs.semanticscholar.org/05b2/d39fce4e8a99897e95f8c75416f65a5a0acc.pdf
+    assert grayImg is not None, "file could not be read, check with os.path.exists()"
+    #img = cv2.GaussianBlur(self.grayImg, (3, 3), 0)
+    img = grayImg
+    # Initialize an array to store the PSNR values for each threshold value
+    psnr_values = np.zeros(256)
+    psnr_max=0
+    th=0
+    # Iterate over all possible threshold values with a step size of 5
+    for t in range(0, 256, 5):
+        # Threshold the image using the current threshold value
+        _, binary = cv2.threshold(img, t, 255, cv2.THRESH_BINARY)
+        # Calculate the PSNR between the binary image and the original image
+        psnr = cv2.PSNR(binary, img)
+        # Store the PSNR value
+        psnr_values[t] = psnr
+        if (psnr_max<psnr):
+            psnr_max=psnr
+            th=t
+    # Calculate the mean PSNR value
+    mean_psnr = np.mean(psnr_values)
+    th=int(th/mean_psnr)
+    # Find the threshold values that satisfy the condition
+    thresh = th #np.argwhere((mean_psnr / k1 < psnr_values) & (psnr_values < mean_psnr / k2)).flatten()
+    return thresh
+def pirahansiah_threshold_method_find_threshold_values_1(grayImg):
+    #https://www.jatit.org/volumes/Vol57No2/4Vol57No2.pdf
+    assert grayImg is not None, "file could not be read, check with os.path.exists()"
+    gray = cv2.GaussianBlur(grayImg, (3, 3), 0)
+    max1=0
+    max2=0
+    # Iterate over all possible threshold values
+    for t in range(0, 256, 10):
+        # Threshold the image using the current threshold value
+        _, binary = cv2.threshold(gray, t, 255, cv2.THRESH_BINARY)
+        # Find the contours in the binary image
+        contours, hierarchy = cv2.findContours(binary, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
+        if max1<=len(contours):
+            max1=len(contours)
+            max2=t
+    threshold_values =max2
+    return threshold_values
+path  = [['image_0.png']]
+inputs_thresh = [
+gr.inputs.Image(type="filepath", label="Input Image"),
+gr.components.Slider(label="Manual Threshold Value", value=125, minimum=10, maximum=255, step=5),
+gr.inputs.Radio(label="Threshold Methods",
+                choices=[
+                        "cv2.threshold(grayImg, 128, 255, cv2.THRESH_BINARY)"
+                        ,"cv2.threshold(grayImg, 128, 255, cv2.THRESH_BINARY_INV)"
+                        ,"cv2.threshold(grayImg, 128, 255, cv2.THRESH_TRUNC)"
+                        ,"cv2.threshold(grayImg, 128, 255, cv2.THRESH_TOZERO)"
+                        ,"cv2.threshold(grayImg, 128, 255, cv2.THRESH_TOZERO_INV)"
+                        ,"cv2.adaptiveThreshold(grayImg, 255, cv2.ADAPTIVE_THRESH_MEAN_C, cv2.THRESH_BINARY, 11, 2)"
+                        ,"cv2.threshold(grayImg, 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU,)"
+                        ,"Adapted from PirahanSiah Threshold Method I derivative demo"
+                        ,"Inspired by PirahanSiah Threshold Method II derivative demo"
+                    ]),
+]
+outputs_thresh = [
+gr.outputs.Image(type="numpy", label="Output Image")
+]
+def process_image(input_image, slider_val, radio_choice):
+    img = cv2.imread(input_image,0)
+    _, binaryImg = cv2.threshold(img, slider_val, 255, cv2.THRESH_BINARY)
+    if radio_choice == "cv2.threshold(grayImg, 128, 255, cv2.THRESH_BINARY)":
+            _, binaryImg=cv2.threshold(img, 128, 255, cv2.THRESH_BINARY)
+    elif radio_choice == "cv2.threshold(grayImg, 128, 255, cv2.THRESH_BINARY_INV)":
+            _, binaryImg=cv2.threshold(img, 128, 255, cv2.THRESH_BINARY_INV)
+    elif radio_choice == "cv2.threshold(grayImg, 128, 255, cv2.THRESH_TRUNC)":
+            _, binaryImg=cv2.threshold(img, 128, 255, cv2.THRESH_TRUNC)
+    elif radio_choice == "cv2.threshold(grayImg, 128, 255, cv2.THRESH_TOZERO)":
+            _, binaryImg=cv2.threshold(img, 128, 255, cv2.THRESH_TOZERO)
+    elif radio_choice == "cv2.threshold(grayImg, 128, 255, cv2.THRESH_TOZERO_INV)":
+            _, binaryImg=cv2.threshold(img, 128, 255, cv2.THRESH_TOZERO_INV)
+    elif radio_choice == "cv2.adaptiveThreshold(grayImg, 255, cv2.ADAPTIVE_THRESH_MEAN_C, cv2.THRESH_BINARY, 11, 2)":
+            binaryImg=cv2.adaptiveThreshold(img, 255, cv2.ADAPTIVE_THRESH_MEAN_C, cv2.THRESH_BINARY, 11, 2)
+    elif radio_choice == "cv2.threshold(grayImg, 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU,)":
+           _, binaryImg=cv2.threshold(img, 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU,)
+    elif radio_choice == "Adapted from PirahanSiah Threshold Method I derivative demo":
+           threshval=pirahansiah_threshold_method_find_threshold_values_1(img)
+           _, binaryImg = cv2.threshold(img, threshval, 255, cv2.THRESH_BINARY)
+    elif radio_choice == "Inspired by PirahanSiah Threshold Method II derivative demo":
+           threshval=pirahansiah_threshold_method_find_threshold_values_2(img)
+           _, binaryImg = cv2.threshold(img, threshval, 255, cv2.THRESH_BINARY)
+    return binaryImg
+def on_change(slider_val, radio_choice):
+    # Update output
+    outputs_thresh[0].update(process_image(
+        inputs_thresh[0].value,
+        slider_val,
+        radio_choice)
+    )
+threshold_methods = gr.Interface(
+    fn=process_image,
+    inputs=inputs_thresh,
+    outputs=outputs_thresh,
+    on_change=on_change,
+    examples=path,
+    title="Computer Vision and Deep Learning by Farshid PirahanSiah",
+    live=True
+    )
+# class Thresholding:
+#     def __init__(self, grayImg):
+#         self.grayImg = grayImg
+#     def manually_python(self):
+#         threshval = 128
+#         binaryImg = np.where(self.grayImg < threshval, self.grayImg, 0) if threshval < 128 else np.where(self.grayImg > threshval, self.grayImg, 0)
+#         return binaryImg
+#     def manually(self,threshval):
+#         binaryImg = np.zeros_like(self.grayImg)
+#         for i in range(self.grayImg.shape[0]): #height
+#             for j in range(self.grayImg.shape[1]): #width
+#                 if self.grayImg[i, j] < threshval:
+#                     binaryImg[i, j] = 0
+#                 else:
+#                     binaryImg[i, j] = 1
+#         return binaryImg
+#     def pirahansiah_threshold_method_find_threshold_values_2(self):
+#         #http://www.jatit.org/volumes/Vol95No21/1Vol95No21.pdf
+#         #https://pdfs.semanticscholar.org/05b2/d39fce4e8a99897e95f8c75416f65a5a0acc.pdf
+#         assert self.grayImg is not None, "file could not be read, check with os.path.exists()"
+#         #img = cv2.GaussianBlur(self.grayImg, (3, 3), 0)
+#         img = self.grayImg
+#         # Initialize an array to store the PSNR values for each threshold value
+#         psnr_values = np.zeros(256)
+#         psnr_max=0
+#         th=0
+#         # Iterate over all possible threshold values with a step size of 5
+#         for t in range(0, 256, 5):
+#             # Threshold the image using the current threshold value
+#             _, binary = cv2.threshold(img, t, 255, cv2.THRESH_BINARY)
+#             # Calculate the PSNR between the binary image and the original image
+#             psnr = cv2.PSNR(binary, img)
+#             # Store the PSNR value
+#             psnr_values[t] = psnr
+#             if (psnr_max<psnr):
+#                 psnr_max=psnr
+#                 th=t
+#         # Calculate the mean PSNR value
+#         mean_psnr = np.mean(psnr_values)
+#         th=int(th/mean_psnr)
+#         # Find the threshold values that satisfy the condition
+#         thresh = th #np.argwhere((mean_psnr / k1 < psnr_values) & (psnr_values < mean_psnr / k2)).flatten()
+#         return thresh
+#     def pirahansiah_threshold_method_find_threshold_values_1(self):
+#         #https://www.jatit.org/volumes/Vol57No2/4Vol57No2.pdf
+#         assert self.grayImg is not None, "file could not be read, check with os.path.exists()"
+#         gray = cv2.GaussianBlur(self.grayImg, (3, 3), 0)
+#         max1=0
+#         max2=0
+#         # Iterate over all possible threshold values
+#         for t in range(0, 256, 10):
+#             # Threshold the image using the current threshold value
+#             _, binary = cv2.threshold(gray, t, 255, cv2.THRESH_BINARY)
+#             # Find the contours in the binary image
+#             contours, hierarchy = cv2.findContours(binary, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
+#             if max1<=len(contours):
+#                 max1=len(contours)
+#                 max2=t
+#         threshold_values =max2
+#         return threshold_values
+#     def opencv_th(self):
+#         font = cv2.FONT_HERSHEY_SIMPLEX
+#         fontScale = 2
+#         color = (0, 0, 0)
+#         colorInv = (255, 255, 255)
+#         thickness = 2
+#         # Set the position of the text
+#         textX = 25
+#         textY = 45
+#         textSize, _ = cv2.getTextSize("Otsu Method   ", font, fontScale, thickness)
+#         # Draw a white rectangle behind the text
+#         # Apply different thresholding methods
+#         _, binaryImg = cv2.threshold(self.grayImg, 128, 255, cv2.THRESH_BINARY)
+#         cv2.rectangle(binaryImg, (textX, textY - textSize[1]), (textX + textSize[0], textY), (255, 255, 255), -1)
+#         cv2.putText(binaryImg, 'Binary', (textX, textY), font, fontScale, color, thickness)
+#         _, binaryInvImg = cv2.threshold(self.grayImg, 128, 255, cv2.THRESH_BINARY_INV)
+#         cv2.rectangle(binaryInvImg, (textX, textY - textSize[1]), (textX + textSize[0], textY), (255, 255, 255), -1)
+#         cv2.putText(binaryInvImg, 'Binary Inv', (textX, textY), font, fontScale, color, thickness)
+#         _, truncImg = cv2.threshold(self.grayImg, 128, 255, cv2.THRESH_TRUNC)
+#         cv2.rectangle(truncImg, (textX, textY - textSize[1]), (textX + textSize[0], textY), (255, 255, 255), -1)
+#         cv2.putText(truncImg, 'Trunc', (textX, textY), font, fontScale, color, thickness)
+#         _, toZeroImg = cv2.threshold(self.grayImg, 128, 255, cv2.THRESH_TOZERO)
+#         cv2.rectangle(toZeroImg, (textX, textY - textSize[1]), (textX + textSize[0], textY), (255, 255, 255), -1)
+#         cv2.putText(toZeroImg, 'To Zero', (textX, textY), font, fontScale, color, thickness)
+#         _, toZeroInvImg = cv2.threshold(self.grayImg, 128, 255, cv2.THRESH_TOZERO_INV)
+#         cv2.rectangle(toZeroInvImg, (textX, textY - textSize[1]), (textX + textSize[0], textY), (255, 255, 255), -1)
+#         cv2.putText(toZeroInvImg, 'To Zero Inv', (textX, textY), font, fontScale, color, thickness)
+#         adaptiveImg = cv2.adaptiveThreshold(self.grayImg, 255, cv2.ADAPTIVE_THRESH_MEAN_C, cv2.THRESH_BINARY, 11, 2)
+#         cv2.rectangle(adaptiveImg, (textX, textY - textSize[1]), (textX + textSize[0], textY), (255, 255, 255), -1)
+#         cv2.putText(adaptiveImg, 'Adaptive', (textX, textY), font, fontScale, color, thickness)
+#         otsu_threshold, image_result = cv2.threshold(self.grayImg, 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU,)
+#         cv2.rectangle(image_result, (textX, textY - textSize[1]), (textX + textSize[0], textY), (255, 255, 255), -1)
+#         cv2.putText(image_result, 'Otsu Threshold Method', (textX, textY), font, fontScale, color, thickness)
+#         threshval=self.pirahansiah_threshold_method_find_threshold_values_1()
+#         th_img = th.manually(threshval)
+#         binaryImg = th_img * 255
+#         cv2.rectangle(binaryImg, (textX, textY - textSize[1]), (textX + textSize[0], textY), (255, 255, 255), -1)
+#         cv2.putText(binaryImg, 'PirahanSiah Threshold ', (textX, textY), font, fontScale, color, thickness)
+#         cv2.rectangle(self.grayImg, (textX, textY - textSize[1]), (textX + textSize[0], textY), (255, 255, 255), -1)
+#         cv2.putText(self.grayImg, 'Original', (textX, textY), font, fontScale, color, thickness)
+#         # Concatenate the images into a grid with 3 rows and 3 columns
+#         row1 = np.concatenate((self.grayImg, binaryImg, binaryInvImg), axis=1)
+#         row2 = np.concatenate((truncImg, toZeroImg, toZeroInvImg), axis=1)
+#         row3 = np.concatenate((adaptiveImg, image_result, binaryImg), axis=1) # np.zeros_like(adaptiveImg)
+#         concatenatedImg = np.concatenate((row1, row2, row3), axis=0)
+#         # Resize the concatenated image to fit the screen resolution
+#         screenRes = (1920-200, 1080-200)
+#         scaleWidth = screenRes[0] / concatenatedImg.shape[1]
+#         scaleHeight = screenRes[1] / concatenatedImg.shape[0]
+#         scale = min(scaleWidth, scaleHeight)
+#         windowWidth = int(concatenatedImg.shape[1] * scale)
+#         windowHeight = int(concatenatedImg.shape[0] * scale)
+#         resizedImg = cv2.resize(concatenatedImg, (windowWidth, windowHeight))
+#         # Display the resized image
+#         cv2.imshow('Thresholded Images', resizedImg)
+#         cv2.waitKey(0)
+#         cv2.destroyAllWindows()
+# if __name__ == "__main__":
+#     img = cv2.imread("opencv.png")
+#     gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+#     th = Thresholding(gray)
+#     th.opencv_th()
+    #threshval = 128
+    # read an image
+    # convert it to grayscale
+    #threshval=th.pirahansiah_threshold_method_find_threshold_values_1()
+    # threshval=th.pirahansiah_threshold_method_find_threshold_values_2()
+    # th_img = th.manually(threshval)
+    # binaryImg = th_img * 255
+    # cv2.imshow('image', binaryImg)
+    # cv2.waitKey(100)
+'''
+cv::Mat binaryImg = threshval < 128 ? (grayImg < threshval) : (grayImg > threshval);
+#thresholding #opencv #python
+The PirahanSiah’s method for thresholding, described in the paper, uses a gray-scale histogram,
+thresholding range, and the Peak Signal-to-Noise Ratio (PSNR) to segment images and find the best
+threshold values to binarize the image. They argue that thresholding is an important problem in
+pattern recognition and use the PSNR quality measure to assess the similarities between the
+original and binarized image. They calculate PSNRs for every threshold value and use the
+difference between the PSNR of the previous threshold image and the new one to select the
+threshold value. They also describe a multi-threshold algorithm that applies multiple
+threshold values and computes the total number of blobs or objects in an image for each threshold.
+The peak threshold values are those with the highest total number of blobs compared to their threshold neighbors.
+In addition, their method uses thresholding on images suitable for OCR systems, LPR systems, etc.
+The proposed adaptive threshold method, based on the Peak Signal-to-Noise Ratio (PSNR),
+has the potential to be applied in all domains, such as LPR and OCR. The proposed algorithm
+achieves competitive results in four databases, including Malaysian vehicle, standard,
+printed and handwritten images. The objective of this research was to develop a new single
+adaptive thresholding algorithm that works for a wide range of pattern recognition applications.
+The proposed method has been implemented in four different types of applications and compared
+with other methods. The results show that the proposed algorithm achieves the objective because
+it has obtained reasonable results in all four areas/domains.
+https://www.jatit.org/volumes/Vol57No2/4Vol57No2.pdf
+http://www.jatit.org/volumes/Vol95No21/1Vol95No21.pdf
+https://pdfs.semanticscholar.org/05b2/d39fce4e8a99897e95f8c75416f65a5a0acc.pdf
+'''