Spaces:

VOJ
/

voj

Sleeping

App Files Files Community

amroa committed on Jun 2, 2024

Commit

8c4ff63

1 Parent(s): c751d20

themes

Browse files

Files changed (4) hide show

__pycache__/app.cpython-311.pyc +0 -0
__pycache__/classpred.cpython-311.pyc +0 -0
app.py +66 -8
classpred.py +1 -1

__pycache__/app.cpython-311.pyc CHANGED Viewed

Binary files a/__pycache__/app.cpython-311.pyc and b/__pycache__/app.cpython-311.pyc differ

__pycache__/classpred.cpython-311.pyc CHANGED Viewed

Binary files a/__pycache__/classpred.cpython-311.pyc and b/__pycache__/classpred.cpython-311.pyc differ

app.py CHANGED Viewed

@@ -10,6 +10,11 @@ import torch
 import librosa
 import noisereduce as nr
 import timm
 import pandas as pd
 from classpred import predict_class
 import torch.nn.functional as F
@@ -134,13 +139,18 @@ def preprocess_for_inference(audio_arr, sr):
         results = []
         for idx, scores in zip(topk_indices, topk_values):
             species_name = species_id_to_name[idx.item()]
-            probability = scores.item()
             results.append([species_name, probability])
     return results
 DESCRIPTION = """
-Bird audio classification using SOTA Voice of Jungle Technology.
 """
@@ -153,11 +163,59 @@ css = """
     height: 100%;
 }
 .column-container {
-    height: 100%;
-}
 """
-with gr.Blocks(css = css) as demo:
-    gr.Markdown("# Bird Species Audio Classification")
     gr.Markdown(DESCRIPTION)
     with gr.Row():
@@ -169,8 +227,8 @@ with gr.Blocks(css = css) as demo:
     with gr.Row():
-        raw_class_output = gr.Dataframe(headers=["class", "score"], row_count=10, label="Class Prediction")
-        species_output = gr.Dataframe(headers=["class", "score"], row_count=10, label="Species Prediction")
     with gr.Row():
         waveform_output = gr.Plot(label="Waveform")

 import librosa
 import noisereduce as nr
 import timm
+from typing import Iterable
+import gradio as gr
+from gradio.themes.base import Base
+from gradio.themes.utils import colors, fonts, sizes
+import time
 import pandas as pd
 from classpred import predict_class
 import torch.nn.functional as F
         results = []
         for idx, scores in zip(topk_indices, topk_values):
             species_name = species_id_to_name[idx.item()]
+            probability = scores.item()*100
             results.append([species_name, probability])
     return results
 DESCRIPTION = """
+# Bird audio classification using SOTA Voice of Jungle Technology.  \n
+# Introduction
+It is estimated that 50% of the global economy is threatened by biodiversity loss. Because birds are a top indicator of a region's biodiversity, considerable effort has gone into estimating bird biodiversity. One such effort is
+identifying the bird species present in a region through bird species audio classification.
+The left table shows the predicted type of sound (class), while the right table shows the predicted bird species. If the class prediction does not include a bird, the species prediction is correspondingly unreliable.
 """
     height: 100%;
 }
 .column-container {
+    height: 100%;
+}
 """
+class Seafoam(Base):  # Custom Gradio theme: a Base subclass that only overrides the constructor defaults.
+    def __init__(  # Accepts the theme settings below and forwards each one unchanged to Base.__init__.
+        self,
+        *,  # every setting after this marker is keyword-only
+        primary_hue: colors.Color | str = colors.emerald,  # default primary hue: emerald
+        secondary_hue: colors.Color | str = colors.blue,  # default secondary hue: blue
+        neutral_hue: colors.Color | str = colors.gray,  # default neutral hue: gray
+        spacing_size: sizes.Size | str = sizes.spacing_md,  # default spacing preset: spacing_md
+        radius_size: sizes.Size | str = sizes.radius_md,  # default radius preset: radius_md
+        text_size: sizes.Size | str = sizes.text_lg,  # default text preset: text_lg
+        font: fonts.Font
+        | str
+        | Iterable[fonts.Font | str] = (  # one font, one name, or an iterable mixing both
+            fonts.GoogleFont("Quicksand"),  # first entry: the "Quicksand" Google font
+            "ui-sans-serif",  # generic family names listed after it (presumably fallbacks)
+            "sans-serif",
+        ),
+        font_mono: fonts.Font
+        | str
+        | Iterable[fonts.Font | str] = (  # same accepted shapes as `font`
+            fonts.GoogleFont("IBM Plex Mono"),  # first entry: the "IBM Plex Mono" Google font
+            "ui-monospace",  # generic family names listed after it (presumably fallbacks)
+            "monospace",
+        ),
+    ):
+        super().__init__(  # no extra logic: every argument is passed through by keyword
+            primary_hue=primary_hue,
+            secondary_hue=secondary_hue,
+            neutral_hue=neutral_hue,
+            spacing_size=spacing_size,
+            radius_size=radius_size,
+            text_size=text_size,
+            font=font,
+            font_mono=font_mono,
+        )
+seafoam = Seafoam()
+## logo: <img src="https://i.ibb.co/vcG9kr0/vojlogo.jpg" alt="vojlogo" border="0">
+## cactus: <img src="https://i.ibb.co/3sW2mJN/spur.jpg" alt="spur" border="0">
+with gr.Blocks(theme=seafoam, css = css) as demo:
+    #img_src = '<img src="https://i.ibb.co/3sW2mJN/spur.jpg" alt="spur" border="0" width = "100%">'
+    #gr.Markdown(f"{img_src}")
+    #gr.Markdown(f"# Team Voice of Jungle {img_src}  more text")
     gr.Markdown(DESCRIPTION)
     with gr.Row():
     with gr.Row():
+        raw_class_output = gr.Dataframe(headers=["Class", "Score [%]"], row_count=10, label="Class Prediction")
+        species_output = gr.Dataframe(headers=["Class", "Score [%]"], row_count=10, label="Species Prediction")
     with gr.Row():
         waveform_output = gr.Plot(label="Waveform")

classpred.py CHANGED Viewed

@@ -39,6 +39,6 @@ def predict_class(x, sr, start, end):
         logits = MODEL(x.view(1, 1, 1024, 128)).squeeze(0)
     topk_probs, topk_classes = logits.sigmoid().topk(10)
-    preds = [[AUDIOSET_LABELS[cls], prob.item()] for cls, prob in zip(topk_classes, topk_probs)]
     return preds

         logits = MODEL(x.view(1, 1, 1024, 128)).squeeze(0)
     topk_probs, topk_classes = logits.sigmoid().topk(10)
+    preds = [[AUDIOSET_LABELS[cls], prob.item()*100] for cls, prob in zip(topk_classes, topk_probs)]
     return preds