Spaces:

dennisvdang
/

Chorus-Detection

Sleeping

App Files Community

dennisvdang committed on Jun 15, 2024

Commit

083c84b

1 Parent(s): 2836474

Script fixes

Browse files

Files changed (2) hide show

app.py +14 -14
style.css +24 -0

app.py CHANGED Viewed

@@ -316,32 +316,31 @@ def smooth_predictions(data: np.ndarray) -> np.ndarray:
     return smoothed_data
 def make_predictions(model, processed_audio, audio_features, url, video_name):
     predictions = model.predict(processed_audio)[0]
-    binary_predictions = np.round(
-        predictions[:(len(audio_features.meter_grid) - 1)]).flatten()
     smoothed_predictions = smooth_predictions(binary_predictions)
-    meter_grid_times = librosa.frames_to_time(
-        audio_features.meter_grid, sr=audio_features.sr, hop_length=audio_features.hop_length)
-    chorus_start_times = [meter_grid_times[i] for i in range(len(
-        smoothed_predictions)) if smoothed_predictions[i] == 1 and (i == 0 or smoothed_predictions[i - 1] == 0)]
-    chorus_end_times = [meter_grid_times[i + 1] for i in range(len(
-        smoothed_predictions)) if smoothed_predictions[i] == 1 and (i == len(smoothed_predictions) - 1 or smoothed_predictions[i + 1] == 0)]
     st.write(f"**Video Title:** {video_name}")
     st.write(f"**Number of choruses identified:** {len(chorus_start_times)}")
     for start_time, end_time in zip(chorus_start_times, chorus_end_times):
         link = f"{url}&t={int(start_time)}s"
-        st.write(f"Chorus from {start_time:.2f}s to {end_time:.2f}s: [Link]({link})")
     if len(chorus_start_times) == 0:
         st.write("No choruses identified.")
     return smoothed_predictions
 def plot_meter_lines(ax: plt.Axes, meter_grid_times: np.ndarray) -> None:
     for time in meter_grid_times:
         ax.axvline(x=time, color='grey', linestyle='--',
@@ -393,15 +392,16 @@ def plot_predictions(audio_features, predictions):
 def main():
-    st.title("Chorus Detection")
     st.write("Upload a YouTube URL to find the chorus in the song.")
     url = st.text_input("YouTube URL")
     if st.button("Find Chorus"):
         if url:
-            with st.spinner('Extracting audio...'):
                 audio_file, video_title, temp_dir = extract_audio(url)
             if audio_file:
-                with st.spinner('Stripping silence...'):
                     strip_silence(audio_file)
                 with st.spinner('Processing audio...'):
                     processed_audio, audio_features = process_audio(audio_path=audio_file)
@@ -416,4 +416,4 @@ def main():
             st.error("Please enter a valid YouTube URL")
 if __name__ == "__main__":
-    main()

     return smoothed_data
+def format_time(seconds):
+    m, s = divmod(seconds, 60)
+    return f"{int(m)}:{s:05.2f}"
 def make_predictions(model, processed_audio, audio_features, url, video_name):
     predictions = model.predict(processed_audio)[0]
+    binary_predictions = np.round(predictions[:(len(audio_features.meter_grid) - 1)]).flatten()
     smoothed_predictions = smooth_predictions(binary_predictions)
+    meter_grid_times = librosa.frames_to_time(audio_features.meter_grid, sr=audio_features.sr, hop_length=audio_features.hop_length)
+    chorus_start_times = [meter_grid_times[i] for i in range(len(smoothed_predictions)) if smoothed_predictions[i] == 1 and (i == 0 or smoothed_predictions[i - 1] == 0)]
+    chorus_end_times = [meter_grid_times[i + 1] for i in range(len(smoothed_predictions)) if smoothed_predictions[i] == 1 and (i == len(smoothed_predictions) - 1 or smoothed_predictions[i + 1] == 0)]
     st.write(f"**Video Title:** {video_name}")
     st.write(f"**Number of choruses identified:** {len(chorus_start_times)}")
     for start_time, end_time in zip(chorus_start_times, chorus_end_times):
         link = f"{url}&t={int(start_time)}s"
+        st.write(f"Chorus from {format_time(start_time)} to {format_time(end_time)}: [{link}]({link})")
     if len(chorus_start_times) == 0:
         st.write("No choruses identified.")
     return smoothed_predictions
 def plot_meter_lines(ax: plt.Axes, meter_grid_times: np.ndarray) -> None:
     for time in meter_grid_times:
         ax.axvline(x=time, color='grey', linestyle='--',
 def main():
+    st.title("Chorus Finder")
+    st.write("This app uses a pre-trained convolutional recurrent neural network to predict chorus locations in music. To learn more about this project, visit [github.com/dennisvdang/chorus-detection](https://github.com/dennisvdang/chorus-detection).")
     st.write("Upload a YouTube URL to find the chorus in the song.")
     url = st.text_input("YouTube URL")
     if st.button("Find Chorus"):
         if url:
+            with st.spinner('Analyzing YouTube link...'):
                 audio_file, video_title, temp_dir = extract_audio(url)
             if audio_file:
+                with st.spinner('Trimming silence...'):
                     strip_silence(audio_file)
                 with st.spinner('Processing audio...'):
                     processed_audio, audio_features = process_audio(audio_path=audio_file)
             st.error("Please enter a valid YouTube URL")
 if __name__ == "__main__":
+    main()

style.css ADDED Viewed

	@@ -0,0 +1,24 @@

+body {
+    /* background-image: url('https://your-image-url.com/background.jpg'); */
+    background-size: cover;
+}
+.stButton>button {
+    background-color: #fcb900;
+    color: white;
+    border: none;
+    padding: 10px 24px;
+    text-align: center;
+    text-decoration: none;
+    display: inline-block;
+    font-size: 16px;
+    margin: 4px 2px;
+    transition-duration: 0.4s;
+    cursor: pointer;
+}
+.stButton>button:hover {
+    background-color: white;
+    color: black;
+    border: 2px solid #4CAF50;
+}