Spaces:

mostafaashahin
/

Phone-aid

Sleeping

App Files Files Community

Mostafa Shahin committed on Apr 2

Commit

1bd17d3

•

1 Parent(s): 6403fc5

plot waveform

Browse files

Files changed (2) hide show

app.py +18 -10
phoneme_vocab.json +1 -1

app.py CHANGED Viewed

@@ -98,25 +98,33 @@ def create_spectrogram_with_att(wav_file, att_contour, att ):
     # Calculate the spectrogram
     f, t, Sxx = spectrogram(data, fs=sampling_rate)
-    fig, ax = plt.subplots(figsize=(10, 5))
     # Plot the spectrogram
-    ax.pcolormesh(t, f, 10 * np.log10(Sxx), shading='gouraud')  # Use grayscale colormap
-    ax.set_ylabel('Frequency (Hz)')
-    ax.set_xlabel('Time (s)')
-    ax.set_title(f'Spectrogram with {att} Contour')
-    ax.set_ylim(0, 8000)  # Adjust the frequency range if necessary
-    ax_att = ax.twinx()
     # Plot the att contour
     x_points = att_contour.shape[0]
-    time_att = np.arange(0,  x_points * 0.02, 0.02)[:x_points]
     ax_att.plot(time_att, att_contour, color='blue', label=f'{att} Contour')
     ax_att.set_ylim(0,1)
     ax_att.legend()
-    return fig
 def plot_contour(audio_file, att):
     indx_n = engine.processor.tokenizer.convert_tokens_to_ids([f'n_{att}'])[0]

     # Calculate the spectrogram
     f, t, Sxx = spectrogram(data, fs=sampling_rate)
+    fig, axs = plt.subplots(2, 1, figsize=(10, 10), sharex=True)
     # Plot the spectrogram
+    axs[0].pcolormesh(t, f, 10 * np.log10(Sxx), shading='gouraud')  # Use grayscale colormap
+    #plt.colorbar(label='Intensity (dB)')
+    axs[0].set_ylabel('Frequency (Hz)')
+    axs[0].set_xlabel('Time (s)')
+    axs[0].set_title(f'Spectrogram with {att} Contour')
+    axs[0].set_ylim(0, 8000)  # Adjust the frequency range if necessary
+    ax_att = axs[0].twinx()
     # Plot the att contour
     x_points = att_contour.shape[0]
+    time_att = np.arange(0,  x_points * 0.02, 0.02)[:x_points]  # Assuming pitch_contour is sampled every 20 ms
     ax_att.plot(time_att, att_contour, color='blue', label=f'{att} Contour')
     ax_att.set_ylim(0,1)
     ax_att.legend()
+    # Plot the waveform
+    time = np.arange(0, len(data)) / sampling_rate
+    axs[1].plot(time, data, color='blue')
+    axs[1].set_ylabel('Amplitude')
+    axs[1].set_xlabel('Time (s)')
+    axs[1].set_title('Waveform')
+    #plt.show()
+    return fig
 def plot_contour(audio_file, att):
     indx_n = engine.processor.tokenizer.convert_tokens_to_ids([f'n_{att}'])[0]

phoneme_vocab.json CHANGED Viewed

@@ -1 +1 @@

- {"<pad>": 0, "aa": 1, "ae": 2, "ah": 3, "ao": 4, "aw": 5, "ay": 6, "eh": 7, "er": 8, "ey": 9, "ih": 10, "iy": 11, "ow": 12, "oy": 13, "uh": 14, "uw": 15, "b": 16, "ch": 17, "d": 18, "dh": 19, "f": 20, "g": 21, "hh": 22, "jh": 23, "k": 24, "l": 25, "m": 26, "n": 27, "nd": 28, "ng": 29, "p": 30, "r": 31, "s": 32, "sh": 33, "sil": 34, "t": 35, "th": 36, "v": 37, "w": 38, "y": 39, "z": 40, "zh": 41}

+ {"<pad>": 0, "\u0251": 1, "\u00e6": 2, "\u028c": 3, "\u0254": 4, "a\u028a": 5, "a\u026a": 6, "\u025b": 7, "\u025d": 8, "e\u026a": 9, "\u026a": 10, "i": 11, "o\u028a": 12, "\u0254\u026a": 13, "\u028a": 14, "u": 15, "b": 16, "t\u0283": 17, "d": 18, "\u00f0": 19, "f": 20, "g": 21, "h": 22, "d\u0292": 23, "k": 24, "l": 25, "m": 26, "n": 27, "\u014b": 28, "p": 29, "\u0279": 30, "s": 31, "\u0283": 32, "t": 33, "\u03b8": 34, "v": 35, "w": 36, "j": 37, "z": 38, "\u0292": 39}