File size: 1,072 Bytes
bfbfae6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
import numpy as np
import matplotlib.pyplot as plt

import IPython.display as ipd

# Identifier of the sequence under inspection; both input paths derive from it.
seq_id = "gMH_sFM_cAll_d24_mMH5_ch20"
music_file = "data/aistpp_20hz/{}.mp3".format(seq_id)
ddc_file = "data/aistpp_ddcpca/{}.ddcpca.npy".format(seq_id)

# Features stored on disk as a NumPy array file.
ddc_features = np.load(ddc_file)

# Audio player object for the track (an .mp3 file). As a bare expression it
# is only rendered when it is the final expression of an interactive cell.
ipd.Audio(music_file)

# madmom is imported from the project's `feature_extraction` package rather
# than as a top-level package.
import feature_extraction.madmom as madmom
# MFCC is only referenced by a commented-out line further down in this script.
from feature_extraction.madmom.audio.cepstrogram import MFCC
# Instantiate the RNN downbeat processor with its default settings, then run
# it on the music file; `fps=20` is passed at call time.
# NOTE(review): presumably fps=20 is meant to match the "20hz" data directory
# and the frame rate of `ddc_features` — confirm.
proc_dwn = madmom.features.RNNDownBeatProcessor()
beats = proc_dwn(music_file, fps=20)

# IPython magic: render matplotlib figures inline in the notebook output.
%matplotlib inline
# Matrix view of the first 200 rows of `beats`, transposed so those rows run
# along the horizontal axis (rows are presumably time frames — confirm).
plt.matshow(beats[:200].T)

# Bare expressions for interactive inspection of the array shapes; in an
# IPython cell only the last expression's value is echoed by default.
ddc_features.shape
beats.shape

# Same matrix view for the first 200 rows of the DDC features.
plt.matshow(ddc_features[:200].T)

# IPython magic without an argument: switch to the default (non-inline)
# matplotlib GUI backend for the line plots below.
%matplotlib
# Overlay column 0 of each array over the first 100 rows for visual comparison.
plt.plot(ddc_features[:100,0])
plt.plot(beats[:100,0])


# Frame rate (frames per second) requested for the spectrogram below.
tgt_fps = 20
# The filterbank class itself (not an instance) is handed to Spectrogram.
filtbank = madmom.audio.filters.MelFilterbank
# NOTE(review): upstream madmom applies filterbanks through
# FilteredSpectrogram; confirm that Spectrogram in this copy of madmom
# actually honours the `filterbank` keyword instead of ignoring it.
spec = madmom.audio.spectrogram.Spectrogram(
    music_file, fps=tgt_fps, filterbank=filtbank, num_channels=1
)
# Alternative features, currently disabled:
# mfccs = MFCC(spec, filterbank=filtbank, num_bands=5)
# chroma = madmom.audio.chroma.PitchClassProfile(spec, num_classes=6, num_channels=1)
# Spectral-flux onset feature computed from the spectrogram
# (variable name kept as-is, sic, so existing references keep working).
sectralflux = madmom.features.onsets.spectral_flux(spec)

# `mfccs` exists only when the MFCC line above is re-enabled. Evaluating
# `mfccs.shape` unconditionally raised NameError and aborted the script
# before the spectral-flux shape was inspected, so it is disabled with it.
# mfccs.shape
sectralflux.shape