MIDNIGHT-AITTM / midi_synthesizer.py
skytnt's picture
speed up rendering audio
1fd2f8b
raw
history blame
2.98 kB
from threading import Lock
import fluidsynth
import numpy as np
class MidiSynthesizer:
    """Render MIDI event data to stereo 16-bit PCM audio with FluidSynth.

    Synth instances are kept in ``self.devices`` and reused between calls.
    Each entry is a three-item list ``[synth, soundfont_id, busy]``; a new
    entry is created whenever every existing one is busy.
    """

    # Tempo assumed until a "set_tempo" event is seen:
    # 120 bpm expressed in microseconds per beat.
    _DEFAULT_TEMPO = int((60 / 120) * 10 ** 6)

    def __init__(self, soundfont_path, sample_rate=44100):
        """Create the synthesizer and load one FluidSynth instance up front.

        Args:
            soundfont_path: Path of the soundfont passed to ``sfload``.
            sample_rate: Output sample rate in Hz.
        """
        self.soundfont_path = soundfont_path
        self.sample_rate = sample_rate
        fl = fluidsynth.Synth(samplerate=float(sample_rate))
        sfid = fl.sfload(soundfont_path)
        self.devices = [[fl, sfid, False]]
        self.file_lock = Lock()

    def get_fluidsynth(self):
        """Return an idle ``[synth, soundfont_id, busy]`` entry, marked busy.

        The scan for an idle entry and the creation of a new one both run
        under ``self.file_lock`` so that two threads can never claim the same
        synth instance.
        """
        with self.file_lock:
            for device in self.devices:
                if not device[2]:
                    device[2] = True
                    return device
            fl = fluidsynth.Synth(samplerate=float(self.sample_rate))
            sfid = fl.sfload(self.soundfont_path)
            device = [fl, sfid, True]
            self.devices.append(device)
            return device

    def release_fluidsynth(self, device):
        """Reset *device* and hand it back to the pool."""
        device[0].system_reset()
        device[0].get_samples(self.sample_rate*5)  # wait for silence
        device[2] = False

    def synthesis(self, midi_opus):
        """Render *midi_opus* and return the audio as an int16 array.

        Args:
            midi_opus: Sequence whose first item is the number of ticks per
                beat and whose remaining items are tracks. Each track is a
                sequence of events ``[name, delta_ticks, *args]``. Handled
                event names are ``set_tempo``, ``patch_change``,
                ``control_change``, ``note_on`` and ``note_off``; any other
                event only advances time.

        Returns:
            ``numpy.ndarray`` of shape ``(frames, 2)`` and dtype ``int16``,
            peak-normalised to the full int16 range unless the audio is
            silent. Audio is rendered only up to the last event.
        """
        ticks_per_beat = midi_opus[0]
        events = self._merge_tracks(midi_opus[1:])
        device = self.get_fluidsynth()
        try:
            chunks = self._render(device, events, ticks_per_beat)
        finally:
            # Always return the synth to the pool, even if an event was
            # malformed, so a failed render does not leak a busy device.
            self.release_fluidsynth(device)
        return self._normalize(chunks)

    @staticmethod
    def _merge_tracks(tracks):
        """Flatten *tracks* into one list of events with absolute tick times."""
        merged = []
        for track in tracks:
            abs_t = 0
            for event in track:
                abs_t += event[1]
                timed = list(event)
                timed[1] = abs_t
                merged.append(timed)
        # list.sort is stable, so events on the same tick keep their order.
        merged.sort(key=lambda e: e[1])
        return merged

    def _tick_to_sample(self, tick, ticks_per_beat, tempo):
        """Convert an absolute tick to a sample offset at the given tempo."""
        return int(((tick / ticks_per_beat) * tempo / (10 ** 6)) * self.sample_rate)

    def _render(self, device, events, ticks_per_beat):
        """Feed *events* to the synth and return the rendered audio chunks."""
        fl, sfid = device[:-1]
        tempo = self._DEFAULT_TEMPO
        last_t = 0
        chunks = []
        for c in range(16):
            # Channel 9 (the General MIDI percussion channel) uses bank 128.
            fl.program_select(c, sfid, 128 if c == 9 else 0, 0)
        for event in events:
            name = event[0]
            # Render the gap since the previous event using the tempo that
            # was in effect during that gap (tempo changes apply afterwards).
            sample_len = self._tick_to_sample(event[1], ticks_per_beat, tempo)
            sample_len -= self._tick_to_sample(last_t, ticks_per_beat, tempo)
            last_t = event[1]
            if sample_len > 0:
                chunks.append(fl.get_samples(sample_len).reshape(sample_len, 2))
            if name == "set_tempo":
                tempo = event[2]
            elif name == "patch_change":
                c, p = event[2:4]
                fl.program_select(c, sfid, 128 if c == 9 else 0, p)
            elif name == "control_change":
                c, cc, v = event[2:5]
                fl.cc(c, cc, v)
            elif name == "note_on":
                c, p, v = event[2:5]
                # Velocity is the fifth field; a note_on with velocity 0 is
                # a note_off by MIDI convention.
                if v > 0:
                    fl.noteon(c, p, v)
                else:
                    fl.noteoff(c, p)
            elif name == "note_off":
                c, p = event[2:4]
                fl.noteoff(c, p)
        return chunks

    @staticmethod
    def _normalize(chunks):
        """Join *chunks* and scale the peak to the int16 maximum."""
        if not chunks:
            return np.empty((0, 2), dtype=np.int16)
        # One concatenate at the end avoids re-copying the whole buffer for
        # every event.
        ss = np.concatenate(chunks)
        # Take the peak with Python ints: abs() of int16 -32768 overflows.
        peak = max(int(ss.max()), -int(ss.min()))
        if peak:
            full_scale = np.float32(np.iinfo(np.int16).max)
            ss = ss.astype(np.float32) / np.float32(peak) * full_scale
        return ss.astype(np.int16)