|
from threading import Lock |
|
|
|
import fluidsynth |
|
import numpy as np |
|
|
|
|
|
class MidiSynthesizer:
    """Render MIDI "opus" event lists to 16-bit stereo PCM using FluidSynth.

    A small pool of ``fluidsynth.Synth`` objects is kept so that concurrent
    calls to :meth:`synthesis` each work on their own synthesizer. Every pool
    entry is a mutable ``[synth, soundfont_id, in_use]`` list.
    """

    def __init__(self, soundfont_path, sample_rate=44100):
        """Create the synthesizer pool with one idle device.

        Args:
            soundfont_path: Path handed to ``Synth.sfload`` for every device.
            sample_rate: Output sample rate; also used to convert MIDI ticks
                to sample counts.
        """
        self.soundfont_path = soundfont_path
        self.sample_rate = sample_rate
        self.devices = [self._new_device(in_use=False)]
        self.devices_lock = Lock()

    def _new_device(self, in_use):
        """Build a ``[synth, soundfont_id, in_use]`` pool entry."""
        synth = fluidsynth.Synth(samplerate=float(self.sample_rate))
        sfid = synth.sfload(self.soundfont_path)
        return [synth, sfid, in_use]

    def get_fluidsynth(self):
        """Reserve an idle device, creating a new one if all are busy.

        Returns:
            The reserved ``[synth, soundfont_id, in_use]`` entry with
            ``in_use`` set to ``True``. Hand it back with
            :meth:`release_fluidsynth`.
        """
        with self.devices_lock:
            for device in self.devices:
                if not device[2]:
                    device[2] = True
                    return device
            device = self._new_device(in_use=True)
            self.devices.append(device)
            return device

    def release_fluidsynth(self, device):
        """Reset *device* and mark it idle again.

        Args:
            device: An entry previously returned by :meth:`get_fluidsynth`.
        """
        synth = device[0]
        synth.system_reset()
        # Render and discard five seconds of audio so that whatever is still
        # sounding after the reset does not leak into the next rendering.
        synth.get_samples(self.sample_rate * 5)
        # Flip the flag last: the device is only offered again once clean.
        device[2] = False

    def synthesis(self, midi_opus):
        """Render *midi_opus* to peak-normalised 16-bit stereo audio.

        Args:
            midi_opus: ``[ticks_per_beat, track, track, ...]`` where every
                track is a sequence of events shaped
                ``[name, delta_ticks, *data]``.

        Returns:
            An ``int16`` array of shape ``(n_samples, 2)``; ``(0, 2)`` when
            nothing was rendered.
        """
        ticks_per_beat = midi_opus[0]
        events = self._merge_tracks(midi_opus[1:])
        device = self.get_fluidsynth()
        try:
            chunks = self._render(device[0], device[1], events, ticks_per_beat)
        finally:
            # Always hand the device back; otherwise one malformed event
            # would leave it marked busy forever and the pool would grow on
            # every subsequent call.
            self.release_fluidsynth(device)
        return self._normalize(chunks)

    @staticmethod
    def _merge_tracks(tracks):
        """Flatten tracks into one list ordered by absolute tick.

        Delta times (``event[1]``) are replaced by the running total within
        each track. The sort is stable, so events sharing a tick keep their
        track order and their order inside the track.
        """
        merged = []
        for track in tracks:
            abs_tick = 0
            for event in track:
                abs_tick += event[1]
                merged.append([event[0], abs_tick, *event[2:]])
        merged.sort(key=lambda item: item[1])
        return merged

    def _render(self, synth, sfid, events, ticks_per_beat):
        """Feed *events* to *synth* and return the rendered audio chunks.

        Returns:
            A list of ``(n, 2)`` sample arrays, one per gap between events.
        """
        sample_rate = self.sample_rate
        # Microseconds per beat; 60 / 120 seconds, i.e. 120 beats per minute,
        # until a "set_tempo" event says otherwise.
        tempo = int((60 / 120) * 10 ** 6)
        # Channel 9 is bound to bank 128, every other channel to bank 0
        # (presumably the percussion bank of the soundfont - confirm).
        for channel in range(16):
            synth.program_select(channel, sfid, 128 if channel == 9 else 0, 0)

        chunks = []
        last_tick = 0
        for event in events:
            name, tick = event[0], event[1]
            # Convert both absolute positions with the current tempo and
            # subtract, rather than converting the delta, so that rounding
            # errors do not accumulate from event to event.
            n_samples = int(((tick / ticks_per_beat) * tempo / (10 ** 6)) * sample_rate)
            n_samples -= int(((last_tick / ticks_per_beat) * tempo / (10 ** 6)) * sample_rate)
            last_tick = tick
            if n_samples > 0:
                # Collected here and joined once at the end; concatenating
                # inside the loop re-copies all previous audio every time.
                chunks.append(synth.get_samples(n_samples).reshape(n_samples, 2))

            if name == "set_tempo":
                tempo = event[2]
            elif name == "patch_change":
                channel, program = event[2:4]
                synth.program_select(channel, sfid, 128 if channel == 9 else 0, program)
            elif name == "control_change":
                channel, controller, value = event[2:5]
                synth.cc(channel, controller, value)
            elif name == "note_on" and event[4] > 0:
                # event[4] is the velocity (event[3] is the pitch), so a
                # note on pitch 0 is still a real note.
                channel, pitch, velocity = event[2:5]
                synth.noteon(channel, pitch, velocity)
            elif name in ("note_off", "note_on"):
                # "note_on" only reaches this branch with velocity 0, which
                # is treated as a note-off.
                channel, pitch = event[2:4]
                synth.noteoff(channel, pitch)
        return chunks

    @staticmethod
    def _normalize(chunks):
        """Join *chunks* and scale the peak to the int16 maximum."""
        if not chunks:
            return np.empty((0, 2), dtype=np.int16)
        pcm = np.concatenate(chunks)
        # Measure the peak in int32: abs() of int16 -32768 wraps around to
        # -32768 and would yield a wrong (even negative) peak.
        peak = np.abs(pcm.astype(np.int32)).max()
        if peak != 0:
            pcm = (pcm / peak) * np.iinfo(np.int16).max
        return pcm.astype(np.int16)
|
|