File size: 3,017 Bytes
1fd2f8b
 
1ea42dc
 
 
256bea9
239bed9
 
 
 
 
 
 
bb14020
1ea42dc
239bed9
bb14020
 
 
 
 
1fd2f8b
 
bb14020
 
 
1ea42dc
239bed9
256bea9
d25994f
239bed9
b5d92aa
239bed9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
256bea9
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
from threading import Lock

import fluidsynth
import numpy as np


class MidiSynthesizer:
    """Render MIDI event lists to stereo int16 audio with FluidSynth.

    The instance keeps a pool of synth "devices" so that concurrent calls to
    :meth:`synthesis` never share a synth.  Each device is a mutable list
    ``[synth, soundfont_id, in_use]``; ``devices_lock`` guards the pool and
    the ``in_use`` flags.
    """

    def __init__(self, soundfont_path, sample_rate=44100):
        """Create the synthesizer and load one idle device.

        Args:
            soundfont_path: Path passed to ``Synth.sfload`` for every device.
            sample_rate: Output sample rate in Hz.
        """
        self.soundfont_path = soundfont_path
        self.sample_rate = sample_rate
        self.devices = [self._create_device(in_use=False)]
        self.devices_lock = Lock()

    def _create_device(self, in_use):
        """Build a new ``[synth, soundfont_id, in_use]`` pool entry."""
        fl = fluidsynth.Synth(samplerate=float(self.sample_rate))
        sfid = fl.sfload(self.soundfont_path)
        return [fl, sfid, in_use]

    def _ticks_to_samples(self, ticks, ticks_per_beat, tempo):
        """Convert an absolute tick position to a sample index.

        ``tempo`` is in microseconds per beat.
        """
        return int(((ticks / ticks_per_beat) * tempo / (10 ** 6)) * self.sample_rate)

    def get_fluidsynth(self):
        """Reserve a device, creating a new one if every device is busy.

        Returns:
            The reserved ``[synth, soundfont_id, in_use]`` list with
            ``in_use`` set to ``True``.  Hand it back with
            :meth:`release_fluidsynth`.
        """
        with self.devices_lock:
            for device in self.devices:
                if not device[2]:
                    device[2] = True
                    return device
            device = self._create_device(in_use=True)
            self.devices.append(device)
            return device

    def release_fluidsynth(self, device):
        """Reset a device and mark it as free for reuse.

        Args:
            device: A pool entry previously returned by
                :meth:`get_fluidsynth`.
        """
        fl = device[0]
        fl.system_reset()
        # Render and discard five seconds of audio so nothing from this use
        # bleeds into the next one (wait for silence).
        fl.get_samples(self.sample_rate * 5)
        # Only the flag flip needs the lock; rendering above stays outside it
        # so other threads are not blocked while the device drains.
        with self.devices_lock:
            device[2] = False

    def synthesis(self, midi_opus):
        """Render an opus-style MIDI structure to audio.

        Args:
            midi_opus: ``[ticks_per_beat, track, track, ...]`` where each
                track is a list of events ``[name, delta_ticks, *params]``.
                Handled events are ``set_tempo``, ``patch_change``,
                ``control_change``, ``note_on`` and ``note_off``; for note
                events the parameters are read as channel, pitch, velocity.

        Returns:
            An ``int16`` array of shape ``(n_samples, 2)``, peak-normalised
            to the int16 range (left untouched when empty or silent).
        """
        ticks_per_beat = midi_opus[0]

        # Merge all tracks into one list with absolute tick timestamps.
        event_list = []
        for track in midi_opus[1:]:
            abs_t = 0
            for event in track:
                abs_t += event[1]
                event_list.append([event[0], abs_t, *event[2:]])
        # list.sort is stable, so simultaneous events keep their track order.
        event_list.sort(key=lambda e: e[1])

        tempo = int((60 / 120) * 10 ** 6)  # default 120 bpm
        chunks = []
        device = self.get_fluidsynth()
        try:
            fl, sfid = device[:-1]
            last_t = 0
            for c in range(16):
                # Channel 9 selects bank 128, all other channels bank 0.
                fl.program_select(c, sfid, 128 if c == 9 else 0, 0)
            for event in event_list:
                name = event[0]
                # Render the audio between the previous event and this one at
                # the tempo that was in effect during that interval.
                sample_len = (
                    self._ticks_to_samples(event[1], ticks_per_beat, tempo)
                    - self._ticks_to_samples(last_t, ticks_per_beat, tempo)
                )
                last_t = event[1]
                if sample_len > 0:
                    chunks.append(fl.get_samples(sample_len).reshape(sample_len, 2))
                if name == "set_tempo":
                    tempo = event[2]
                elif name == "patch_change":
                    c, p = event[2:4]
                    fl.program_select(c, sfid, 128 if c == 9 else 0, p)
                elif name == "control_change":
                    c, cc, v = event[2:5]
                    fl.cc(c, cc, v)
                elif name == "note_on" and event[4] > 0:
                    # event[4] is the velocity; event[3] is the pitch, and
                    # pitch 0 is a legitimate note.
                    c, p, v = event[2:5]
                    fl.noteon(c, p, v)
                elif name == "note_off" or name == "note_on":
                    # A note_on that reaches here has velocity 0, which by
                    # MIDI convention means note-off.
                    c, p = event[2:4]
                    fl.noteoff(c, p)
        finally:
            # Always return the device to the pool, even if rendering failed,
            # so it is not left marked busy forever.
            self.release_fluidsynth(device)

        # One concatenation at the end instead of growing the buffer per event.
        if chunks:
            ss = np.concatenate(chunks)
        else:
            ss = np.empty((0, 2), dtype=np.int16)

        if ss.shape[0] > 0:
            # Take the peak as Python ints: np.abs on int16 overflows for
            # -32768 and would under-report the peak.
            max_val = max(int(ss.max()), -int(ss.min()))
            if max_val != 0:
                ss = (ss / max_val) * np.iinfo(np.int16).max
        ss = ss.astype(np.int16)
        return ss