Advanced-MIDI-Renderer

Running

App Files Files Community

asigalov61 committed 18 days ago

Commit

04e14ea

verified ·

1 Parent(s): e169dd8

Upload 2 files

Browse files

Files changed (2) hide show

TMIDIX.py +106 -1
midi_to_colab_audio.py +102 -13

TMIDIX.py CHANGED Viewed

@@ -51,7 +51,7 @@ r'''############################################################################
 ###################################################################################
-__version__ = "25.8.27"
 print('=' * 70)
 print('TMIDIX Python module')
@@ -14433,6 +14433,111 @@ def replace_chords_in_escore_notes(escore_notes,
 ###################################################################################
 print('Module loaded!')
 print('=' * 70)
 print('Enjoy! :)')

 ###################################################################################
+__version__ = "25.8.29"
 print('=' * 70)
 print('TMIDIX Python module')
 ###################################################################################
class Cell:
    """One entry of the alignment table built by ``align_integer_lists``.

    Attributes are documented here rather than as attribute docstrings:
      cost     -- accumulated alignment cost of the best path ending here
      segments -- number of gap runs opened along that path
      gaps     -- total number of gap positions along that path
      prev_dir -- last step taken to reach the cell: 'diag', 'up', 'left',
                  or '' for the table origin
    """

    # One Cell is kept per table entry, so drop the per-instance __dict__.
    __slots__ = ('cost', 'segments', 'gaps', 'prev_dir')

    def __init__(self, cost, segments, gaps, prev_dir):
        self.cost = cost
        self.segments = segments
        self.gaps = gaps
        self.prev_dir = prev_dir

    def __repr__(self):
        return (f'Cell(cost={self.cost!r}, segments={self.segments!r}, '
                f'gaps={self.gaps!r}, prev_dir={self.prev_dir!r})')


def align_integer_lists(seq1, seq2):
    """Globally align two sequences of integers, padding gaps with ``None``.

    Pairing ``a`` with ``b`` costs ``abs(a - b)``; leaving a value unpaired
    (aligning it against a gap) costs ``abs(value)``. For every table cell
    the candidate with the lowest cost is kept; ties are broken by fewer gap
    segments, then fewer gap positions, then by the step order
    diag < up < left.

    Args:
        seq1: First sequence of integers (any iterable; it is copied).
        seq2: Second sequence of integers (any iterable; it is copied).

    Returns:
        A tuple ``(aligned1, aligned2, total_cost)`` where ``aligned1`` and
        ``aligned2`` are new lists of equal length holding the original
        values in order with ``None`` at gap positions, and ``total_cost``
        is the cost of the chosen alignment.
    """
    # Copy up front: callers never get their own list back, and inputs that
    # are tuples or other sequences without a .copy() method are accepted.
    seq1 = list(seq1)
    seq2 = list(seq2)
    n, m = len(seq1), len(seq2)

    # Degenerate cases: everything in the non-empty sequence faces a gap.
    if n == 0:
        return [None] * m, seq2, sum(abs(x) for x in seq2)
    if m == 0:
        return seq1, [None] * n, sum(abs(x) for x in seq1)

    priority = {'diag': 0, 'up': 1, 'left': 2}

    def rank(cell):
        # Ordering used to pick the best candidate for a table entry.
        return (cell.cost, cell.segments, cell.gaps, priority[cell.prev_dir])

    def gap_step(prev, direction, penalty):
        # A gap continues the current segment only when the previous step
        # went in the same direction; otherwise a new segment is opened.
        opened = 0 if prev.prev_dir == direction else 1
        return Cell(prev.cost + penalty,
                    prev.segments + opened,
                    prev.gaps + 1,
                    direction)

    # Every entry is assigned below, so no placeholder cells are needed.
    dp = [[None] * (m + 1) for _ in range(n + 1)]
    dp[0][0] = Cell(cost=0, segments=0, gaps=0, prev_dir='')

    # First column: seq1 prefix aligned entirely against gaps.
    for i in range(1, n + 1):
        dp[i][0] = gap_step(dp[i - 1][0], 'up', abs(seq1[i - 1]))

    # First row: seq2 prefix aligned entirely against gaps.
    for j in range(1, m + 1):
        dp[0][j] = gap_step(dp[0][j - 1], 'left', abs(seq2[j - 1]))

    for i in range(1, n + 1):
        a = seq1[i - 1]
        prev_row, row = dp[i - 1], dp[i]
        for j in range(1, m + 1):
            b = seq2[j - 1]
            origin = prev_row[j - 1]
            cand_diag = Cell(origin.cost + abs(a - b),
                             origin.segments,
                             origin.gaps,
                             'diag')
            cand_up = gap_step(prev_row[j], 'up', abs(a))
            cand_left = gap_step(row[j - 1], 'left', abs(b))
            row[j] = min((cand_diag, cand_up, cand_left), key=rank)

    # Walk back from the bottom-right corner following the stored steps.
    aligned1 = []
    aligned2 = []
    i, j = n, m
    while i > 0 or j > 0:
        step = dp[i][j].prev_dir
        if step == 'diag':
            aligned1.append(seq1[i - 1])
            aligned2.append(seq2[j - 1])
            i, j = i - 1, j - 1
        elif step == 'up':
            aligned1.append(seq1[i - 1])
            aligned2.append(None)
            i -= 1
        else:
            aligned1.append(None)
            aligned2.append(seq2[j - 1])
            j -= 1

    aligned1.reverse()
    aligned2.reverse()

    total_cost = int(dp[n][m].cost)
    return aligned1, aligned2, total_cost
+###################################################################################
 print('Module loaded!')
 print('=' * 70)
 print('Enjoy! :)')

midi_to_colab_audio.py CHANGED Viewed

@@ -3233,14 +3233,27 @@ def normalize_audio(audio: np.ndarray,
 #===============================================================================
 def midi_opus_to_colab_audio(midi_opus,
-                              soundfont_path='/usr/share/sounds/sf2/FluidR3_GM.sf2',
-                              sample_rate=16000, # 44100
-                              volume_level_db=-1,
-                              trim_silence=True,
-                              silence_threshold=0.1,
-                              output_for_gradio=False,
-                              write_audio_to_WAV=''
-                              ):
     if midi_opus[1]:
@@ -3263,7 +3276,37 @@ def midi_opus_to_colab_audio(midi_opus,
         for chan in range(16):
             # channel 9 = percussion GM bank 128
             fl.program_select(chan, sfid, 128 if chan == 9 else 0, 0)
         # Playback vars
         tempo = int((60 / 120) * 1e6)  # default 120bpm
         last_t = 0
@@ -3299,11 +3342,11 @@ def midi_opus_to_colab_audio(midi_opus,
             elif name == "key_after_touch":
                 chan, note, vel = data
-                fl.key_pressure(chan, note, vel)
             elif name == "channel_after_touch":
                 chan, vel = data
-                fl.channel_pressure(chan, vel)
             elif name == "pitch_wheel_change":
                 chan, wheel = data
@@ -3373,6 +3416,8 @@ def midi_opus_to_colab_audio(midi_opus,
         # Optionally write WAV to disk
         if write_audio_to_WAV:
             wav_name = midi_file.rsplit('.', 1)[0] + '.wav'
             pcm = np.int16(raw_audio.T / np.max(np.abs(raw_audio)) * 32767)
             with wave.open(wav_name, 'wb') as wf:
                 wf.setframerate(sample_rate)
@@ -3393,8 +3438,21 @@ def midi_to_colab_audio(midi_file,
                         volume_level_db=-1,
                         trim_silence=True,
                         silence_threshold=0.1,
                         output_for_gradio=False,
-                        write_audio_to_WAV=False
                        ):
     """
     Returns raw audio to pass to IPython.disaply.Audio func
@@ -3427,6 +3485,35 @@ def midi_to_colab_audio(midi_file,
         # channel 9 = percussion GM bank 128
         fl.program_select(chan, sfid, 128 if chan == 9 else 0, 0)
     # Playback vars
     tempo = int((60 / 120) * 1e6)  # default 120bpm
     last_t = 0
@@ -3462,11 +3549,11 @@ def midi_to_colab_audio(midi_file,
         elif name == "key_after_touch":
             chan, note, vel = data
-            fl.key_pressure(chan, note, vel)
         elif name == "channel_after_touch":
             chan, vel = data
-            fl.channel_pressure(chan, vel)
         elif name == "pitch_wheel_change":
             chan, wheel = data
@@ -3536,6 +3623,8 @@ def midi_to_colab_audio(midi_file,
     # Optionally write WAV to disk
     if write_audio_to_WAV:
         wav_name = midi_file.rsplit('.', 1)[0] + '.wav'
         pcm = np.int16(raw_audio.T / np.max(np.abs(raw_audio)) * 32767)
         with wave.open(wav_name, 'wb') as wf:
             wf.setframerate(sample_rate)

 #===============================================================================
 def midi_opus_to_colab_audio(midi_opus,
+                             soundfont_path='/usr/share/sounds/sf2/FluidR3_GM.sf2',
+                             sample_rate=16000, # 44100
+                             volume_level_db=-1,
+                             trim_silence=True,
+                             silence_threshold=0.1,
+                             enable_reverb=False,
+                             reverb_param_dic={'roomsize': 0,
+                                               'damping': 0,
+                                               'width': 0,
+                                               'level': 0
+                                              },
+                             enable_chorus=False,
+                             chorus_param_dic={'nr': 0,
+                                               'level': 0,
+                                               'speed': 0.1,
+                                               'depth': 0,
+                                               'type': 0},
+                             output_for_gradio=False,
+                             write_audio_to_WAV=False,
+                             output_WAV_name=''
+                            ):
     if midi_opus[1]:
         for chan in range(16):
             # channel 9 = percussion GM bank 128
             fl.program_select(chan, sfid, 128 if chan == 9 else 0, 0)
+        if enable_reverb:
+            fl.set_reverb(roomsize=reverb_param_dic['roomsize'],
+                          damping=reverb_param_dic['damping'],
+                          width=reverb_param_dic['width'],
+                          level=reverb_param_dic['level']
+                         )
+            """
+            roomsize Reverb room size value (0.0-1.0)
+            damping Reverb damping value (0.0-1.0)
+            width Reverb width value (0.0-100.0)
+            level Reverb level value (0.0-1.0)
+            """
+        if enable_chorus:
+            fl.set_chorus(nr=chorus_param_dic['nr'],
+                          level=chorus_param_dic['level'],
+                          speed=chorus_param_dic['speed'],
+                          depth=chorus_param_dic['depth'],
+                          type=chorus_param_dic['type']
+                         )
+        """
+        nr Chorus voice count (0-99, CPU time consumption proportional to this value)
+        level Chorus level (0.0-10.0)
+        speed Chorus speed in Hz (0.29-5.0)
+        depth_ms Chorus depth (max value depends on synth sample rate, 0.0-21.0 is safe for sample rate values up to 96KHz)
+        type Chorus waveform type (0=sine, 1=triangle)
+        """
         # Playback vars
         tempo = int((60 / 120) * 1e6)  # default 120bpm
         last_t = 0
             elif name == "key_after_touch":
                 chan, note, vel = data
+                # fl.key_pressure(chan, note, vel)
             elif name == "channel_after_touch":
                 chan, vel = data
+                # fl.channel_pressure(chan, vel)
             elif name == "pitch_wheel_change":
                 chan, wheel = data
         # Optionally write WAV to disk
         if write_audio_to_WAV:
             wav_name = midi_file.rsplit('.', 1)[0] + '.wav'
+            if output_WAV_name != '':
+                wav_name = output_WAV_name
             pcm = np.int16(raw_audio.T / np.max(np.abs(raw_audio)) * 32767)
             with wave.open(wav_name, 'wb') as wf:
                 wf.setframerate(sample_rate)
                         volume_level_db=-1,
                         trim_silence=True,
                         silence_threshold=0.1,
+                        enable_reverb=False,
+                        reverb_param_dic={'roomsize': 0,
+                                          'damping': 0,
+                                          'width': 0,
+                                          'level': 0
+                                         },
+                        enable_chorus=False,
+                        chorus_param_dic={'nr': 0,
+                                          'level': 0,
+                                          'speed': 0.1,
+                                          'depth': 0,
+                                          'type': 0},
                         output_for_gradio=False,
+                        write_audio_to_WAV=False,
+                        output_WAV_name=''
                        ):
     """
     Returns raw audio to pass to IPython.disaply.Audio func
         # channel 9 = percussion GM bank 128
         fl.program_select(chan, sfid, 128 if chan == 9 else 0, 0)
+    if enable_reverb:
+        fl.set_reverb(roomsize=reverb_param_dic['roomsize'],
+                      damping=reverb_param_dic['damping'],
+                      width=reverb_param_dic['width'],
+                      level=reverb_param_dic['level']
+                     )
+        """
+        roomsize Reverb room size value (0.0-1.0)
+        damping Reverb damping value (0.0-1.0)
+        width Reverb width value (0.0-100.0)
+        level Reverb level value (0.0-1.0)
+        """
+    if enable_chorus:
+        fl.set_chorus(nr=chorus_param_dic['nr'],
+                      level=chorus_param_dic['level'],
+                      speed=chorus_param_dic['speed'],
+                      depth=chorus_param_dic['depth'],
+                      type=chorus_param_dic['type']
+                     )
+    """
+    nr Chorus voice count (0-99, CPU time consumption proportional to this value)
+    level Chorus level (0.0-10.0)
+    speed Chorus speed in Hz (0.29-5.0)
+    depth_ms Chorus depth (max value depends on synth sample rate, 0.0-21.0 is safe for sample rate values up to 96KHz)
+    type Chorus waveform type (0=sine, 1=triangle)
+    """
     # Playback vars
     tempo = int((60 / 120) * 1e6)  # default 120bpm
     last_t = 0
         elif name == "key_after_touch":
             chan, note, vel = data
+            # fl.key_pressure(chan, note, vel)
         elif name == "channel_after_touch":
             chan, vel = data
+            # fl.channel_pressure(chan, vel)
         elif name == "pitch_wheel_change":
             chan, wheel = data
     # Optionally write WAV to disk
     if write_audio_to_WAV:
         wav_name = midi_file.rsplit('.', 1)[0] + '.wav'
+        if output_WAV_name != '':
+            wav_name = output_WAV_name
         pcm = np.int16(raw_audio.T / np.max(np.abs(raw_audio)) * 32767)
         with wave.open(wav_name, 'wb') as wf:
             wf.setframerate(sample_rate)