Replace minor libfmp helpers locally

Curucail · Curucail · commit c02090a9dc6f · 2026-05-12T13:20:54.000+02:00
diff --git a/sync_audio_audio_full.ipynb b/sync_audio_audio_full.ipynb
@@ -34,8 +34,7 @@
     "import matplotlib.pyplot as plt\n",
     "import IPython.display as ipd\n",
     "import scipy.interpolate\n",
-    "from libfmp.b.b_plot import plot_signal, plot_chromagram\n",
-    "from libfmp.c3.c3s2_dtw_plot import plot_matrix_with_points\n",
+    "from synctoolbox.feature.visualization import plot_chromagram, plot_matrix_with_points, plot_signal\n",
     "\n",
     "from synctoolbox.dtw.mrmsdtw import sync_via_mrmsdtw\n",
     "from synctoolbox.dtw.utils import compute_optimal_chroma_shift, shift_chroma_vectors, make_path_strictly_monotonic, evaluate_synchronized_positions\n",
@@ -123,7 +122,6 @@
    },
    "outputs": [],
    "source": [
-    "import libfmp.c2\n",
     "# Alternative: librosa.estimate_tuning\n",
     "tuning_offset_1 = estimate_tuning(audio_1, Fs)\n",
     "tuning_offset_2 = estimate_tuning(audio_2, Fs)\n",
diff --git a/sync_audio_audio_simple.ipynb b/sync_audio_audio_simple.ipynb
@@ -30,8 +30,7 @@
     "import librosa.display\n",
     "import matplotlib.pyplot as plt\n",
     "import IPython.display as ipd\n",
-    "from libfmp.b.b_plot import plot_signal, plot_chromagram\n",
-    "from libfmp.c3.c3s2_dtw_plot import plot_matrix_with_points\n",
+    "from synctoolbox.feature.visualization import plot_chromagram, plot_matrix_with_points, plot_signal\n",
     "\n",
     "from synctoolbox.dtw.core import compute_warping_path\n",
     "from synctoolbox.dtw.cost import cosine_distance\n",
diff --git a/sync_audio_score_full.ipynb b/sync_audio_score_full.ipynb
@@ -29,8 +29,8 @@
    "source": [
     "# Loading some modules and defining some constants used later\n",
     "import IPython.display as ipd\n",
-    "from libfmp.b import list_to_pitch_activations, plot_chromagram, plot_signal, plot_matrix, \\\n",
-    "                     sonify_pitch_activations_with_signal\n",
+    "from synctoolbox.feature.sonification import list_to_pitch_activations, sonify_pitch_activations_with_signal\n",
+    "from synctoolbox.feature.visualization import plot_chromagram, plot_matrix, plot_signal\n",
     "import librosa.display\n",
     "import matplotlib.pyplot as plt\n",
     "import numpy as np\n",
@@ -119,7 +119,6 @@
    },
    "outputs": [],
    "source": [
-    "import libfmp.c2\n",
     "# Alternative: librosa.estimate_tuning\n",
     "tuning_offset = estimate_tuning(audio, Fs)\n",
     "print('Estimated tuning deviation for recording: %d cents' % (tuning_offset))"
diff --git a/synctoolbox/dtw/utils.py b/synctoolbox/dtw/utils.py
@@ -1,5 +1,4 @@
 import numpy as np
-from libfmp.c3 import compute_strict_alignment_path_mask
 from typing import List
 
 from synctoolbox.dtw.core import compute_warping_path
@@ -243,8 +242,6 @@ def find_anchor_indices_in_warping_path(warping_path: np.ndarray,
 def make_path_strictly_monotonic(P: np.ndarray) -> np.ndarray:
     """Compute strict alignment path from a warping path
 
-    Wrapper around "compute_strict_alignment_path_mask" from libfmp.
-
     Parameters
     ----------
     P: np.ndarray [shape=(2, N)]
@@ -255,9 +252,14 @@ def make_path_strictly_monotonic(P: np.ndarray) -> np.ndarray:
     P_mod: np.ndarray [shape=(2, M)]
         Strict alignment path, M <= N
     """
-    P_mod = compute_strict_alignment_path_mask(P.T)
-
-    return P_mod.T
+    P_transposed = np.array(P.T, copy=True)
+    N, M = P_transposed[-1]
+    keep_mask = (P_transposed[1:, 0] > P_transposed[:-1, 0]) & (P_transposed[1:, 1] > P_transposed[:-1, 1])
+    keep_mask = np.concatenate(([True], keep_mask))
+    keep_mask[(P_transposed[:, 0] == N) | (P_transposed[:, 1] == M)] = False
+    keep_mask[-1] = True
+
+    return P_transposed[keep_mask, :].T
 
 
 def evaluate_synchronized_positions(ground_truth_positions: np.ndarray,
diff --git a/synctoolbox/feature/csv_tools.py b/synctoolbox/feature/csv_tools.py
@@ -1,7 +1,7 @@
+import csv
 import os.path
 import subprocess
 
-import libfmp.c1
 import music21
 import numpy as np
 import pandas as pd
@@ -343,7 +343,7 @@ def __get_audio_duration_from_df(df: pd.DataFrame) -> float:
 
 def music_xml_to_csv_musical_time(xml, csv_filepath: str):
     """Convert a music xml file to a list of note events, with starts and durations as fractions of measures, and stores
-    it as a csv file in libfmp format.
+    it as a csv file.
 
     Args:
         xml (str or music21.stream.Score): Either a path to a music xml file or a music21.stream.Score
@@ -367,7 +367,7 @@ def music_xml_to_csv_musical_time(xml, csv_filepath: str):
     xml_data = xml_data_expanded
 
     score = []
-    # First, get starts and ends of notes in terms of quarters (similar to 'xml_to_list' in libfmp)
+    # First, get starts and ends of notes in terms of quarters.
     for part in xml_data.parts:
         instrument = __get_part_instrument_name(part)
         for note in part.flatten().notes:
@@ -419,13 +419,14 @@ def get_position_in_fraction_of_measures(position_in_quarters, is_end=False):
     for i in range(len(score)):
         start = get_position_in_fraction_of_measures(score[i][0])
         end = get_position_in_fraction_of_measures(score[i][1], is_end=True)
-        # To stay compatible with libfmp functions, we store this as a list with start and duration,
+        # Store this as a list with start and duration,
         # although many of our annotations are actually stored as start and end...
         score[i][0] = start
         score[i][1] = end - start
 
     score = sorted(score, key=lambda x: (x[0], x[2]))
-    libfmp.c1.list_to_csv(score, csv_filepath)
+    df = pd.DataFrame(score, columns=['Start', 'Duration', 'Pitch', 'Velocity', 'Instrument'])
+    df.to_csv(csv_filepath, sep=';', index=False, quoting=csv.QUOTE_NONNUMERIC)
 
 
 def midi_to_music_xml_musescore(midi_filepath: str, musescore_executable: str = "musescore"):
diff --git a/synctoolbox/feature/dlnco.py b/synctoolbox/feature/dlnco.py
@@ -1,6 +1,7 @@
 import matplotlib.pyplot as plt
 import numpy as np
-from libfmp.b import MultiplePlotsWithColorbar, plot_chromagram, plot_matrix
+
+from synctoolbox.feature.visualization import plot_chromagram
 
 
 def pitch_onset_features_to_DLNCO(f_peaks: dict,
diff --git a/synctoolbox/feature/novelty.py b/synctoolbox/feature/novelty.py
@@ -1,5 +1,4 @@
 import librosa
-from libfmp.c6 import compute_local_average
 import numpy as np
 
 
@@ -59,7 +58,7 @@ def spectral_flux(f_audio: np.ndarray,
 
     # Compute local average
     M = int(np.ceil(M_sec * Fs / hop_size))
-    local_average = compute_local_average(nov, M)
+    local_average = __compute_local_average(nov, M)
 
     # Subtract the local average from the novelty curve
     nov_norm = nov - local_average
@@ -68,6 +67,18 @@ def spectral_flux(f_audio: np.ndarray,
     return nov_norm
 
 
+def __compute_local_average(x: np.ndarray, M: int) -> np.ndarray:
+    """Average ``x`` over a centered window with a fixed denominator.
+
+    For every index ``m`` the samples ``x[m - M : m + M + 1]`` (clipped to
+    the valid index range) are summed and divided by ``2 * M + 1``. The
+    divisor is not reduced where the window is clipped at the borders.
+
+    Parameters
+    ----------
+    x : np.ndarray
+        Input curve (assumed one-dimensional).
+
+    M : int
+        Number of samples taken on each side of the center sample.
+
+    Returns
+    -------
+    local_average : np.ndarray
+        Local average, same length as ``x``.
+    """
+    num_samples = len(x)
+    # cumulative[k] holds sum(x[:k]), so any window sum is a difference of two entries.
+    cumulative = np.concatenate(([0], np.cumsum(x)))
+    centers = np.arange(num_samples)
+    window_start = np.maximum(centers - M, 0)
+    window_stop = np.minimum(centers + M + 1, num_samples)
+    averaged = np.zeros(num_samples)
+    averaged[:] = (cumulative[window_stop] - cumulative[window_start]) / (2 * M + 1)
+    return averaged
+
+
 def add_decay(nov_norm: np.ndarray,
               filter_coeff: np.ndarray = np.sqrt(1 / np.arange(1, 11))):
     # Add a temporal decay to the novelty curve.
diff --git a/synctoolbox/feature/pitch.py b/synctoolbox/feature/pitch.py
@@ -1,10 +1,10 @@
-from libfmp.b import plot_matrix
 import numpy as np
 import matplotlib.pyplot as plt
 from scipy import signal
 
 from synctoolbox.feature.filterbank import FS_PITCH, generate_list_of_downsampled_audio, get_fs_index,\
     generate_filterbank
+from synctoolbox.feature.visualization import plot_matrix
 
 PITCH_NAME_LABELS = ['   ', '   ', '   ', '   ', '   ', '   ', '   ', '   ', '   ', '   ', '   ',
                      'C0 ', '   ', '   ', '   ', '   ', '   ', '   ', '   ', '   ', '   ', '   ', '   ',
diff --git a/synctoolbox/feature/sonification.py b/synctoolbox/feature/sonification.py
@@ -0,0 +1,74 @@
+import numpy as np
+
+
+def list_to_pitch_activations(note_list, num_frames, frame_rate):
+    """Create a pitch activation matrix from a list of note events.
+
+    Parameters
+    ----------
+    note_list : list
+        Note events. Each event is indexed as ``[start, duration, pitch, ...]``;
+        ``start`` and ``start + duration`` are multiplied by ``frame_rate`` to
+        obtain frame indices.
+
+    num_frames : int
+        Number of frames (columns) of the activation matrix.
+
+    frame_rate : float
+        Number of frames per time unit of ``start`` / ``duration``.
+
+    Returns
+    -------
+    P : np.ndarray [shape=(128, num_frames)]
+        Binary activation matrix; row ``i`` belongs to pitch ``i + 1``.
+
+    F_coef_MIDI : np.ndarray [shape=(128,)]
+        Pitch value of every row (1, ..., 128).
+    """
+    P = np.zeros((128, num_frames))
+    F_coef_MIDI = np.arange(128) + 1
+    for note in note_list:
+        row = int(note[2] - 1)
+        if row < 0:
+            # Pitches below 1 have no row. Without this guard the negative
+            # index would wrap around and activate an unrelated high pitch.
+            continue
+        start_frame = max(0, int(note[0] * frame_rate))
+        end_frame = min(num_frames, int((note[0] + note[1]) * frame_rate) + 1)
+        P[row, start_frame:end_frame] = 1
+    return P, F_coef_MIDI
+
+
+def sonify_pitch_activations(P,
+                             N,
+                             frame_rate,
+                             Fs,
+                             min_pitch=1,
+                             Fc=440,
+                             harmonics_weights=(1,),
+                             fading_msec=5):
+    """Sonify a pitch activation matrix using sinusoidal tones.
+
+    Parameters
+    ----------
+    P : np.ndarray [shape=(num_pitches, num_frames)]
+        Activation matrix; row ``p`` is rendered at pitch ``min_pitch + p``.
+
+    N : int
+        Length of the generated signal in samples.
+
+    frame_rate : float
+        Frame rate of ``P``; frame ``n`` covers the samples between
+        ``(n - 0.5) * Fs / frame_rate`` and ``(n + 0.5) * Fs / frame_rate``.
+
+    Fs : float
+        Sampling rate of the generated signal.
+
+    min_pitch : int
+        Pitch assigned to the first row of ``P``.
+
+    Fc : float
+        Frequency assigned to pitch 69.
+
+    harmonics_weights : sequence of float
+        Amplitude of the fundamental and of each subsequent harmonic.
+
+    fading_msec : float
+        Length of the linear fade-in / fade-out ramps in milliseconds.
+
+    Returns
+    -------
+    pitch_son : np.ndarray [shape=(N,)]
+        Sonification scaled to a peak magnitude of 1. If nothing is active
+        (or ``N`` is 0) the unscaled all-zero signal is returned instead of
+        dividing by a zero peak.
+    """
+    fade_sample = int(fading_msec / 1000 * Fs)
+    sample_idx = np.arange(N)  # shared by all pitches and harmonics
+    pitch_son = np.zeros((N,))
+
+    for p in range(P.shape[0]):
+        activations = P[p, :]
+        active_frames = np.flatnonzero(np.abs(activations) > 0)
+        if active_frames.size == 0:
+            continue
+
+        freq = (2 ** ((min_pitch + p - 69) / 12)) * Fc
+        sin_tone = np.zeros((N,))
+        for i, cur_harmonic_weight in enumerate(harmonics_weights):
+            sin_tone += cur_harmonic_weight * np.sin(2 * np.pi * (i + 1) * freq * sample_idx / Fs)
+
+        # Amplitude envelope: a plateau per active frame with linear ramps.
+        weights = np.zeros((N,))
+        for n in active_frames:
+            amplitude = activations[n]
+            start = min(N, max(0, int((n - 0.5) * Fs / frame_rate)))
+            end = min(N, int((n + 0.5) * Fs / frame_rate))
+            fade_start = min(N, start + fade_sample)
+            fade_end = min(N, end + fade_sample)
+
+            weights[fade_start:end] += amplitude
+            weights[start:fade_start] += np.linspace(0, amplitude, fade_start - start)
+            weights[end:fade_end] += np.linspace(amplitude, 0, fade_end - end)
+
+        pitch_son += weights * sin_tone
+
+    # Peak-normalize only when there is a peak; a silent or empty signal
+    # would otherwise yield NaNs (or an error from np.max on an empty array).
+    peak = np.max(np.abs(pitch_son)) if pitch_son.size > 0 else 0
+    if peak > 0:
+        pitch_son = pitch_son / peak
+    return pitch_son
+
+
+def sonify_pitch_activations_with_signal(P,
+                                         x,
+                                         frame_rate,
+                                         Fs,
+                                         min_pitch=1,
+                                         Fc=440,
+                                         harmonics_weights=(1,),
+                                         fading_msec=5,
+                                         stereo=True):
+    """Sonify a pitch activation matrix and combine it with a signal.
+
+    The sonification is scaled to the RMS level of ``x`` before mixing.
+
+    Parameters
+    ----------
+    P : np.ndarray
+        Pitch activation matrix, passed on to ``sonify_pitch_activations``.
+
+    x : np.ndarray
+        Signal to combine with the sonification (assumed one-dimensional);
+        its size determines the length of the sonification.
+
+    frame_rate, Fs, min_pitch, Fc, harmonics_weights, fading_msec
+        Passed on unchanged to ``sonify_pitch_activations``.
+
+    stereo : bool
+        If True, stack ``x`` and the scaled sonification as two rows;
+        otherwise add them sample by sample.
+
+    Returns
+    -------
+    pitch_son : np.ndarray
+        Sonification as returned by ``sonify_pitch_activations``.
+
+    out : np.ndarray
+        Combination of ``x`` and the RMS-matched sonification.
+    """
+    N = x.size
+    pitch_son = sonify_pitch_activations(P, N, frame_rate, Fs, min_pitch=min_pitch, Fc=Fc,
+                                         harmonics_weights=harmonics_weights, fading_msec=fading_msec)
+
+    # Match the RMS level of x. A silent (or non-finite) sonification has no
+    # usable RMS, so it contributes nothing instead of turning the mix into NaNs.
+    rms_pitch = np.sqrt(np.mean(pitch_son ** 2)) if N > 0 else 0.0
+    if rms_pitch > 0:
+        pitch_scaled = pitch_son * np.sqrt(np.mean(x ** 2)) / rms_pitch
+    else:
+        pitch_scaled = np.zeros_like(pitch_son)
+
+    if stereo:
+        out = np.vstack((x, pitch_scaled))
+    else:
+        out = x + pitch_scaled
+
+    return pitch_son, out
diff --git a/synctoolbox/feature/visualization.py b/synctoolbox/feature/visualization.py
diff --git a/tests/test_dtw.py b/tests/test_dtw.py
diff --git a/tests/test_features.py b/tests/test_features.py