Restructured files and added another snap function that does not relies on any bpm

2024-06-02 16:45:25 +02:00 · 2024-06-02 16:45:25 +02:00 · 177a8658f0
parent 31639c850e
commit 177a8658f0
2 changed files with 289 additions and 164 deletions
--- a/debug.py
+++ b/debug.py
@ -0,0 +1,272 @@
+from math import *
+import numpy as np
+from scipy.io import wavfile
+from scipy import signal
+import matplotlib.pyplot as plt
+import subprocess
+import wave as wv
+import struct
+import librosa
+import heapq
+import scipy
+import os
+import random
+from pathlib import Path
+from time import sleep
+from datetime import timedelta
+
+def adjust_timings(raw_data, snapped_data, indexes, thr=100):
+    """
+    adjusts weirdly snapped notes
+    """
+    current = 0
+
+    while(current < len(indexes)):
+    
+        if(current < len(indexes) - 3 and current % 2 == 1): # on a 1/4 beat
+            if(snapped_data[indexes[current]] > thr and snapped_data[indexes[current+1]] > thr and snapped_data[indexes[current+2]] > thr and snapped_data[indexes[current+3]] <= thr):
+                # -XXX_
+                snapped_data[indexes[current+3]] = snapped_data[indexes[current+2]]
+                snapped_data[indexes[current+2]] = 0
+
+        if(current > 0 and current < len(indexes) - 1 and current % 2 == 1):
+            if(snapped_data[indexes[current]] > thr and (snapped_data[indexes[current+1]] < thr or snapped_data[indexes[current-1]] < thr)):
+                #_X_
+                '''if(snapped_data[indexes[current-1]] < thr and raw_data[indexes[current-1]] > raw_data[indexes[current+1]]):
+                    snapped_data[indexes[current-1]] = snapped_data[indexes[current]]
+                else:
+                    snapped_data[indexes[current+1]] = snapped_data[indexes[current]]'''
+
+                snapped_data[indexes[current]] = 0
+
+        current += 1
+
+    print("Resnap done")
+    return snapped_data
+
+
+
+def snap(data, sample_rate, bpm, divisor, show=False):
+    # adjust time amplitudes to match the given BPM 
+    new = [0 for x in range(int(1000*len(data)/sample_rate))] # 1pt per millisecond
+    print("old =", len(data))
+    print("len =", 1000*len(data)/sample_rate)
+    k = 0
+    t = 0
+    percent = 0
+    for i in range(len(data)):
+
+        while(t < i/sample_rate):
+            t = k/(bpm*divisor)
+            k += 60
+        '''
+        if(np.abs(i/sample_rate - k/(bpm*divisor)) > np.abs(i/sample_rate - (k-60)/(bpm*divisor))):
+            k -= 60
+            t = k/(bpm*divisor)'''
+
+        if(i%(len(data)//100) == 0):
+            print(percent, "%")
+            percent += 1
+
+        if(int(t*1000) < len(new)):
+            new[int(t*1000)] = max(data[i], new[int(t*1000)])
+        else:
+            new[len(new)-1] = max(data[i], new[len(new)-1])
+
+    if(show):
+        t = [j/1000 for j in range(len(new))]
+        plt.plot(t, new)
+        plt.xlabel("Time (e)")
+        plt.ylabel("Amplitude")
+        plt.grid()
+        plt.show()
+
+    return new
+
+def snap2(data, sample_rate, bpm, first_offset=0, div=4, show=False, adjust=False):
+    """
+    data : list(int)
+    sample_rate : int
+    bpm = float
+    """
+
+    song_len = int(len(data)/sample_rate)
+
+    indexes = []
+    app = True
+
+    reduced = [0 for i in range(song_len*1000)]
+    new = [0 for i in range(song_len*1000)]
+
+    # build the reduced version
+    for i in range(len(data)):
+        x = int(i*1000/sample_rate)
+        if(x < len(reduced)):
+            reduced[x] = max(reduced[x], data[i])
+
+
+    print("Build done")
+    # snap
+    k = 0
+    current_t = first_offset
+
+    while(current_t < 0):
+        k += 1
+        current_t = first_offset + k*60/(bpm*div)
+
+    for j in range(len(new)):
+        if(j/1000 > current_t):
+            k += 1
+            current_t = first_offset + k*60/(bpm*div)
+            app = True
+
+        y = int(current_t*1000)
+        if(y < len(new)):
+            new[y] = max(new[y], reduced[j])
+
+            if(app):
+                indexes.append(y)
+                app = False 
+
+    print("Snap done")
+    
+    if(adjust):
+        print("Len :", len(indexes))
+
+        new = adjust_timings(reduced, new, indexes)
+
+    
+    if(show):
+        new2 = [0.9 if new[i] != 0 else 0 for i in range(len(new))]
+
+        t = [j/1000+first_offset for j in range(len(new))]
+        beats_1 = [0 for j in range(len(new))]
+        beats_2 = [0 for k in range(len(new))]
+        beats_4 = [0 for l in range(len(new))]
+
+        k = 0
+        current_t = first_offset
+
+        while(current_t < 0):
+            k += 1
+            current_t = first_offset + k*60/(bpm*div)
+
+        while(1000*current_t < len(new)):
+            beats_4[int(1000*current_t)] = 0.9
+
+            if(k % 2 == 0):
+                beats_2[int(1000*current_t)] = 0.92
+
+            if(k % 4 == 0):
+                beats_1[int(1000*current_t)] = 0.94
+
+            k += 1
+            current_t = first_offset + k*60/(bpm*div)
+
+        plt.plot(t, new2, "bo")
+        plt.plot(t, beats_4, "r-")
+        plt.plot(t, beats_2, "y-")
+        plt.plot(t, beats_1, "g-")
+        plt.xlabel("Time (s)")
+        plt.ylabel("Amplitude")
+        plt.grid()
+        plt.show()
+
+    return new
+
+def filter_peaks(data, sample_rate=44100, thr=1000):
+    tdata = []
+    times = []
+
+    for i in range(len(data)):
+        if data[i] > thr:
+            tdata.append(data[i])
+            times.append(i/sample_rate)
+
+    return (tdata, times)
+    '''
+    times is in seconds
+    '''
+
+def get_spacing(data, sample_rate=44100, show=False, retrieve=False):
+    tdata, times = filter_peaks(data, sample_rate=sample_rate)
+
+    absc = [i for i in range(len(times))]
+    dt = [0]
+
+    for i in range(1, len(times)):
+        dt.append(1000*(times[i]-times[i-1]))
+
+    if(show):
+        plt.plot(absc, dt)
+        plt.xlabel("x")
+        plt.ylabel("T(peak x) - T(peak x-1) (ms)")
+        plt.grid()
+        plt.show()
+
+    if(retrieve):
+        return dt
+
+    '''
+    post-condition : 
+    - dt[i] = time(peak number i) - time(peak number i-1)
+    - dt is in ms
+    '''
+
+def snap3(data, sample_rate=44100, mintime=10, initial_plot=False, after_plot=False):
+    '''
+    explaination : 
+    1) get the time differences (cf get_spacing)
+    2) for eack peak : 2 cases
+        - if it's farther than mintime (in ms) :
+            > calculate the weighted mean if all elements in temp_list
+            > place a note at that mean
+            > empty temp_list
+            > push the current peak to temp_list
+        - else :
+            > push the current peak to temp_list
+    '''
+    data_peaks, peak_times = filter_peaks(data, sample_rate=sample_rate)
+    time_diff = get_spacing(data, show=initial_plot, retrieve=True)
+
+    res_peaks = []
+    res_times = []
+
+    segments = []
+    seglen = []
+
+    current_left = 0
+
+    for i in range(len(peak_times)):
+        if(time_diff[i] > mintime):
+            segments.append([current_left, i])
+            seglen.append(peak_times[i]-peak_times[current_left])
+            res_peaks.append(500)
+            res_times.append(peak_times[i])
+            current_left = i
+
+    for i in range(len(segments)):
+        print(segments[i], ":", seglen[i])
+
+    if(after_plot):
+        peakplot = []
+        diffplot = []
+        for x in range(len(peak_times)):
+            peakplot.append(peak_times[x]-peak_times[x]/1000)
+            peakplot.append(peak_times[x])
+            peakplot.append(peak_times[x]+peak_times[x]/1000)
+            diffplot.append(0)
+            diffplot.append(time_diff[x])
+            diffplot.append(0)
+
+        plt.plot(res_times, res_peaks, "ro", label="placed beats")
+        plt.plot(peakplot, diffplot, label="derivatine of time")
+        plt.xlabel("t (s)")
+        plt.ylabel(".")
+        plt.legend(loc="upper left")
+        plt.grid()
+        plt.show()
+
+    return (res_peaks, res_times)
+
+    
--- a/sound_process.py
+++ b/sound_process.py
@ -15,6 +15,8 @@ from pathlib import Path
 from time import sleep
 from datetime import timedelta

+import debug
+
 print("Starting...\n")

 def filter_n_percent_serial(song_name, offset, n_iter, step, threshold):
@ -283,11 +285,11 @@ def test_sample(timelist):
        print("F")
        sleep(timelist[i]-timelist[i-1])

-def convert_tuple(datares, freq):
+def convert_tuple(data, times):
    """
-    Takes datares and converts it to a list of tuples (amplitude, datetimes)
+    Takes data and converts it to a list of tuples (amplitude, datetimes)
    """
-    return [(timedelta(milliseconds=i), datares[i], freq[i]) for i in range(len(datares)) if datares[i] > 0]
+    return [(times[i], data[i]) for i in range(len(data))]

 def get_songlen(filename):
    """
@ -298,163 +300,6 @@ def get_songlen(filename):

    return (len(global_data)/sample_rate)

-def snap(data, sample_rate, bpm, divisor, show=False):
-    # adjust time amplitudes to match the given BPM 
-    new = [0 for x in range(int(1000*len(data)/sample_rate))] # 1pt per millisecond
-    print("old =", len(data))
-    print("len =", 1000*len(data)/sample_rate)
-    k = 0
-    t = 0
-    percent = 0
-    for i in range(len(data)):
-
-        while(t < i/sample_rate):
-            t = k/(bpm*divisor)
-            k += 60
-        '''
-        if(np.abs(i/sample_rate - k/(bpm*divisor)) > np.abs(i/sample_rate - (k-60)/(bpm*divisor))):
-            k -= 60
-            t = k/(bpm*divisor)'''
-
-        if(i%(len(data)//100) == 0):
-            print(percent, "%")
-            percent += 1
-
-        if(int(t*1000) < len(new)):
-            new[int(t*1000)] = max(data[i], new[int(t*1000)])
-        else:
-            new[len(new)-1] = max(data[i], new[len(new)-1])
-
-    if(show):
-        t = [j/1000 for j in range(len(new))]
-        plt.plot(t, new)
-        plt.xlabel("Time (e)")
-        plt.ylabel("Amplitude")
-        plt.grid()
-        plt.show()
-
-    return new
-
-def adjust_timings(raw_data, snapped_data, indexes, thr=100):
-    """
-    adjusts weirdly snapped notes
-    """
-    current = 0
-
-    while(current < len(indexes)):
-    
-        if(current < len(indexes) - 3 and current % 2 == 1): # on a 1/4 beat
-            if(snapped_data[indexes[current]] > thr and snapped_data[indexes[current+1]] > thr and snapped_data[indexes[current+2]] > thr and snapped_data[indexes[current+3]] <= thr):
-                # -XXX_
-                snapped_data[indexes[current+3]] = snapped_data[indexes[current+2]]
-                snapped_data[indexes[current+2]] = 0
-
-        if(current > 0 and current < len(indexes) - 1 and current % 2 == 1):
-            if(snapped_data[indexes[current]] > thr and (snapped_data[indexes[current+1]] < thr or snapped_data[indexes[current-1]] < thr)):
-                #_X_
-                '''if(snapped_data[indexes[current-1]] < thr and raw_data[indexes[current-1]] > raw_data[indexes[current+1]]):
-                    snapped_data[indexes[current-1]] = snapped_data[indexes[current]]
-                else:
-                    snapped_data[indexes[current+1]] = snapped_data[indexes[current]]'''
-
-                snapped_data[indexes[current]] = 0
-
-        current += 1
-
-    print("Resnap done")
-    return snapped_data
-
-def snap2(data, sample_rate, bpm, first_offset=0, div=4, show=False, adjust=False):
-    """
-    data : list(int)
-    sample_rate : int
-    bpm = float
-    """
-
-    song_len = int(len(data)/sample_rate)
-
-    indexes = []
-    app = True
-
-    reduced = [0 for i in range(song_len*1000)]
-    new = [0 for i in range(song_len*1000)]
-
-    # build the reduced version
-    for i in range(len(data)):
-        x = int(i*1000/sample_rate)
-        if(x < len(reduced)):
-            reduced[x] = max(reduced[x], data[i])
-
-
-    print("Build done")
-    # snap
-    k = 0
-    current_t = first_offset
-
-    while(current_t < 0):
-        k += 1
-        current_t = first_offset + k*60/(bpm*div)
-
-    for j in range(len(new)):
-        if(j/1000 > current_t):
-            k += 1
-            current_t = first_offset + k*60/(bpm*div)
-            app = True
-
-        y = int(current_t*1000)
-        if(y < len(new)):
-            new[y] = max(new[y], reduced[j])
-
-            if(app):
-                indexes.append(y)
-                app = False 
-
-    print("Snap done")
-    
-    if(adjust):
-        print("Len :", len(indexes))
-
-        new = adjust_timings(reduced, new, indexes)
-
-    
-    if(show):
-        new2 = [0.9 if new[i] != 0 else 0 for i in range(len(new))]
-
-        t = [j/1000+first_offset for j in range(len(new))]
-        beats_1 = [0 for j in range(len(new))]
-        beats_2 = [0 for k in range(len(new))]
-        beats_4 = [0 for l in range(len(new))]
-
-        k = 0
-        current_t = first_offset
-
-        while(current_t < 0):
-            k += 1
-            current_t = first_offset + k*60/(bpm*div)
-
-        while(1000*current_t < len(new)):
-            beats_4[int(1000*current_t)] = 0.9
-
-            if(k % 2 == 0):
-                beats_2[int(1000*current_t)] = 0.92
-
-            if(k % 4 == 0):
-                beats_1[int(1000*current_t)] = 0.94
-
-            k += 1
-            current_t = first_offset + k*60/(bpm*div)
-
-        plt.plot(t, new2, "bo")
-        plt.plot(t, beats_4, "r-")
-        plt.plot(t, beats_2, "y-")
-        plt.plot(t, beats_1, "g-")
-        plt.xlabel("Time (s)")
-        plt.ylabel("Amplitude")
-        plt.grid()
-        plt.show()
-
-    return new
-
 def convert_to_wav(song_name:str, output_file="audio.wav") -> str:
    """
    Converts the song to .wav, only if it's not already in wave format.
@ -495,16 +340,24 @@ def process_song(filename, bpm, offset0=0, div_len_factor=1, n_iter_2=-1, thresh
    filtered_name = f"{filename}_trimmed.wav"

    void_freq(filename, offset, min(song_len, offset+div_len*(n_iter+1)+0.01), 4*60/bpm, minfreq=0, maxfreq=220, upperthr=5000, ampthr=60, ampfreq = 1200, ampval = 5.0, leniency = 0.005, write=True, linear=False, output_file=filtered_name)
-    #void_freq(filename, offset, offset+div_len*(n_iter+1)+0.01, 4*60/bpm, minfreq=0, maxfreq=330, upperthr=2500, ampthr=60, ampfreq = 1200, ampval = 1/2000, leniency = 0.0, write=True, linear=True, output_file=filtered_name)
+    
    datares = filter_n_percent_serial(filtered_name, offset, n_iter, div_len, threshold) 
-    #datares = snap(datares, 44100, bpm, 4, True)
-    datares = snap2(datares, 44100, bpm, first_offset=offset, div=divisor, show=True, adjust=True)
+
+    (snapped_data, times) = debug.snap3(datares, mintime=50, initial_plot=True, after_plot=True)
+
+    #frequencies=get_freq(filtered_name, offset, div_len, div_len*n_iter, snapped_data, True)
+    Path(f"{filename}_trimmed.wav").unlink()
+    return convert_tuple(snapped_data, times)
+
+    '''
+    datares = debug.snap2(datares, 44100, bpm, first_offset=offset, div=divisor, show=True, adjust=True)
    frequencies = get_freq(filtered_name, offset, div_len, div_len*n_iter, datares, True)
    Path(f"{filename}_trimmed.wav").unlink()
    return convert_tuple(datares, frequencies)
+    '''

 def main():
-    data = process_song("tetris_4.wav", 160, n_iter_2=48, threshold=100)
+    data = process_song("tetris_4.wav", 160, n_iter_2=48)
    #print(data)
    print("Program finished with return 0")