init

2024-09-30 17:56:32 +02:00 · 2024-09-30 17:56:32 +02:00 · 9e7c18930f
parent 95e06d3235
commit 9e7c18930f
5 changed files with 349 additions and 674 deletions
--- a/cleaned_sp.py
+++ b/cleaned_sp.py
@ -0,0 +1,349 @@
+from math import *
+import numpy as np
+import scipy as scp
+from scipy.io import wavfile
+import matplotlib.pyplot as plt
+import subprocess
+import heapq
+from pathlib import Path
+from time import sleep
+
+def is_data_stereo(raw_global_data:list) -> bool:
+    """
+    self-explainatory
+    """
+    try:
+        assert(raw_global_data[0][0])
+    except IndexError:
+        return False
+    except AssertionError:
+        return True
+    return True
+
+def retrieve_dominant_freqs(song_name, offset, songlen, segsize):
+    # returns a list with peak frequencies alongside the sample rate
+    # /!\ song_name is specified to be a list, NOT a list of couples (aka song is mono)
+    # segsize is in seconds
+    
+    # remove high_pitched/low-pitched frequencies
+    minfreq = 110
+    maxfreq = 440*8
+    
+    # cutting the song to only keep the one we're interested in
+    subprocess.run(["ffmpeg", "-ss", str(offset), "-t", str(songlen+offset), "-i", song_name, "crop.wav"], shell=False) 
+
+    # extracting data from cropped song
+    sample_rate, raw_song_data = wavfile.read("crop.wav")
+    blit = int(sample_rate*segsize) # Te
+
+    song_data = [0 for i in range(len(raw_song_data))]
+
+    a = 0
+    if(is_data_stereo(raw_song_data)):
+        print("Converting to mono...")
+        for x in range(len(raw_song_data)):
+            song_data[x] = raw_song_data[x][0]/2 + raw_song_data[x][1]/2
+
+            if(x % (int(len(raw_song_data)/100)) == 0):
+                print(a, "/ 100")
+                a += 1
+    else:
+        song_data = raw_song_data
+
+    # remove the copy of the song
+    subprocess.run(["rm", "crop.wav"], shell=False)
+    
+    # calculate the frequencies associated to the FFTs
+    pfreq = scp.fft.rfftfreq(blit, 1/sample_rate)
+
+    # left boundary of segment to crop
+    current_time = offset
+
+    # list of FFTs
+    fft_list = []
+    
+    # number of samples
+    k = 0
+
+    print("Retrieving freqs from", offset, "to", songlen+offset, "...")
+    print("amplitudes are from", minfreq, "to", maxfreq)
+    while(current_time < songlen-segsize):
+        # index corresponding to left boundary
+        left_id = int(current_time*sample_rate)
+        
+        # index corresponding to right boundary
+        right_id = int((current_time+segsize)*sample_rate)
+        
+        # calculate the fft, append it to fft_list
+        pff = scp.fft.rfft(song_data[int(current_time*sample_rate):int(sample_rate*(current_time+segsize))])
+        fft_list.append(pff)
+
+        # just to avoid what causes 0.1 + 0.1 == 0.2 to be False
+        k += 1
+        current_time = offset + k*segsize
+        #print(current_time)
+
+    # spacing between samples (time)
+    fe = segsize/sample_rate
+    
+    # list that will contain the maximum frequencies/amplitudes for all FFTs
+    maxlist = []
+    maxamps = []
+
+    print("\n\nSegSize :", segsize, "\nFFT :", len(fft_list), "\nFFT[0] :", len(fft_list[0]), "\npfreq :", len(pfreq), "\n\n")
+    
+    # find all maximums
+    for i in range(len(fft_list)):
+        current_max = -1
+        current_fmax = 0
+        
+        for j in range(len(fft_list[i])): 
+            if(pfreq[j] < maxfreq and pfreq[j] >= minfreq and np.abs(fft_list[i][j]) > current_max):
+                current_max = np.abs(fft_list[i][j])
+                current_fmax = pfreq[j]
+                
+        maxlist.append(current_fmax)
+        maxamps.append(current_max)
+        
+    # gg
+    # maxlist[i] corresponds to time (offset + i*segsize)
+    return (maxlist, maxamps)
+
+def void_freq_clean(song_name, offset, songlen, segsize, minfreq, maxfreq, ampthr, output_name):
+    # removes unnecessary frequencies/amps from a song
+    #ampthr is in [0, 1]
+    
+    # remove high_pitched/low-pitched frequencies
+    minfreq = 110
+    maxfreq = 440*8
+    
+    # cutting the song to only keep the one we're interested in
+    subprocess.run(["ffmpeg", "-ss", str(offset), "-t", str(songlen+offset), "-i", song_name, "crop.wav"], shell=False) 
+
+    # extracting data from cropped song
+    sample_rate, raw_song_data = wavfile.read("crop.wav")
+    blit = int(sample_rate*segsize) # Te
+
+    song_data = [0 for i in range(len(raw_song_data))]
+
+    a = 0
+    if(is_data_stereo(raw_song_data)):
+        print("Converting to mono...")
+        for x in range(len(raw_song_data)):
+            song_data[x] = raw_song_data[x][0]/2 + raw_song_data[x][1]/2
+
+            if(x % (int(len(raw_song_data)/100)) == 0):
+                print(a, "/ 100")
+                a += 1
+    else:
+        song_data = raw_song_data
+
+    # remove the copy of the song
+    subprocess.run(["rm", "crop.wav"], shell=False)
+    
+    # calculate the frequencies associated to the FFTs
+    pfreq = scp.fft.rfftfreq(blit, 1/sample_rate)
+
+    # left boundary of segment to crop
+    current_time = offset
+
+    # list of FFTs
+    fft_list = []
+    
+    # number of samples
+    k = 0
+
+    print("Retrieving freqs from", offset, "to", songlen+offset, "...")
+    print("amplitudes are from", minfreq, "to", maxfreq)
+    while(current_time < songlen-segsize):
+        # index corresponding to left boundary
+        left_id = int(current_time*sample_rate)
+        
+        # index corresponding to right boundary
+        right_id = int((current_time+segsize)*sample_rate)
+        
+        # calculate the fft, append it to fft_list
+        pff = scp.fft.rfft(song_data[int(current_time*sample_rate):int(sample_rate*(current_time+segsize))])
+        fft_list.append(pff)
+
+        # just to avoid what causes 0.1 + 0.1 == 0.2 to be False
+        k += 1
+        current_time = offset + k*segsize
+        #print(current_time)
+
+    print("\n\nSegSize :", segsize, "\nFFT :", len(fft_list), "\nFFT[0] :", len(fft_list[0]), "\npfreq :", len(pfreq), "\n\n")
+    
+    # remove
+    for i in range(len(fft_list)):
+        # get the local max freq
+        lmax = 0
+        for j in range(len(fft_list[i])):
+            if(np.abs(fft_list[i][j]) > lmax):
+                lmax = np.abs(fft_list[i][j])
+        
+        # remove freqs + amps
+        for j in range(len(fft_list[i])): 
+            if(pfreq[j] <= minfreq or pfreq[j] >= maxfreq):
+                fft_list[i][j] = 0+0j
+
+            if(np.abs(fft_list[i][j]) <= lmax*ampthr):
+                fft_list[i][j] = 0+0j
+        
+    # writing new .wav
+    res = []
+    print("Converting...")
+    for i in range(len(fft_list)):
+        ift = scp.fft.irfft(fft_list[i], n=blit)
+        for k in ift:
+            res.append(k)
+    #print(type(res[0]))
+    mx = 0
+    for j in range(len(res)):
+        if(res[j] > mx):
+            mx = res[j]
+
+    for i in range(len(res)):
+        res[i] = np.int16(32767*res[i]/mx)
+
+    res = np.array(res)
+    wavfile.write(output_name, sample_rate, res)
+
+def retrieve_dominant_amps(song_name, offset, songlen, segsize, percent):
+    # returns a list with the percent% peak amplitudes alongside the sample rate
+    # /!\ song_name is specified to be a list, NOT a list of couples (aka song is mono)
+    # segsize is in seconds
+    
+    # cutting the song to only keep the one we're interested in
+    subprocess.run(["ffmpeg", "-ss", str(offset), "-t", str(songlen+offset), "-i", song_name, "crop.wav"], shell=False) 
+
+    # extracting data from cropped song
+    sample_rate, raw_song_data = wavfile.read("crop.wav")
+    blit = int(sample_rate*segsize) # Te
+
+    # in case song has stereo format, conversion to mono
+    song_data = [0 for i in range(len(raw_song_data))]
+
+    a = 0
+    if(is_data_stereo(raw_song_data)):
+        print("Converting to mono...")
+        for x in range(len(raw_song_data)):
+            song_data[x] = raw_song_data[x][0]/2 + raw_song_data[x][1]/2
+
+            if(x % (int(len(raw_song_data)/100)) == 0):
+                print(a, "/ 100")
+                a += 1
+    else:
+        song_data = raw_song_data
+    
+    # which notes will be voided
+    is_locked = [False for i in range(len(song_data))]
+    x = int((len(song_data)*percent)//100)
+
+    print("Retreiving the", int(x), "/", len(song_data), "highest values")
+    elements = heapq.nlargest(int(x), enumerate(song_data), key=lambda x: x[1])
+    #returns a list of couples [id, value]
+
+    for idx in range(len(elements)):
+        is_locked[elements[idx][0]] = True
+
+    for r in range(len(song_data)):
+        if(is_locked[r] == False):
+            song_data[r] = 0
+    
+    # now we need to reduce song_data so that it matches the length of the previous function's return
+    res = []
+    k = 0
+    current_time = offset 
+
+    while(current_time < songlen-segsize):
+        # index corresponding to left boundary
+        left_id = int(current_time*sample_rate)
+        
+        # index corresponding to right boundary
+        right_id = int((current_time+segsize)*sample_rate)
+        
+        # merge the segment into one value
+        cmax = 0
+        for i in range(left_id, right_id):
+            if(i < len(song_data) and cmax < song_data[i]):
+                cmax = song_data[i]
+                
+        res.append(cmax)
+            
+        k += 1
+        current_time = offset + k*segsize
+        
+    # gg
+    # res[i] corresponds to time (offset + i*segsize)
+    return res
+
+def convert_to_wav(song_name:str, output_file="audio.wav") -> str:
+    """
+    Converts the song to .wav, only if it's not already in wave format.
+    Currently relies on file extension.
+    Returns: the song_name that should be used afterwards.
+    """
+    extension = Path(song_name).suffix
+    match extension:
+        case ".mp3" | ".ogg":
+            print("Converting to .wav...")
+            subprocess.run(["ffmpeg", "-y", "-i", song_name, output_file], shell=False) 
+            return output_file
+    return song_name
+
+def retrieve_all_from_song(filename, t0, t1, dt=0.001, threshold=0.1):
+    # dt = sample interval
+    # threshold is in percent
+
+    if(t1 <= t0):
+        print("ERROR : t1 <= t0\n")
+        exit(1)
+
+    # converts format to .wav
+    new_fn = convert_to_wav(filename)
+
+    # crop the song to the part that will be mapped
+    subprocess.run(["ffmpeg", "-ss", str(t0), "-t", str(t1), "-i", new_fn, "crop0.wav"], shell=False) 
+    subprocess.run(["clear"])
+
+    sample_rate, _ = wavfile.read("crop0.wav")
+
+    print("Filtering song...")
+    void_freq_clean(new_fn, t0, t1-t0, dt, 200, 2500, 0.05, "crop1.wav")
+
+    print("Now retrieving the frequencies")
+    (maxlist, maxamps) = retrieve_dominant_freqs(new_fn, t0, t1-t0, dt)
+    
+    print("Now retrieving the amplitudes")
+    amps = retrieve_dominant_amps(new_fn, t0, t1-t0, dt, threshold)
+
+    print("Len of freqs : ", len(maxlist), "|", len(maxamps))
+    print("Len of amps : ", len(maxlist), "|", len(amps))
+
+    timesF = [t0 + dt*k for k in range(len(maxlist))]
+    timesA = [t0 + dt*k for k in range(len(amps))]
+
+    plt.plot(timesF, maxlist)
+    plt.show()
+
+    plt.plot(timesA, amps)
+    plt.show()
+
+    # free()
+    subprocess.run(["rm", "crop0.wav"], shell=False)
+
+retrieve_all_from_song("tetris_4.wav", 0, 5)
+print("yipee")
+
+
+
+
+
+
+
+
+
+
+
+
+
--- a/crop.wav
+++ b/crop.wav
--- a/crop1.wav
+++ b/crop1.wav
--- a/(1).py
+++ b/(1).py
@ -1,145 +0,0 @@
-import numpy as np
-import scipy as scp
-import heapq
-
-def retrieve_dominant_freqs(song_name, offset, songlen, segsize):
-    # returns a list with peak frequencies alongside the sample rate
-    # /!\ song_name is specified to be a list, NOT a list of couples (aka song is mono)
-    # segsize is in seconds
-    
-    # remove high_pitched/low-pitched frequencies
-    minfreq = 110
-    maxfreq = 440*8
-    
-    # cutting the song to only keep the one we're interested in
-    subprocess.run(["ffmpeg", "-ss", str(offset), "-t", str(songlen+offset), "-i", song_name, "crop.wav"], shell=False) 
-
-    # extracting data from cropped song
-    sample_rate, song_data = wavfile.read("crop.wav")
-    blit = int(sample_rate*segsize) # Te
-
-    # remove the copy of the song
-    subprocess.run(["rm", "crop.wav"], shell=False)
-    
-    # calculate the frequencies associated to the FFTs
-    pfreq = scipy.fft.rfftfreq(blit, 1/sample_rate)
-
-    # left boundary of segment to crop
-    current_time = offset
-
-    # list of FFTs
-    fft_list = []
-    
-    # number of samples
-    k = 0
-
-    while(current_time <= songlen+offset):
-        # index corresponding to left boundary
-        left_id = int(current_time*sample_rate)
-        
-        # index corresponding to right boundary
-        right_id = int((current_time+segsize)*sample_rate)
-        
-        # calculate the fft, append it to fft_list
-        pff = scp.fft.rfft(global_data[left:right])
-        fft_list.append(pff)
-
-        # just to avoid what causes 0.1 + 0.1 == 0.2 to be False
-        k += 1
-        current_time = offset + k*segsize
-
-    # spacing between samples (time)
-    fe = segsize/sample_rate
-    
-    # list that will contain the maximum frequencies/amplitudes for all FFTs
-    maxlist = []
-    maxamps = []
-    
-    # find all maximums
-    for i in range(len(fft_list)):
-        current_max = -1
-        current_fmax = 0
-        
-        for j in range(len(fft_list[i])): 
-            if(pfreq[j] < maxfreq & pfreq[j] >= minfreq & np.abs(fft_list[i][j]) > current_max):
-                current_max = np.abs(fft_list[i][j])
-                current_fmax = pfreq[j]
-                
-        maxlist.append(current_fmax)
-        maxamps.append(current_max)
-        
-    # gg
-    # maxlist[i] corresponds to time (offset + i*segsize)
-    return (maxlist, maxamps, segsize)
-
-def retrieve_dominant_amps(song_name, offset, songlen, segsize, percent):
-    # returns a list with the percent% peak amplitudes alongside the sample rate
-    # /!\ song_name is specified to be a list, NOT a list of couples (aka song is mono)
-    # segsize is in seconds
-    
-    # cutting the song to only keep the one we're interested in
-    subprocess.run(["ffmpeg", "-ss", str(offset), "-t", str(songlen+offset), "-i", song_name, "crop.wav"], shell=False) 
-
-    # extracting data from cropped song
-    sample_rate, song_data = wavfile.read("crop.wav")
-    blit = int(sample_rate*segsize) # Te
-
-    # remove the copy of the song
-    subprocess.run(["rm", "crop.wav"], shell=False)
-    
-    # which notes will be voided
-    is_locked = [False for i in range(len(song_data))]
-    x = int((len(song_data)*threshold)//100)
-
-    print("Retreiving the", int(x), "/", len(song_data), "highest values")
-    elements = heapq.nlargest(int(x), enumerate(song_data), key=lambda x: x[1])
-    #returns a list of couples [id, value]
-
-    for idx in range(len(elements)):
-        is_locked[elements[idx][0]] = True
-
-    for r in range(len(song_data)):
-        if(is_locked[r] == False):
-            song_data[r] = 0
-    
-    # now we need to reduce song_data so that it matches the length of the previous function's return
-    res = []
-    k = 0
-    current_time = offset 
-
-    while(current_time <= songlen+offset):
-        # index corresponding to left boundary
-        left_id = int(current_time*sample_rate)
-        
-        # index corresponding to right boundary
-        right_id = int((current_time+segsize)*sample_rate)
-        
-        # merge the segment into one value
-        cmax = 0
-        for i in range(left_id, right_id):
-            if(i < len(song_data) & cmax < song_data[i]):
-                cmax = song_data[i]
-                
-        res.append(cmax)
-            
-        k += 1
-        current_time = current_time + k*segsize
-        
-    # gg
-    # res[i] corresponds to time (offset + i*segsize)
-    return res
-        
-print("done")
-
-
-
-
-
-
-
-
-
-
-
-
-
--- a/sound_process.py
+++ b/sound_process.py
@ -341,532 +341,3 @@ def main():

 if __name__ == "__main__":
    main()
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-''' -------------------------------------------------------------------- '''
-''' -----------------------| Feuilles mortes |-------------------------- '''
-''' -------------------------------------------------------------------- '''
-
-    
-'''
-def smooth(data, thr, mergeThr, show):
-    mx = max(data)
-    for i in range(len(data)-mergeThr):
-        if(data[i]/mx > thr):
-            for k in range(1, mergeThr):
-                data[i+k] = 0
-    if(show):
-        t = [j/1000 for j in range(len(data))]
-        plt.plot(t, data)
-        plt.xlabel("Time (not scaled to origin)")
-        plt.ylabel("Amplitude")
-        plt.grid()
-        plt.show()
-    
-    return data
-if(False):
-    #t, f, Zxx = fct("no.wav", 0, 0.032, 10, 5000, False)
-    #t, f, Zxx = fct("worlds_end_3.wav", 150.889, 0.032, 170.889, 3000, False)
-    #t, f, Zxx = fct("deltamax.wav", 9.992, 0.032, 114.318, 3000, False)
-    #t, f, Zxx = fct("deltamax.wav", 9.992, 0.032, 20, 3000, False)
-    #t, f, Zxx = fct("da^9.wav", 8.463, 0.032, 20, 5000, False)
-    t, f, Zxx = fct("13.  Cosmic Mind.wav", 0, 0.032, 20, 5000, False)
-    #t, f, Zxx = fct("Furioso Melodia 44100.wav", 4, 0.032, 8, 3000, False)
-    #t, f, Zxx = fct("changing.wav", 0, 0.05, 3.9, 5000, False)
-    #fct("worlds_end_3.wav", 75, (60/178)/4, 75+2, 2500)
-
-    plot_max(t, f, Zxx, True)
-
-if(False):
-    #(t, data) = peaks("worlds_end_3.wav", 0, 300, False, 0.92)
-    (t, data) = peaks("worlds_end_3.wav", 74.582, 6, False, 0.9)
-    #(t, data) = peaks("da^9.wav", 8.463, 301.924 - 8.463, False, 0.95)
-    #(t, data) = peaks("deltamax.wav", 8.463, 30101.924 - 8.463, False, 0.92)
-    da = find_bpm(t, 44100, data, 100, 200, 1, 10)
-    print("BPM data is", da)'''
-
-    #data = [-1 for i in range(int(x))]
-    #ids = [-1 for i in range(int(x))]
-'''
-    data = []
-    ids = []
-    for k in range(int(x)):
-        data.append(int(7*mx/10))
-        ids.append(-1)
-    # structure there is [[index, value]...]
-
-    i = 0
-    calc = 0
-    while(i < len(song_data)):
-        if(i%10 == 0):
-            print(i, "/", len(song_data))
-        if(data[int(x)-1] < song_data[i]):
-            calc += 1
-            #print("\n \n \n \n \n")
-            data[int(x)-1] = song_data[i]
-            ids[int(x)-1] = i
-            
-            k = int(x)-1
-            #while(k < int(x) & data[0] > data[k]):
-            while(k > 0 and data[k-1] <= data[k]):
-                data[k], data[k-1] = data[k-1], data[k]
-                ids[k], ids[k-1] = ids[k-1], ids[k]
-                k -= 1
-
-            #print(data[int(x)-1], calc, "/", x)
-
-            i += skip
-        i += 1
-    
-
-    for s in range(int(x)-1):
-        if(data[s] < data[s+1]):
-            print("Nope", s)
-            assert(0)
-'''
-
-
-'''
-def fct(song_name, offset, increment, songlen, maxfreq, display):
-    to_cut = 20000//maxfreq
-    global_Zxx = np.array([])
-    global_f = np.array([])
-    global_t = np.array([])
-    current_time = offset
-    k = 0
-    while(current_time <= songlen):
-        subprocess.run(["ffmpeg", "-ss", str(current_time), "-t", str(increment), "-i", song_name, "crop.wav"], shell=False) 
-
-        sample_rate, audio_data = wavfile.read('crop.wav')
-        size = audio_data.size
-
-        #subprocess.run(["clear"])
-        subprocess.run(["rm", "crop.wav"], shell=False)
-
-        # do stuff here
-        #f, t, Zxx = signal.stft(audio_data, sample_rate, nperseg=1000)
-        f, t, Zxx = signal.spectrogram(audio_data, fs=sample_rate, nfft=size)
-        leng = len(f)
-
-        f, Zxx = f[:leng//to_cut], Zxx[:leng//to_cut]
-
-        #print(len(Zxx))
-        #print(len(Zxx[0]))
-
-
-        for i in range(len(Zxx)):
-            for j in range(len(Zxx[i])):
-                Zxx[i][j] *= 1127*np.log(1+f[i]/700)
-  
-
-        t = np.array([current_time + x for x in t])
-
-        if(k == 0):
-            global_f = f
-            global_t = t
-            global_Zxx = Zxx
-        else:
-            global_Zxx = np.concatenate((global_Zxx, Zxx), axis=1)
-            global_t = np.concatenate((global_t, t))
-
-        #print(len(global_t))
-        
-        k += 1
-        current_time = offset + k*increment
-
-        print("Completion rate : ", np.round(100*(current_time-offset)/(songlen-offset), 4), "%")
-    
-    if(display):
-        plt.pcolormesh(global_t, global_f, np.abs(global_Zxx), shading='gouraud')
-        # print(len(global_Zxx), len(global_Zxx[0]))
-        # 88 192 = 2500
-        # 70 192 = 2000
-        plt.title('STFT Magnitude')
-        plt.ylabel('Frequency [Hz]')
-        plt.xlabel('Time [sec]')
-        plt.show()
-
-    return global_t, global_f, np.abs(global_Zxx)
-
-def write_to_file(t, flist, maxlist, filename):
-    file = open(filename, 'w')
-    file.writelines('time,frequency,maxvalue\n')
-    for i in range(len(t)):
-        file.writelines(str(np.round(t[i], 3)))
-        file.writelines(',')
-        file.writelines(str(np.round(flist[i], 1)))
-        file.writelines(',')
-        file.writelines(str(np.round(maxlist[i], 0)))
-        file.writelines('\n')
-    #close(file)
-
-def plot_max(time, freq, Zxx, save):
-    fres = [0 for x in range(len(time))]
-    maxres = [0 for x in range(len(time))]
-    for t in range(len(time)):
-        #subprocess.run(["clear"])
-        print(t, "/", len(time))
-        for f in range(len(Zxx)):
-            if(maxres[t] < Zxx[f][t]):
-                maxres[t] = Zxx[f][t]
-                fres[t] = freq[f]
-
-    if(save):
-        write_to_file(time, fres, maxres, 'output.csv')
-
-    ''''''
-    plt.plot(time, fres, 'r')
-    plt.grid()
-    plt.xlabel("Time")
-    plt.ylabel("Maximum frequencies")
-
-    plt.plot(time, maxres, 'g')
-    plt.grid()
-    plt.xlabel("Time")
-    plt.ylabel("Maximun values")
-
-    plt.show()''''''
-
-    fig, (ax1, ax2) = plt.subplots(2)
-    fig.suptitle('Top : time and frequencies\nBottom : time and max values')
-    ax1.plot(time, fres)
-    ax2.plot(time, maxres)
-
-    plt.show()
-
-def extract_peaks(song_data, sample_rate, offset, display, threshold):
-    mx = max(song_data)
-    for i in range(len(song_data)):
-        #subprocess.run(["clear"])
-        print(i, "/", len(song_data))
-        if(song_data[i]/mx < threshold):
-            song_data[i] = 0
-    t = [offset + i/sample_rate for i in range(len(song_data))]
-
-    if(display):
-        plt.plot(t, song_data, 'b+')
-        plt.grid()
-        plt.xlabel("t")
-        plt.ylabel("amp")
-        plt.show()
-
-    return (t, song_data)
-
-def get_local_max(song_data, center, width):
-    mx = 0
-    for o in range(-width, width+1):
-        togo = min(len(song_data)-1, center+o)
-        togo = max(0, togo)
-        if(mx < song_data[togo]):
-            mx = song_data[togo]
-    return mx
-
-def extract_peaks_v2(song_data, sample_rate, offset, display, threshold, seglen):
-    mx = 0
-    for i in range(len(song_data)):
-        if (i%seglen == 0):
-            print("----")
-            mx = get_local_max(song_data, i+seglen//2, seglen//2)
-        #subprocess.run(["clear"])
-        print(i, "/", len(song_data))
-        if(song_data[i]/mx < threshold):
-            song_data[i] = 0
-    
-    t = [offset + i/sample_rate for i in range(len(song_data))]
-
-    if(display):
-        plt.plot(t, song_data, 'b+')
-        plt.grid()
-        plt.xlabel("t")
-        plt.ylabel("amp")
-        plt.show()
-
-    return (t, song_data)
-
-def peaks(song_name, offset, length, display, thr):
-    subprocess.run(["ffmpeg", "-ss", str(offset), "-t", str(length), "-i", song_name, "crop.wav"], shell=False) 
-
-    sample_rate, audio_data = wavfile.read('crop.wav')
-
-    #subprocess.run(["clear"])
-    subprocess.run(["rm", "crop.wav"], shell=False)
-
-    #return extract_peaks(audio_data, sample_rate, offset, display, thr)
-    return extract_peaks_v2(audio_data, sample_rate, offset, display, thr, 44100*2)
-
-def find_bpm(sample_rate, data, minbpm, maxbpm, step, width):
-    optimal = minbpm
-    optimal_acc = 0
-    accuracy = 0
-
-    bpmlst = []
-    scores = []
-    
-    for beat in range(minbpm, maxbpm+step, step):
-        loopturn = 0
-        print("testing", beat)
-        accuracy = 0
-        current = 0
-
-        while(current+width < len(data)):
-            loopturn += 1
-            for o in range(-width, width+1):
-                accuracy += data[current + o]
-            #current = (loopturn*sample_rate)//beat
-            current += (sample_rate)//beat
-
-        #accuracy = accuracy/loopturn
-
-        #accuracy *= (1+(maxbpm-beat)/minbpm)
-        if optimal_acc < accuracy:
-            optimal_acc = accuracy
-            optimal = beat
-        bpmlst.append(beat)
-        scores.append(accuracy)
-
-    if(False):
-        plt.plot(bpmlst, scores)
-        plt.xlabel("BPM")
-        plt.ylabel("Score")
-        plt.grid()
-        plt.show()
-
-    return (optimal, optimal_acc)
-'''
-
-
-
-'''
-def void_freq(song_name, offset, songlen, increment, lthr, gthr):
-    to_cut = 20000//2500
-    global_Zxx = np.array([])
-    global_f = np.array([])
-    global_t = np.array([])
-    current_time = offset
-    k = 0
-    sample_rate, global_data = wavfile.read(song_name)
-    blit = int(sample_rate*increment)
-    print("Blit :", blit)
-    while(current_time <= songlen):
-        #subprocess.run(["ffmpeg", "-ss", str(current_time), "-t", str(increment), "-i", song_name, "crop.wav"]) 
-
-        #sample_rate, audio_data = wavfile.read('crop.wav')
-        audio_data = global_data[int(k*blit):int((k+1)*blit)]
-        size = audio_data.size
-
-        #subprocess.run(["clear"])
-        #subprocess.run(["rm", "crop.wav"])
-
-        # do stuff here
-        #f, t, Zxx = signal.stft(audio_data, sample_rate, nperseg=1000)
-        f, t, Zxx = signal.spectrogram(audio_data, fs=sample_rate, nfft=size)
-        leng = len(f)
-
-        f, Zxx = f[:leng//to_cut], Zxx[:leng//to_cut]
-
-        for i in range(len(Zxx)):
-            for j in range(len(Zxx[i])):
-                #Zxx[i][j] *= 1127*np.log(1+f[i]/700)
-                Zxx[i][j] *= 1000
-  
-        t = np.array([current_time + x for x in t])
-
-        if(k == 0):
-            global_f = f
-            global_t = t
-            global_Zxx = Zxx
-        else:
-            global_Zxx = np.concatenate((global_Zxx, Zxx), axis=1)
-            global_t = np.concatenate((global_t, t))
-
-        #print(len(global_t))
-        
-        k += 1
-        current_time = offset + k*increment
-
-        print("Completion rate : ", np.round(100*(current_time-offset)/(songlen-offset), 4), "%")
-    
-    print("Finding global max...")
-    gmax = 0
-    for i in range(len(global_Zxx)):
-        for j in range(len(global_Zxx[i])):
-            if(global_Zxx[i][j] > gmax):
-                gmax = global_Zxx[i][j]
-
-    print("Trimming...")
-    for j in range(len(global_Zxx[0])):
-        lmax = 0
-        for i in range(len(global_Zxx)):
-            if(global_Zxx[i][j] > lmax):
-                lmax = global_Zxx[i][j]
-
-        for i in range(len(global_Zxx)):
-            val = global_Zxx[i][j]
-            if(val/lmax <= lthr/100):
-                global_Zxx[i][j] = 0
-            elif(val/gmax <= gthr/100):
-                global_Zxx[i][j] = 0
-
-    if(False):
-        print("Plotting...")
-        plt.pcolormesh(global_t, global_f, np.abs(global_Zxx), shading='gouraud')
-        # print(len(global_Zxx), len(global_Zxx[0]))
-        print("XLEN :", len(global_Zxx), "\nYLEN :", len(global_Zxx[0]))
-        plt.title('STFT Magnitude')
-        plt.ylabel('Frequency [Hz]')
-        plt.xlabel('Time [sec]')
-        plt.show()
-
-    if(True):
-        print("Converting...")
-        audio_signal = librosa.griffinlim(global_Zxx)
-        #scipy.io.wavfile.write('trimmed.wav', sample_rate, np.array(audio_signal, dtype=np.int16))
-        wavfile.write('test.wav', sample_rate, np.array(audio_signal, dtype=np.int16))
-
-    print("Done")
-
-def find_bpm_2(sample_rate, data, threshold, maxbpm, show):
-    mx = np.max(data)
-    min_spacing = (60*sample_rate)/maxbpm
-    k = 0
-    while(k < len(data) and data[k]/mx < threshold):
-        k += 1
-
-    k += 1
-    spacing = []
-    current = 1
-    progress = 0
-
-    while(k < len(data)):
-        if(k%(len(data)/100) == 0):
-            print(progress, "%")
-            progress += 1
-        if(data[k]/mx >= threshold and current > min_spacing):
-            spacing.append(current)
-            current = 0
-        else:
-            current += 1
-        k += 1
-
-
-    for x in range(len(spacing)):
-        spacing[x] = 60/(spacing[x]/sample_rate)
-    
-    digits = [i for i in range(len(spacing))]
-    if(show):
-        plt.plot(digits, spacing)
-        plt.xlabel("N")
-        plt.ylabel("BPM")
-        plt.grid()
-        plt.show()
-
-    beat = np.mean(spacing)
-    error = np.std(spacing)
-
-    return (np.round(beat, 3), np.round(error, 3))
-
-def to_ms(song_data, sample_rate, offset):
-    # converts audio data to have exactly 1 sample per millisecond (aka set sample_rate to 1000)
-    new_data = []
-    spacing = int(sample_rate * 0.001)
-    mx = max(song_data)
-    i = 0
-    while(i < len(song_data)):
-        avg = 0
-        for k in range(spacing):
-            if(i+spacing < len(song_data)):
-                avg += song_data[i+spacing]
-        avg = avg / spacing
-        new_data.append(avg)
-        i += spacing
-
-    if(False): # pls dont kill me thx
-        t = [offset + j/1000 for j in range(len(new_data))]
-        plt.plot(t, new_data)
-        plt.xlabel("Time")
-        plt.ylabel("Amplitude")
-        plt.grid()
-        plt.show()
-    
-    return (new_data, len(new_data))
-
-def filter_n_percent(song_name, offset, length, threshold, reduce, show):
-    # threshold is in ]0, 100]
-    # filter data associated with song_name to keep only the highest threshold% values
-
-    subprocess.run(["ffmpeg", "-ss", str(offset), "-t", str(length), "-i", song_name, "crop.wav"], shell=False) 
-
-    sample_rate, song_data = wavfile.read('crop.wav')
-
-    subprocess.run(["clear"], shell=False)
-    subprocess.run(["rm", "crop.wav"], shell=False)
-
-    if(reduce):
-        (song_data,e) = to_ms(song_data, 44100, 1)
-        sample_rate = 1000
-
-    mx = max(song_data)
-    
-    is_locked = [False for i in range(len(song_data))]
-    x = int((len(song_data)*threshold)//100)
-    #print("X = ", x)
-
-    print("Retreiving the", int(x), "/", len(song_data), "highest values")
-    elements = heapq.nlargest(int(x), enumerate(song_data), key=lambda x: x[1])
-    print("Done")
-
-    for idx in range(len(elements)):
-        is_locked[elements[idx][0]] = True
-
-    for r in range(len(song_data)):
-        if(is_locked[r] == False):
-            song_data[r] = 0
-        
-    if(show):
-        #print("EEEEE")
-        t = [offset + j/sample_rate for j in range(len(song_data))]
-        plt.plot(t, song_data)
-        plt.xlabel("Time")
-        plt.ylabel("Amplitude")
-        plt.grid()
-        plt.show()
-
-    return song_data
-
-def get_tpts(data, sample_rate, thr):
-    res = []
-    for i in range(len(data)):
-        if(data[i] > thr):
-            res.append(i/sample_rate)
-    
-    for i in res:
-        print(i)
-    return res
-
-def test_sample(timelist):
-    for i in range(1,len(timelist)):
-        #os.system('play -n synth %s sin %s' % (0.05, 440))
-        for k in range(random.randint(1, 10)):
-            print("E", end="")
-        print("F")
-        sleep(timelist[i]-timelist[i-1])
-'''