We explore Librosa's built-in beat tracking and onset-envelope detection features, and how we can apply them to realtime audio.
# First, some imports and setup
import numpy as np
from matplotlib import pyplot as plt
import IPython.display as ipd
import librosa
import librosa.display
import math
import glob
import os
import pandas as pd
import warnings
warnings.filterwarnings("ignore")
Let's load a snippet of a song. This repo has a few media files in it; I've tested at various places in their timelines.
test_cases = [
# these are all pretty good
{'src': '**/*Ed*', 'known_tempo': 126, 'start': 60.34, 'len': 2.5 },
{'src': '**/*Ed*', 'known_tempo': 126, 'start': 60.34, 'len': 5 },
{'src': '**/*Ed*', 'known_tempo': 126, 'start': 60.34, 'len': 10 },
{'src': '**/*Ed*', 'known_tempo': 126, 'start': 60.34, 'len': 20 },
# this song has more complicated rhythm, first case is 1.33x tempo, and sounds triplet feel.
# second is closer to tempo, but still off sounding. 3rd, long 20s window, sounds great
{'src': '**/*Dua*Rules*', 'known_tempo': 116, 'start': 60.80, 'len': 5 },
{'src': '**/*Dua*Rules*', 'known_tempo': 116, 'start': 60.80, 'len': 10 },
{'src': '**/*Dua*Rules*', 'known_tempo': 116, 'start': 80.80, 'len': 20 },
#
# simple metronomes
{'src': '**/*126 BPM*', 'known_tempo': 126, 'start': 22.8, 'len': 5 },
{'src': '**/*120 BPM*', 'known_tempo': 120, 'start': 10, 'len': 5 },
]
We'll use one of the Ed Sheeran cases. Let's use librosa to load those few seconds, display some info about the clip, and add a player so we can hear it.
TEST_CASE_INDEX = 1
test_case = test_cases[TEST_CASE_INDEX]
test_case['end'] = test_case['start'] + test_case['len']
src = glob.glob(test_case['src'])[0]
y, sr = librosa.load(src, sr=48000, offset=test_case['start'], duration=test_case['len'])
ipd.display(pd.DataFrame([[sr, len(y), len(y.shape), np.max(y), np.min(y)]],
columns=["Sample rate Hz", "Num Samples", "Channels", "Sample Max", "Sample Min"]).style.hide())
ipd.Audio(y, rate=sr)
Sample rate Hz | Num Samples | Channels | Sample Max | Sample Min |
---|---|---|---|---|
48000 | 240000 | 1 | 0.908661 | -0.919434 |
Next we'll try out the built-in beat tracking, generate a click track at the detected beats, and overlay that click audio onto the detected segment.
Librosa's beat_track returns two outputs: the detected tempo in BPM (beats per minute), and an array of detected beat events (in frames, samples, or seconds, depending on the units argument). For the BPM specifically, we can compare the reported tempo against the tempo implied by the spacing between the detected beat events (e.g. the average time between them).
Also note that, depending on the input audio, the number of detected beat events is often lower than expected, whether you count kick drums or clicks by ear in the sample audio or infer the beat count from the known tempo and snippet length.
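For a baseline before any knob fiddling, the all-defaults pipeline (hop length 512, mean-aggregated onset strength) is a one-liner; here's a minimal sketch that also derives a tempo from the spacing of the returned beats, for comparison with the tuned version below:
# Baseline: librosa defaults, for comparison with the tuned predict_beats() below
default_tempo, default_beats = librosa.beat.beat_track(y=y, sr=sr, units="time")
print("reported:", default_tempo, "| from beat spacing:", 60 / np.mean(np.diff(default_beats)))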
def predict_beats(samples, sr, hop_length=256):
    """Onset envelope + beat tracking. After reading the librosa source, I'm using
    'onset_strength_multi' because it exposes more options than 'onset_strength'."""
    onset_env = librosa.onset.onset_strength_multi(
        y=samples,
        sr=sr,
        hop_length=hop_length,
        aggregate=np.median,  # default is mean; median is less sensitive to outlier bins
        lag=1,                # default; time lag (in frames) for computing differences
        max_size=1,           # default; do not filter frequency bins
        detrend=False,        # default; do not filter onset strength to remove DC component
        center=True,          # center each STFT frame on its hop
    )
    onset_env = onset_env[..., 0, :]  # mono input: drop the channel axis
    # (An earlier attempt used librosa.onset.onset_strength with its default hop_length of 512.)
    return librosa.beat.beat_track(
        onset_envelope=onset_env,
        sr=sr,
        units="time",
        hop_length=hop_length,
        tightness=1000,  # how tightly beats must stick to the estimated tempo;
                         # 800-1000 sounded good here, 400/600/1600 did not
        # start_bpm=126,
        # trim=False,
    )
reported_tempo, beats = predict_beats(y, sr)
expected_beats = math.floor(test_case["known_tempo"] * test_case["len"] / 60.0)
# Display our results
table = [
["Reported tempo", reported_tempo],
["Averaged tempo", 60 / np.average(np.diff(beats))],
["Num beats detected vs expected", f"{len(beats)} vs {expected_beats}"],
]
ipd.display(pd.DataFrame(table).style.hide(axis="columns").hide())
# Add in the click track from these detected beats
click_track = librosa.clicks(times=beats, sr=sr, length=len(y))
ipd.Audio(y + click_track, rate=sr)
Reported tempo | 126.404494 |
Averaged tempo | 126.720901 |
Num beats detected vs expected | 10 vs 10 |
I think those overlaid clicks match up well with the song's rhythm and tempo.
In the past, the reported tempo from Librosa was often not as good as the one implied by the detected beat times; I'm not sure what changed in my inputs / knob fiddling, nor what the overall behavior is like now. Let's look at some of those stats:
pd.DataFrame([
['Reported', reported_tempo],
['Averaged', 60 / np.average(np.diff(beats))],
['Min', 60 / np.max(np.diff(beats))],
['Max', 60 / np.min(np.diff(beats))],
['Median', 60 / np.median(np.diff(beats))],
['-','-'],
['Known', test_case['known_tempo']],
['Known seconds per beat', 60 / test_case['known_tempo'] ],
['Averaged seconds per beat', np.average(np.diff(beats))],
], columns=["Method", "BPM"]).style.hide()
Method | BPM |
---|---|
Reported | 126.404494 |
Averaged | 126.720901 |
Min | 125.000000 |
Max | 130.813953 |
Median | 126.404494 |
- | - |
Known | 126 |
Known seconds per beat | 0.476190 |
Averaged seconds per beat | 0.473481 |
Now we can take the beats detected in a past time window, apply them to the audio that comes right after it, and hear how that sounds.
Let's use that prediction to overlay the would-be beats onto the next chunk of the track. This first method simply repeats the detected beat intervals, appending shifted copies of the beat events until they cover the longer clip.
# Now load twice as much audio
duration = 2.0 * test_case['len']
future, _ = librosa.load(src, sr=sr, offset=test_case['start'], duration=duration)
future_beats = np.array(beats)
diffs = np.diff(beats)
beats_added = 0
while future_beats[-1] < duration:
future_beats = np.append(future_beats, future_beats[-1] + diffs[beats_added % len(diffs)])
beats_added = beats_added + 1
future_click = librosa.clicks(times=future_beats, sr=sr, length=len(future))
ipd.Audio(future + future_click, rate=sr)
This is also sounding promising, though we can start to hear drift toward the end.
We can also pick just a single beat as an anchor (e.g. the first or last one) and use one of the reported / derived tempos as a constant spacing to create the overlaid click track. It's probably here that decent fitting / selection of both the tempo and the anchor could yield better results overall; a simple least-squares sketch follows the next two cells.
spb = np.average(np.diff(beats))
constant_bpm_clicks = [beats[0]]
# Extend at constant spacing until the clicks cover the longer clip (times are clip-relative)
while constant_bpm_clicks[-1] < duration:
    constant_bpm_clicks = constant_bpm_clicks + [constant_bpm_clicks[-1] + spb]
ipd.Audio(future + librosa.clicks(times=constant_bpm_clicks, sr=sr, length=len(future)), rate=sr)
# tempo_used = 60 / np.average(np.diff(beats))
tempo_used = reported_tempo
spb = 60 / tempo_used
# Project each detected beat back to an estimated "first beat" time, then average those
# estimates to choose the anchor; lay down clicks at constant spacing from there.
beat1_ests = [beat - k * spb for k, beat in enumerate(beats)]
anchor = np.mean(beat1_ests)
beat_ests = np.arange(anchor, duration, spb)
ipd.Audio(future + librosa.clicks(times=beat_ests, sr=sr, length=len(future)), rate=sr)
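The fitting idea mentioned above can be made a little more principled with an ordinary least-squares line through (beat index, beat time): the slope is the seconds per beat and the intercept is the anchor, so every detected beat contributes instead of just the average spacing. A rough sketch, assuming beat_track did not skip any beats (if it did, the integer indexing below is wrong):
# Fit beat_time ~= anchor + index * seconds_per_beat over all detected beats
idx = np.arange(len(beats))
spb_fit, anchor_fit = np.polyfit(idx, beats, 1)  # slope (sec/beat), intercept (anchor time)
fit_clicks = np.arange(anchor_fit, duration, spb_fit)
ipd.Audio(future + librosa.clicks(times=fit_clicks, sr=sr, length=len(future)), rate=sr)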
Using these methods, I implemented (via PyAudio) realtime listening that observes 10-second and 1.5-second windows into the past as different songs play. On those windows we continually run these librosa predictions, mark our assumed upcoming beats, and update the tempo. Another thread watches for when it's time to send those events.
In this video, the events are fired to LX Studio / Chromatik (the Ableton Live of lighting), triggering a custom Java animation I coded. Switching between songs (and even within one song where the DJ set sped the tempo up), it seems to be working pretty well.
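That realtime plumbing isn't in this notebook, but its shape is roughly the sketch below (not the repo's actual code; the window length, update interval, and buffer size are placeholder assumptions): a PyAudio callback copies incoming samples into a NumPy ring buffer, while a worker thread periodically runs predict_beats on the most recent window.
import threading
import time
import pyaudio

SR = 48000
WINDOW_SEC = 10.0                           # "past window" length (assumption)
ring = np.zeros(SR * 60, dtype=np.float32)  # one minute of history (assumption)
write_pos = 0
lock = threading.Lock()

def audio_callback(in_data, frame_count, time_info, status):
    """PyAudio stream callback: copy incoming float32 samples into the ring buffer."""
    global write_pos
    samples = np.frombuffer(in_data, dtype=np.float32)
    with lock:
        idx = (write_pos + np.arange(len(samples))) % len(ring)
        ring[idx] = samples
        write_pos = (write_pos + len(samples)) % len(ring)
    return (None, pyaudio.paContinue)

def predictor_loop():
    """Worker thread: every couple of seconds, re-run beat detection on the latest window."""
    while True:
        time.sleep(2.0)
        with lock:
            idx = (write_pos - np.arange(int(SR * WINDOW_SEC), 0, -1)) % len(ring)
            window = ring[idx].copy()
        tempo, beat_times = predict_beats(window, SR)
        # ...convert beat_times (relative to the window start) into wall-clock times
        # and hand them to whatever fires the OSC / LX Studio events.

pa = pyaudio.PyAudio()
stream = pa.open(format=pyaudio.paFloat32, channels=1, rate=SR, input=True,
                 frames_per_buffer=1024, stream_callback=audio_callback)
threading.Thread(target=predictor_loop, daemon=True).start()
stream.start_stream()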
Improve the above Librosa calls (try other params?), and test with multiple sound files (especially ones where multiple songs start, stop, transition into each other, etc.) and different past time windows. (These now-ancient notes indicate we can probably improve on the librosa output with even basic / brute-force overlay fitting of the detected beat tempo + sample times.)
Apply "smoothing". This is where statistics / math nerds might be able to quickly help. I imagine that, even once all of the above works, the predictions will vary in accuracy, and we must remember that anyone can stop the currently playing song and start another with an entirely different tempo. Luckily it's not the end of the world if the beat sync is wildly off (I hope), especially for a short time, but it would be nice to strike a balance that weights the last N calcs / M minutes of tempos while still reacting to abrupt changes (stops, starts, new songs, etc.). A toy smoothing sketch follows this list.
More on smoothing: on the Dua Lipa track, when I tried different window lengths it sometimes detected the same beats but with "dotted" / 1.5x-type spacing, in both BPM and beat times. I wonder whether that can be factored into the (probably increasingly non-trivial) smoothing / combining techniques. Another smoothing-related thought: we could try multiple window lengths and weight them somehow (e.g. 5s, 10s, 20s, 60s into the past)?
Add visual rendering of waveform, with past window's beat detections and future predictions marked.
Use a real time audio stream. Obviously, this notebook uses pre-baked audio files for quick demo / testing. In this repo, I've started code that uses Python audio lib(s) to listen to a realtime audio device stream (like what would be played live, for beat detection and sync), store the samples in a ring buffer, and run the same librosa short-windowed-into-the-past beat detection algos. Needs revisit + clean up. DONE
Take that prediction output, and make sure it is sample-time synchronized / accurate against the realtime audio input samples and wall-clock time. DONE
Fire OSC events compatible with LX Studio, synchronized to the predictions. DONE
Create LX Studio beat specific FX, namely to test + demo. (Can be done in parallel, before / while actual tempo improvements are being made). DONE
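For the smoothing items above, one toy starting point (pure sketch, not something the repo implements): keep a short history of recent tempo estimates, fold obvious 2x / 0.5x / 1.5x readings back toward the running value (the "dotted" issue noted above), and reset the history when a new reading disagrees strongly, which is roughly what a song change looks like.
class TempoSmoother:
    """Naive running tempo: ratio-correct each new reading, average the recent ones,
    and reset when a reading disagrees too much (likely a new song or big tempo change)."""
    RATIOS = (1.0, 2.0, 0.5, 1.5, 2 / 3)  # common octave / dotted-feel detection errors

    def __init__(self, history=8, reset_tolerance=0.08):
        self.history = history                  # how many recent estimates to keep
        self.reset_tolerance = reset_tolerance  # relative change that triggers a reset
        self.estimates = []

    def update(self, tempo):
        if self.estimates:
            current = np.mean(self.estimates)
            # Snap e.g. a 1.5x "dotted" reading back toward the running estimate
            tempo = min((tempo / r for r in self.RATIOS), key=lambda t: abs(t - current))
            if abs(tempo - current) / current > self.reset_tolerance:
                self.estimates = []  # abrupt change: start over and trust the new reading
        self.estimates = (self.estimates + [tempo])[-self.history:]
        return float(np.mean(self.estimates))
Each realtime window's reported tempo would go through update(), and the event-firing thread would use the smoothed value; weighting differently sized windows (5s vs 20s) against each other could slot into the same place.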
# Scratch: find runs of consecutive zeros in a sample array (e.g. silence between metronome clicks)
a = [1.3888, 2, 3.37, 0, 0, 0, 0, 0, 0, 4, 5, 6, 0, 0, 0, 0, 9, 8, 7, 0, 10, 11]
# One-liner alternative (needs a NumPy array): np.ediff1d(np.r_[0, a == 0, 0]).nonzero()[0].reshape(-1, 2)
def find_zero_runs(a):
    # Create an array that is 1 where a is 0, and pad each end with an extra 0.
    iszero = np.concatenate(([0], np.equal(a, 0), [0]))
    absdiff = np.abs(np.diff(iszero))
    # Runs start and end where absdiff is 1.
    ranges = np.where(absdiff == 1)[0].reshape(-1, 2)
    return ranges
zr = find_zero_runs(a)
zr = list(map(list, list(zr)))
ipd.display(zr)
# Keep only runs longer than two samples
zr = list(filter(lambda x: x[1] - x[0] > 2, zr))
zr
[[3, 9], [12, 16], [19, 20]]
[[3, 9], [12, 16]]
# Scratch: sign changes (zero crossings) in the same kind of array
a = [1.3888, 2, 3.37, -1, -2, 0, 0, 0, 0, 0, 0, 4, 5, 6, 0, 0, 0, 0, 9, 8, 7, 0, 10, 11]
a = np.sign(a)
a = np.diff(a)
a
array([ 0., 0., -2., 0., 1., 0., 0., 0., 0., 0., 1., 0., 0., -1., 0., 0., 0., 1., 0., 0., -1., 1., 0.])
# Zero runs in the loaded audio clip itself
zr = find_zero_runs(y)
zr
array([[ 38081, 38082], [152559, 152560], [198456, 198457], [198700, 198701]])
zero_runs = list(map(list, zr))
if len(zero_runs) >= 4:
    # Beat period estimated as the spacing between the ends of two consecutive zero runs
    # (this makes sense for a metronome-style clip with silence between clicks)
    bpm = 60 / ((zero_runs[2][1] - zero_runs[1][1]) / sr)
    # Beep length: from the end of one silence to the start of the next
    beep_len = ((zero_runs[2][0] - zero_runs[1][1] + 1) / sr)
bpm
beep_len
0.9561875