Practical: Working with sampled audio¶
Eamonn Bell
eamonn.bell@durham.ac.uk
By the end of this practical you should be able to:
- compute the center frequencies for all MIDI numbers 0-127
- understand how alternative tuning systems ("temperaments") may come about
- synthesise simple sounds (sinusoids)
- synthesise combinations of simple sounds to produce richer sounds
- load a sound file and produce a waveform visualisation using matplotlib and librosa
- estimate the frequency of a musical sound in the time-domain
- reorder the segments in an audio file programmatically
import numpy as np
import librosa
import soundfile
import IPython.display as ipd
from matplotlib import pylab as plt
Before you do anything else¶
Head to YouTube and pick a song you like. Listen to it at the volume you normally listen at. Then turn down the system volume (not the player volume) so that the song is barely audible.
1 Working with pitch¶
This is a warm-up task and a (re)introduction to thinking with NumPy. Recall from lecture the formula for computing the center frequency of a pitch given a MIDI note number $p$: $F_{\text{pitch}}(p) = 2^{(p - 69)/12} \cdot 440$ Hz.
1.1 Computing center frequency given a MIDI number¶
Write a function f_pitch(p)
that takes a single MIDI note number p
and returns the center frequency of the pitch with that MIDI note number
def f_pitch(p):
"""Compute center frequency for (single or array of) MIDI note numbers.
Args:
p: MIDI note numbers
Returns:
freq_center: Center frequency
"""
# vvvvvvvvvvvvvvvvvvvvv
freq_center = 2 ** ((p - 69) / 12) * 440
return freq_center
# ^^^^^^^^^^^^^^^^^^^^^
1.2 Computing center frequency for all valid MIDI note numbers¶
The MIDI format is a binary format that specifies musical events using three bytes: one status byte and two data bytes.
The "Note On" event uses the most significant (MSB) of the two data bytes to store the MIDI note number of the note to be triggered. The MSB of each of the three bytes is set to 1 (if a status byte) or 0 (if a data byte).
How many valid MIDI note numbers are there? What are their center frequencies? How can you use f_pitch
to return a list of the center frequencies for all valid MIDI note numbers?
def f_all_valid_midi():
"""Compute center frequency for (single or array of) MIDI note numbers.
Returns:
center_freqs: Center frequency
"""
# vvvvvvvvvvvvvvvvvvvvv
center_freqs = [f_pitch(p) for p in range(0, 128)]
return center_freqs
# ^^^^^^^^^^^^^^^^^^^^^
np.all(np.isclose(f_all_valid_midi(), f_pitch(np.arange(0, 128))))
True
1.3 Computing the frequencies of harmonics¶
If we know the center frequency of a pitch we can easily compute the frequencies that correspond to its harmonic partials. Write a function make_h
that takes as input an array of center frequencies of length $N$ and a number of harmonics $M$, and returns an $N \times M$ array H
, where the entry at H[p][k]
is the center frequency of the $(k+1)$-th harmonic of the pitch with MIDI note number $p$ (so H[p][0] is the fundamental itself)
def make_h(center_frequencies, num_harmonics):
"""Compute harmonics above center frequencies given
up to num_harmonics
Returns:
H (ndarray): A 2D numpy matrix as above
"""
# vvvvvvvvvvvvvvvvvvvvv
multipliers = np.arange(1, num_harmonics + 1)
H = center_frequencies.reshape(-1, 1) * multipliers
return H
# ^^^^^^^^^^^^^^^^^^^^^
cf = f_pitch(np.arange(0, 128))
H = make_h(cf, 128)
H[69][2]
1320.0
1.4 Computing center frequencies of pitches related by an octave¶
Similarly, write a function make_o
that takes as input an array of center frequencies of length $N$ and a number of octaves $M$, and returns an $N \times M$ matrix O
, where the entry at O[p][k]
is the center frequency of the pitch $k$
octaves above MIDI note number $p$ (so O[p][0] is the pitch itself)
def make_o(center_frequencies, num_octaves):
"""Compute octave-related pitches
center frequencies given, up to num_octaves
Returns:
O (ndarray): A 2D numpy matrix as above
"""
# vvvvvvvvvvvvvvvvvvvvv
multipliers = 2 ** np.arange(0, num_octaves)
return center_frequencies.reshape(-1, 1) * multipliers
# ^^^^^^^^^^^^^^^^^^^^^
O = make_o(cf, 8)
O[69][2]
1760.0
1.5 Relationship between 12-tone equal temperament and harmonics¶
We introduced the concept of scientific pitch notation (SPN) with the idea that every MIDI note number can be given (at least one) SPN identifier, which is composed of:
- a letter part, optionally with some sharps/flats, and other things (e.g. A, D, C#, D-, etc.)
- octave (represented as an integer)
By convention, MIDI note number 69 is A4 (= 440Hz) under this system.
One consequence is that the MIDI note number 12 steps above (81) is labeled A5.
Because pitches whose frequencies are octave-related sound similar to each other, this seems to justify giving the same letter part to both labels, even though they are different pitches.
We can call the "letter part" of a SPN representation of a note that note's pitch class.
Let's think about the relationship between the center frequencies of all the possible MIDI note numbers and the frequencies that appear in the matrices H
and O
. Here are the first 10 harmonics of middle C (MIDI note number 60, i.e. C4):
H[60][:10]
array([ 261.6255653 , 523.2511306 , 784.8766959 , 1046.5022612 , 1308.1278265 , 1569.7533918 , 1831.3789571 , 2093.0045224 , 2354.63008771, 2616.25565301])
cf[60 + 12 + 7]
783.9908719634985
Study the following function, which produces a plot that compares the center frequency of every MIDI note number to the frequency of all the harmonics of each MIDI note number. Play around with the arguments.
With its default parameters, one thing that it shows is that the third harmonic of C4 (i.e. H[60][2] = 784.876 Hz) is very close to a frequency that appears in the list of MIDI note number center frequencies (MIDI note number 79, i.e. G5, 783.99 Hz). What this implies is that there appears to be some relationship between the notes that we use in everyday music, as modeled by the MIDI note numbers/piano keys (an artificial construct), and the pitches that appear in the harmonic series, which is a natural phenomenon.
def midi_harmonics(center_mnn=60, num_harmonics=16, tolerance=1e-02):
    cf = f_pitch(np.arange(0, 128))
    # Use the tolerance argument (a relative tolerance for np.isclose) rather than a hard-coded value
    cax = plt.imshow(np.isclose(H[center_mnn][:num_harmonics], cf[:, None], tolerance).T, cmap='Greys',
                     interpolation='none', aspect='auto')
    plt.xlabel('Pitch (MIDI note number)')
    plt.ylabel('n-th Harmonic (n)')
    plt.show()
midi_harmonics()
np.where(np.isclose(H[60][:16], cf[:,None], 1e-02))
(array([ 60, 72, 79, 84, 88, 91, 96, 98, 100, 103, 107, 108]), array([ 0, 1, 2, 3, 4, 5, 7, 8, 9, 11, 14, 15]))
Specifically, the frequencies that generate the MIDI note numbers can be thought of as approximations of simpler mathematical relationships that would "ideally" be used, and which are related to the harmonic series. For example, consider the relation between the center frequency of C4 (= MIDI note number 60) and G4 (= MIDI note number 67). G4 is 7 equal-tempered semitones above C4; in music theory, we call that interval a perfect fifth.
cf[60], cf[67]
(261.6255653005986, 391.99543598174927)
cf[60]/cf[67]
0.6674199270850172
This ratio is very close to 2/3, i.e. the ratio between the second and third harmonics in the harmonic series.
Let's use this integer ratio and multiply the frequency generating the lower sound (C4) appropriately to produce a new frequency. Let's call that frequency the center frequency of the note a pure perfect fifth above C4.
cf[60] * (3/2)
392.43834795089793
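Before writing check_perfect, it can help to express the discrepancy as a ratio rather than in Hertz (a small sketch, not part of the original task): an equal-tempered fifth is exactly 700 cents wide, whereas a pure 3/2 fifth is about 701.96 cents, so the two differ by roughly 2 cents regardless of register.
# Difference between a pure fifth (ratio 3/2) and an equal-tempered fifth
# (7 semitones, ratio 2 ** (7/12)), expressed in cents (1200ths of an octave)
pure_fifth = cf[60] * (3 / 2)
et_fifth = cf[67]
print(1200 * np.log2(pure_fifth / et_fifth))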
Write a function check_perfect
which takes as input a MIDI note number, and returns the difference in Hertz between the pitch an equal-tempered perfect fifth above the given note and the note a pure perfect fifth above it.
def check_perfect(mnn):
"""Difference between pure and ET intervals
Args:
mnn (int): MIDI note number
Returns:
d (scalar): Difference in Hertz between frequency
of ET perfect fifth above and pure perfect fifth
above given MIDI note number
"""
# vvvvvvvvvvvvvvvvvvvvv
cf = f_pitch(np.arange(0, 128))
base = cf[mnn]
etp5_above = cf[mnn + 7]
pp5_above = base * (3/2)
d = etp5_above - pp5_above
return d
# ^^^^^^^^^^^^^^^^^^^^^
checked = check_perfect(np.arange(60, 72))
There is one more step to perform, which will let us hear whether these small frequency differences are actually perceptible.
2 Synthesizing sounds¶
2.1 Synthesizing sine tones¶
Recall that we defined a simple sinusoid $g: \mathbb{R} \to \mathbb{R}$ as $g(t) := A\,\sin(2\pi(\omega t - \varphi))$
Write a function generate_sinusoid(dur, Fs, amp, freq, phase)
that returns a NumPy array containing the values of a sampled version of this sinusoid. Fs
is the sample rate.
It may be counter-intuitive to think about sampling in this context, as we are not measuring any real-life, continuously varying audio signal using e.g. a microphone. But we can think of the CT-signal as specified by $g(t)$ above, and the array that we want (which contains the mapping from sample index $n$ to $g(nT)$, i.e. the DT-signal) as being filled by equidistant $T$-sampling, where the usual relationship $T = 1/F_s$ holds.
def generate_sinusoid(dur, Fs, amp, freq, phase):
"""Generation of sinusoid
Args:
dur (float): Duration (in seconds)
Fs (scalar): Sampling rate
amp (float): Amplitude of sinusoid
freq (float): Frequency of sinusoid (in Hz)
phase (float): Phase of sinusoid (in radians)
Returns:
x (np.ndarray): Signal
t (np.ndarray): Time axis (in seconds)
"""
num_samples = int(Fs * dur)
t = np.arange(num_samples) / Fs
x = amp * np.sin(2*np.pi*(freq*t-phase))
return x, t
We can look at the result of this function using matplotlib
and friends:
x0, t0 = generate_sinusoid(dur=2, Fs=512, amp=1, freq=10, phase=0)
x1, t1 = generate_sinusoid(dur=2, Fs=512, amp=0.2, freq=105, phase=(np.pi))
plt.plot(t0, x0)
plt.show()
2.2 Synthesizing sine tones using the exponential function¶
We know from lecture that we can also write down sinusoids using the exponential function, defined as $\exp(i \gamma) := \cos(\gamma) + i \sin(\gamma)$, where $i^2 = -1$.
How would you rewrite generate_sinusoid
to use the exponential function to produce an identical result? You only need to change one line.
Hint: Compute the required signal using the polar form, and recover the coordinate corresponding to the relevant part using .real
or .imag
, as appropriate
def generate_sinusoid_exp(dur, Fs, amp, freq, phase):
"""Generation of sinusoid using exponential function
Args:
dur (float): Duration (in seconds)
Fs (scalar): Sampling rate
amp (float): Amplitude of sinusoid
freq (float): Frequency of sinusoid (in Hz)
phase (float): Phase of sinusoid (in radians)
Returns:
x (np.ndarray): Signal
t (np.ndarray): Time axis (in seconds)
"""
# vvvvvvvvvvvvvvvvvvvvv
num_samples = int(Fs * dur)
t = np.arange(num_samples) / Fs
x = amp * np.exp(1j *(2*np.pi*(freq*t-phase))).imag
return x, t
# ^^^^^^^^^^^^^^^^^^^^^
We now have (at least) two options if we want to listen to sounds that these signals correspond to. The first option is to use a function from a library called soundfile
, to save the NumPy array to disk, in some well-defined file format.
Once we've done that we can go and fetch it from our environment (on NCC, return to the "Files" tab).
It is essential that you lower the volume before you listen to any files you generate using techniques like this. NumPy arrays do not care about your hearing.
x, t = generate_sinusoid(dur=2, Fs=8000, amp=0.1, freq=220, phase=0)
soundfile.write('out.wav',data=x, samplerate=8000)
Alternatively, we can listen to the sound file we have just written, without leaving the notebook, using an HTML5 audio component.
ipd.Audio('out.wav')
Even better, we can listen to the sound of any NumPy array, without saving it to disk first, by inlining the player in the notebook, as follows:
ipd.Audio(x, rate=8000)
This is because the widget happily accepts NumPy arrays.
If we do not give the audio widget a sample rate, it will not know "how fast" (in real time) to traverse the array. If we give it an incorrect sample rate, it will not play back correctly. Try some different values for rate
.
What relationship holds between the sounds you hear, the sample rate with which the sinusoid is originally produced, and the sample rate that you tell the playback widget about?
Why do you think we did not need to tell the player widget the sample rate when we pointed it to the file on disk? (Note that you can run shell commands from within notebooks using the !
prefix, formerly the %sc
magic.)
!which file
/usr/bin/file
!file 'out.wav'
out.wav: RIFF (little-endian) data, WAVE audio, Microsoft PCM, 16 bit, mono 8000 Hz
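Now that we can synthesise and play sinusoids, we can return to the question left open in section 1.5 and listen for ourselves. The sketch below (not part of the original tasks) plays two dyads one after the other: A4 plus its equal-tempered fifth (E5), then A4 plus a pure 3/2 fifth.
# Assumed demo: equal-tempered vs pure perfect fifth above A4, as two consecutive dyads
Fs_demo = 8000
a4, _ = generate_sinusoid(dur=2, Fs=Fs_demo, amp=0.1, freq=f_pitch(69), phase=0)
et5, _ = generate_sinusoid(dur=2, Fs=Fs_demo, amp=0.1, freq=f_pitch(76), phase=0)
pure5, _ = generate_sinusoid(dur=2, Fs=Fs_demo, amp=0.1, freq=f_pitch(69) * 3 / 2, phase=0)
ipd.Audio(np.concatenate([a4 + et5, a4 + pure5]), rate=Fs_demo)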
2.3 Synthesizing a 12-tone equal tempered chromatic scale¶
Write a function chromatic_scale
combining the implementations above to produce a sonification of the 12-tone equal tempered piano key steps (i.e. semitones) between start_mnn
and end_mnn
inclusive.
def chromatic_scale(dur=2, start_mnn=69, end_mnn=81, Fs=8000):
"""Sonification of the steps of the chromatic scale
between two MIDI note numbers, inclusive.
Args:
dur (float): Total duration (in seconds) of the sonification
start_mnn (int): Starting pitch (in MIDI note number)
end_mnn (int): Ending pitch (in MIDI note number)
Fs (scalar): Sampling rate
Returns:
x (np.ndarray): Signal
t (np.ndarray): Time axis (in seconds)
"""
# vvvvvvvvvvvvvvvvvvvvv
    x = []
    t = []
    num_steps = end_mnn - start_mnn + 1
    step_dur = dur / num_steps
    for i, mnn in enumerate(range(start_mnn, end_mnn + 1)):
        xs, ts = generate_sinusoid(step_dur, Fs, 0.2, f_pitch(mnn), 0.1)
        x.append(xs)
        t.append(ts + i * step_dur)  # offset so the returned time axis is global, not per-segment
    return np.concatenate(x), np.concatenate(t)
# ^^^^^^^^^^^^^^^^^^^^^
2.4 Synthesizing a random tune¶
def random_tune(dur=2, num_tones=8, vocabulary=range(0, 128), Fs=1200):
"""Produce a random tune.
Args:
dur (float): Total duration (in seconds) of the tune
num_tones (int): Total number of tones in tune
vocabulary (Iterable[int]): The permissible notes that may appear
in the tune (in MIDI note number)
Fs (scalar): Sampling rate
Returns:
x (np.ndarray): Signal
t (np.ndarray): Time axis (in seconds)
"""
# vvvvvvvvvvvvvvvvvvvvv
    import random
    x = []
    t = []
    tone_dur = dur / num_tones
    for i in range(num_tones):
        mnn = random.choice(vocabulary)
        xs, ts = generate_sinusoid(tone_dur, Fs, 0.2, f_pitch(mnn), 0.1)
        x.append(xs)
        t.append(ts + i * tone_dur)  # offset so the returned time axis is global, not per-segment
    return np.concatenate(x), np.concatenate(t)
# ^^^^^^^^^^^^^^^^^^^^^
x1, t1 = random_tune(8, 32, [6, 32, 90], 22050)
x2, t2 = random_tune(8, 32, [78, 76, 74], 22050)
ipd.Audio((x1 + x2)/2, rate=22050)
These are the first steps towards automatic music composition systems. Play around with the parameters, and the probability distribution that you use to select notes from the vocabulary. What happens if you ask for several hundred notes per second?
You can provide weights which influence the likelihood of the selection of a note using the random.choices
function in the Python standard library. What would be required to make these sequences yet more musically interesting/plausible?
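For example, here is a sketch of a weighted variant of random_tune using random.choices (the function name, vocabulary, and weights below are made up for illustration):
import random

def weighted_tune(dur=4, num_tones=16, vocabulary=(69, 72, 76, 81),
                  weights=(4, 2, 2, 1), Fs=8000):
    # Draw num_tones notes from the vocabulary with the given relative weights,
    # then concatenate a short sinusoid for each drawn note.
    tone_dur = dur / num_tones
    notes = random.choices(vocabulary, weights=weights, k=num_tones)
    x = np.concatenate([generate_sinusoid(tone_dur, Fs, 0.2, f_pitch(m), 0)[0]
                        for m in notes])
    return x

ipd.Audio(weighted_tune(), rate=8000)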
2.5 Synthesizing richer tones¶
def generate_rich(dur, Fs, specification):
"""Generate a rich tone out of simple sinusoids.
Args:
dur (float): Duration (in seconds)
Fs (scalar): Sampling rate
specification: (Iterable[Iterable[float, float, float]]): Specification
of the rich tone as a list of
simultaneous components:
amplitude (float): Amplitude of sinusoid
freq (float): Frequency of sinusoid (in Hz)
phase (float): Phase of sinusoid (in radians)
Returns:
x (np.ndarray): Signal
t (np.ndarray): Time axis (in seconds)
"""
num_samples = int(Fs * dur)
t = np.arange(num_samples) / Fs
x = np.zeros(num_samples)
for amp, freq, phase in specification:
x_comp, t_comp = generate_sinusoid(dur=dur, Fs=Fs, amp=amp, freq=freq, phase=phase)
x += x_comp
return x / np.max(x), t
NUM_COMPONENTS = 16
amplitudes = np.log2(np.linspace(2, 16, num=NUM_COMPONENTS))
amplitudes = amplitudes/np.max(amplitudes)
frequencies = (np.arange(1, 17)) * 440 + np.random.randint(-1, 1, size=NUM_COMPONENTS)
phases = np.zeros((NUM_COMPONENTS))
xr, tr = generate_rich(2, 8000, [spec for spec in zip(amplitudes, frequencies, phases)])
ipd.Audio(xr, rate=8000)
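As a variation (a sketch, not part of the original tasks), we can feed generate_rich a specification built from the harmonic matrix H of section 1.3, with amplitudes decaying as 1/k across the partials:
# First 8 partials of A3 (MIDI note 57, 220 Hz), with amplitudes falling off as 1/k
partial_freqs = H[57][:8]
partial_amps = 1.0 / np.arange(1, 9)
partial_phases = np.zeros(8)
x_h, t_h = generate_rich(2, 8000, list(zip(partial_amps, partial_freqs, partial_phases)))
ipd.Audio(x_h, rate=8000)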
3 A (very) brief orientation in Librosa¶
librosa
is a useful Python package (developed in the first instance by Brian McFee as a Python port of MATLAB code originally written by Daniel Ellis) that we can use to read .wav files into a Python object, which brings with it useful features.
McFee, Brian, Colin Raffel, Dawen Liang, Daniel P. W. Ellis, Matt McVicar, Eric Battenberg, and Oriol Nieto. "librosa: Audio and music signal analysis in Python." In Proceedings of the 14th Python in Science Conference, pp. 18-25. 2015.
More than that, it is a comprehensive Python package for music and audio analysis. It provides the building blocks necessary to create music information retrieval systems.
librosa
users benefit from its clear documentation. It is used by researchers, educators, and engineers alike. It usefully provides citations to the original papers or conference presentations that describe many of the methods it implements. Some of these are by now well-established (older) methods, and they may not be the first choice in production or state-of-the-art systems.
3.1 Loading an audio file¶
Audio files are relatively straightforward, though there is a panoply of different digital formats available for storing audio. We focus on lossless formats in this submodule, specifically the .wav
(Waveform Audio File Format/WAVE) format.
Lossless, in this context, means that no techniques have been applied to reduce the file size of the audio representation other than a specific choice of sampling rate and quantization parameters (including bit depth), which are a necessary part of sampling.
WAVE files come in a variety of flavours, but we will not be concerned with these differences. librosa
interprets the relevant information in the file format to produce a tuple (x, sr)
, where x
is a NumPy array. What do you think sr
is?
xs, Fs = librosa.load('out.wav')
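A couple of quick checks on what came back (a sketch; note in particular that, unless told otherwise, librosa.load resamples to its default rate of 22050 Hz and converts to mono floating point):
print(type(xs), xs.dtype, xs.shape)   # a 1-D NumPy array of floats
print(Fs)                             # the sampling rate librosa reports
print(len(xs) / Fs)                   # duration of the signal in seconds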
3.2 Visualising an audio file¶
def show_waveform(x, Fs):
"""Sonify the steps of the chromatic scale between two
MIDI note numbers, inclusive.
Args:
x (np.ndarray): Signal
Fs (scalar): Sampling rate
Returns:
nothing
"""
t = np.arange(len(x)) / Fs
plt.figure()
plt.plot(t, x)
plt.xlabel('Time (seconds)')
plt.ylabel('Amplitude')
plt.show()
show_waveform(generate_sinusoid(1, 512, 0.2, 20, 2)[0], 512)
y, sr = librosa.load(librosa.util.example('trumpet'), duration=10)
ipd.Audio(y, rate=sr)
show_waveform(y, sr)
Conveniently enough, we do not need to write our own plotting code, as librosa
provides some convenience functions to do so. For example, librosa.display.waveshow
supports stereo signals (something we don't have time to cover).
librosa.display.waveshow(y, sr=sr)
<librosa.display.AdaptiveWaveplot at 0x7f8dc520c7f0>
librosa.display.waveshow(y[:100], sr=sr, marker='.')
<librosa.display.AdaptiveWaveplot at 0x7f8dc5091fa0>
However, it (evidently) uses matplotlib
under the hood, so you can adapt or extend it as necessary, for example to build up a figure from multiple subplots using the ax=
parameter.
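For instance, a minimal sketch (not part of the original tasks) building a two-panel figure with the ax= parameter:
# Two views of the same trumpet recording, stacked in one matplotlib figure
fig, (ax_full, ax_zoom) = plt.subplots(2, 1, figsize=(10, 5))
librosa.display.waveshow(y, sr=sr, ax=ax_full, label='Full excerpt')
librosa.display.waveshow(y[:1000], sr=sr, ax=ax_zoom, label='First 1000 samples')
ax_full.legend()
ax_zoom.legend()
plt.show()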
3.3 Estimating fundamental frequency by peak finding¶
Let's have a closer look at the waveform plot of the trumpet recording. We know that for simple sounds we can measure the distance from peak to peak to compute the frequency of a signal that might generate it, and we can do something similar here.
snippet = y[3000:3500]
librosa.display.waveshow(snippet, sr=sr)
<librosa.display.AdaptiveWaveplot at 0x7f8dc52d47c0>
We ultimately are trying to estimate the fundamental frequency of the note that we hear, which specifies the sinusoidal component that contributes most prominently to our sense of what the pitch of the sound is. This is only really viable for very straightforward sounds. The difficulty of this approach in settings where - for example - multiple instruments are playing at once is what motivates analysis in the frequency domain, using the Fourier transform.
We can use a librosa
function called peak_pick
, which implements a simple peak finding algorithm. You should invoke it with the following parameters: librosa.util.peak_pick(x, pre_max=25, post_max=25, pre_avg=25, post_avg=25, delta=0.1, wait=10)
.
Write a function estimate_frequency(x, Fs)
that uses peak picking to estimate the frequency of the most significant periodic component in the signal, returning this in Hertz (Hz).
def estimate_frequency(x, Fs):
"""Provide a rough estimate of the frequency
Args:
x (np.ndarray): Signal
Fs (scalar): Sampling rate
Returns:
f_estimate (float): Estimate of the signal based
on computing distances between detected peaks.
"""
# vvvvvvvvvvvvvvvvvvvvv
peaks = librosa.util.peak_pick(x, pre_max=25, post_max=25, pre_avg=25, post_avg=25, delta=0.1, wait=10)
average_delta = np.mean(np.diff(peaks))
f_estimate = Fs / average_delta
return f_estimate
# ^^^^^^^^^^^^^^^^^^^^^
estimate_frequency(snippet, Fs=sr)
621.8004338394794
ipd.Audio(snippet, rate=sr)
x_est, t_est = generate_sinusoid(dur=2, Fs=16000, amp=1, freq=622.75, phase=0)
ipd.Audio(x_est, rate=16000)
3.4 Programmatic editing of sound files¶
At this point we are used to the idea that sample indices into arrays give us access to audio data, which we can use to reason about the phenomena that the data represent. We have also been introduced to the idea that we can compute simple features (e.g. an estimate of the fundamental frequency) over small chunks of audio data.
The last section will deal briefly with the use of the librosa.effects.remix
function, and then show how detected beat locations can be used to segment audio files into smaller chunks.
We examine how to compute very simple features for these segments. Finally, we reorder these segments and listen to the result. This can be a useful strategy for exploring a musical dataset or for stimulating creative sound editing. For example, we can compute some low level feature and sort the segments by this feature. Or, we can start to "mosaic" very short segments, from a variety of sound sources, together into a single recording: a kind of musical collage.
First, we need a recording with a prominent beat. The beat is what we tap or clap along to; the beat is regular and is perceptible as such in a band of about 30-300 bpm.
But in this example there is much else besides the musical articulation of the beat by the low kick drum: other, faster-moving drum rhythms, and bass guitar notes that are higher in pitch and greater in number of onsets.
drum_x, drum_Fs = librosa.load(librosa.example('choice'))
ipd.Audio(drum_x, rate=drum_Fs)
Next, we use librosa.beat.beat_track
, a function which takes a signal and returns an estimate of the tempo of the track (essentially the frequency of the beat), and an array of locations where the estimated beat falls, expressed either in terms of samples or in terms of time.
This is typical of librosa
implementations, which often provide the facility to convert between sample indices and times, given the correct sampling rate. For more details, see the documentation for this function.
tempo, beats_t = librosa.beat.beat_track(y=drum_x, sr=drum_Fs, units='time')
beats_t
array([ 0.06965986, 0.48761905, 0.92879819, 1.36997732, 1.81115646, 2.22911565, 2.69351474, 3.13469388, 3.57587302, 4.01705215, 4.45823129, 4.89941043, 5.34058957, 5.78176871, 6.22294785, 6.66412698, 7.10530612, 7.54648526, 7.9876644 , 8.42884354, 8.87002268, 9.31120181, 9.75238095, 10.19356009, 10.63473923, 11.05269841, 11.49387755, 11.95827664, 12.39945578, 12.84063492, 13.28181406, 13.7229932 , 14.16417234, 14.60535147, 15.02331066, 15.48770975, 15.92888889, 16.37006803, 16.81124717, 17.2524263 , 17.69360544, 18.11156463, 18.55274376, 19.01714286, 19.458322 , 19.89950113, 20.34068027, 20.78185941, 21.22303855, 21.66421769, 22.08217687, 22.54657596, 22.9877551 , 23.40571429])
We can use matplotlib
to visualise the temporal location of the detected events on top of the waveform plot. The below shows an idiomatic use of librosa
's plotting capabilities. Note that ax.legend()
and the label
parameter can be used to clearly state the source of the data being plotted, and that the axes are correctly and clearly labeled.
fig, ax = plt.subplots(figsize=(18,5))
librosa.display.waveshow(drum_x, ax=ax, label='Waveform (choice.wav)')
ax.vlines(beats_t, ymin=np.min(drum_x), ymax=np.max(drum_x),
color='red', label='Detected beats\n(librosa.beat.beat_track)')
ax.legend()
plt.show()
The last piece of the puzzle will involve manipulating the original audio to reorder chunks of samples ("frames") into the desired order. You could implement this yourself (please try this if you have time) or you can use the librosa.effects.remix
facility, which consumes an audio array and list of time intervals (each interval a start and end time/index, as relevant) and returns the audio array which is remixed by re-ordering the source according to this list of time intervals.
Write a function reverse_by_beat
which, given a musical track with a prominent beat, will return the track "reversed" by beat, with the individual beats in the original track appearing in reverse order.
def reverse_by_beat(x, Fs):
"""Reverse a music track by-beat, by doing beat detection,
segmenting the original track into frames, and
reordering the segments in reverse order.
Args:
x (np.ndarray): Signal
Fs (scalar): Sampling rate
Returns:
        remixed (np.ndarray): Remixed music signal.
"""
# vvvvvvvvvvvvvvvvvvvvv
    tempo, beats_samples = librosa.beat.beat_track(y=x, sr=Fs, units='samples')
    # Pair consecutive beat locations into (start, end) sample intervals
    intervals = librosa.util.frame(beats_samples, frame_length=2, hop_length=1).T
    # Remix using the intervals in reverse order (operating on x, not the global drum_x)
    remixed = librosa.effects.remix(x, intervals[::-1])
return remixed
# ^^^^^^^^^^^^^^^^^^^^^
ipd.Audio(reverse_by_beat(drum_x, drum_Fs), rate=drum_Fs)
And just so we are perfectly clear, this is what the same excerpt sounds like when reversed on a samplewise basis (i.e. reading the audio file from back to front).
ipd.Audio(drum_x[::-1], rate=drum_Fs)
Now think about other ways to order the intervals that could be used in a programmatic remix, or other criteria that could be used to segment a signal. Have a look, for example, at librosa.onset.onset_detect
, which will trigger much more frequently (and irregularly) than the beat detector.
Can you use your implementation of estimate_frequency
to "sort" these segments by pitch? Next week, we will define more complex features to describe the pitch and harmonic content of musical sounds (drawing on spectrogram representations). If you are interested in learning more, take a look at the contents of librosa.feature
.
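As a starting point for that sorting exercise, here is a sketch (not part of the original tasks) that reorders the beat-length segments of the drum track by their RMS energy, quietest first; swapping the RMS computation for estimate_frequency would sort them by estimated pitch instead.
# Segment at the detected beats, compute the RMS of each segment,
# and remix the segments in order of increasing RMS
tempo, beat_samples = librosa.beat.beat_track(y=drum_x, sr=drum_Fs, units='samples')
intervals = librosa.util.frame(beat_samples, frame_length=2, hop_length=1).T
segment_rms = np.array([np.sqrt(np.mean(drum_x[start:end] ** 2)) for start, end in intervals])
ipd.Audio(librosa.effects.remix(drum_x, intervals[np.argsort(segment_rms)]), rate=drum_Fs)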
Recall the MusicMappr application I presented in the first lecture (https://fatsmcgee.github.io/MusicMappr/). You can combine feature extraction and clustering (e.g. using sklearn
or your own ideas) to determine the sequence in which segments are played. Or, you could use some other technique to minimise/maximise some cost function, which in turn depends on the structure of the audio. Have a look at this re-implementation of The Eternal Jukebox
by Paul Lamere, which he wrote up in 2012 (https://musicmachinery.com/2012/11/12/the-infinite-jukebox/).
dir(librosa.feature)
['chroma_cens', 'chroma_cqt', 'chroma_stft', 'chroma_vqt', 'delta', 'fourier_tempogram', 'inverse', 'melspectrogram', 'mfcc', 'poly_features', 'rms', 'spectral_bandwidth', 'spectral_centroid', 'spectral_contrast', 'spectral_flatness', 'spectral_rolloff', 'stack_memory', 'tempo', 'tempogram', 'tempogram_ratio', 'tonnetz', 'zero_crossing_rate']