Practical: Working with sampled audio¶

Eamonn Bell
eamonn.bell@durham.ac.uk

By the end of this practical you should be able to:

  • compute the center frequencies for all MIDI numbers 0-127
  • understand how alternative tuning systems ("temperaments") may come about
  • synthesise simple sounds (sinusoids)
  • synthesise combinations of simple sounds to produce richer sounds
  • load a sound file and produce a waveform visualisation using matplotlib and librosa
  • estimate the frequency of a musical sound in the time-domain
  • reorder the segments in an audio file programmatically
In [1]:
import numpy as np
import librosa
import soundfile
import IPython.display as ipd

from matplotlib import pylab as plt

Before you do anything else¶

Head to YouTube and pick a song you like. Listen to it at the volume you would normally listen at. Then turn down the system volume - not the player volume - so that the song is barely audible.

1 Working with pitch¶

This is a warm-up task and a (re)introduction to thinking with NumPy. Recall from lecture the formula for computing the center frequency of a pitch given a MIDI note number $p$:

$F_{\text{pitch}}(p) = 2^{(p - 69)/12} \cdot 440$

1.1 Computing center frequency given a MIDI number¶

Write a function f_pitch(p) that takes a single MIDI note number p and returns the center frequency of the pitch with that MIDI note number.

In [ ]:
def f_pitch(p):
    """Compute center frequency for (single or array of) MIDI note numbers.

    Args:
        p: MIDI note numbers

    Returns:
        freq_center: Center frequency
    """
    # vvvvvvvvvvvvvvvvvvvvv
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^
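
One possible sketch (not necessarily the intended model answer) uses the equal-tempered reference A4 = MIDI note 69 = 440 Hz and NumPy broadcasting, so that it accepts arrays of MIDI note numbers as well as scalars:

In [ ]:
# A possible sketch, assuming the reference A4 = MIDI 69 = 440 Hz used in this practical
def f_pitch_sketch(p):
    p = np.asarray(p, dtype=float)         # works for scalars and arrays alike
    return 440.0 * 2.0 ** ((p - 69) / 12)

f_pitch_sketch(60)                          # approximately 261.63 Hz (middle C)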

1.2 Computing center frequency for all valid MIDI note numbers¶

The MIDI format is a binary format that specifies musical events using three bytes: one status byte and two data bytes.

The "Note On" event uses the most significant (MSB) of the two data bytes to store the MIDI note number of the note to be triggered. The MSB of each of the three bytes is set to 1 (if a status byte) or 0 (if a data byte).

How many valid MIDI note numbers are there? What are their center frequencies? How can you use f_pitch to return a list of the center frequencies for all valid MIDI note numbers?

In [ ]:
def f_all_valid_midi():
    """Compute center frequency for (single or array of) MIDI note numbers.

    Returns:
        center_freqs: Center frequency
    """
    # vvvvvvvvvvvvvvvvvvvvv
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^
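
One possible sketch, assuming your f_pitch accepts arrays: because the MSB of a data byte is reserved, 7 bits remain for the note number, giving the 128 values 0-127.

In [ ]:
# A possible sketch: 7 usable bits in the data byte give note numbers 0-127
def f_all_valid_midi_sketch():
    return f_pitch(np.arange(0, 128))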
In [4]:
np.all(np.isclose(f_all_valid_midi(), f_pitch(np.arange(0, 128))))
Out[4]:
True

1.3 Computing the frequencies of harmonics¶

If we know the center frequency of a pitch we can easily compute the frequencies that correspond to its harmonic partials. Write a function make_h that takes as input an array of center frequencies of length $N$ and a number of harmonics $M$, and returns an $N \times M$ array H, where the entry at H[p][n] is the frequency of the $n$-th harmonic of MIDI note number $p$ (counting from zero, so that H[p][0] is the fundamental and H[p][n] is $(n+1)$ times the center frequency).

In [ ]:
def make_h(center_frequencies, num_harmonics):
    """Compute harmonics above center frequencies given
         up to num_harmonics

    Returns:
        H (ndarray): A 2D numpy matrix as above
    """
    # vvvvvvvvvvvvvvvvvvvvv
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^
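
One possible sketch, assuming the indexing convention used in the checks below (H[p][0] is the fundamental, H[p][n] is (n+1) times the center frequency), is an outer product:

In [ ]:
# A possible sketch: harmonic n (0-indexed) is (n + 1) times the fundamental,
# so an outer product of center frequencies and integer multipliers suffices
def make_h_sketch(center_frequencies, num_harmonics):
    multipliers = np.arange(1, num_harmonics + 1)
    return np.asarray(center_frequencies)[:, None] * multipliers[None, :]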
In [6]:
cf = f_pitch(np.arange(0, 128))
H = make_h(cf, 128)
In [7]:
H[69][2]
Out[7]:
1320.0

1.4 Computing center frequencies of pitches related by an octave¶

Similarly, write a function make_o that takes as input an array of center frequencies of length $N$ and a number of octaves $M$, and returns an $N \times M$ array O, where the entry at O[p][n] is the center frequency of the pitch $n$ octaves above MIDI note number $p$ (so O[p][0] is the pitch itself).

In [ ]:
def make_o(center_frequencies, num_octaves):
    """Compute octave-related pitches
        center frequencies given, up to num_octaves

    Returns:
        O (ndarray): A 2D numpy matrix as above
    """
    # vvvvvvvvvvvvvvvvvvvvv
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^   
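
make_o can follow the same pattern, with powers of two in place of the integer multipliers. A possible sketch:

In [ ]:
# A possible sketch: the pitch n octaves above corresponds to multiplying by 2**n
def make_o_sketch(center_frequencies, num_octaves):
    multipliers = 2.0 ** np.arange(num_octaves)
    return np.asarray(center_frequencies)[:, None] * multipliers[None, :]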
In [9]:
O = make_o(cf, 8)
In [10]:
O[69][2]
Out[10]:
1760.0

1.5 Relationship between 12-tone equal temperament and harmonics¶

We introduced the concept of scientific pitch notation (SPN) with the idea that every MIDI note number can be given (at least one) SPN identifier, which is composed of:

  • a letter part, optionally with some sharps/flats, and other things (e.g. A, D, C#, D-, etc.)
  • octave (represented as an integer)

By convention, MIDI note number 69 is A4 (= 440Hz) under this system.

One consequence is that the MIDI note number 12 steps above (81) is labeled A5.

Because pitches that are octave-related sound similar to each other, this seems to justify giving the same letter part to both labels, even though they are different pitches.

We can call the "letter part" of an SPN representation of a note that note's pitch class.

Let's think about the relationship between the center frequencies of all the possible MIDI note numbers and the frequencies that appear in the matrices H and O. Here are the first 10 harmonics of middle C (C4, MIDI note number 60):

In [11]:
H[60][:10]
Out[11]:
array([ 261.6255653 ,  523.2511306 ,  784.8766959 , 1046.5022612 ,
       1308.1278265 , 1569.7533918 , 1831.3789571 , 2093.0045224 ,
       2354.63008771, 2616.25565301])
In [12]:
cf[60 + 12 + 7]
Out[12]:
783.9908719634985

Study the following function, which produces a plot that compares the center frequency of every MIDI note number to the frequency of all the harmonics of each MIDI note number. Play around with the arguments.

With its default parameters, one thing it shows is that the frequency of the second harmonic of C4 (i.e. 784.876 Hz) is very close to a frequency that appears in the list of MIDI note number center frequencies (that of G5, MIDI note number 79, i.e. 783.99 Hz). This implies that there is some relationship between the notes that we use in everyday music, as modeled by the MIDI note numbers/piano keys (an artificial construct), and the pitches that appear in the harmonic series, which is a natural phenomenon.

In [13]:
def midi_harmonics(center_mnn=60, num_harmonics=16, tolerance=1e-02):
    cf = f_pitch(np.arange(0, 128))
    # Mark the harmonics of center_mnn that lie within the given relative
    # tolerance of some MIDI center frequency
    cax = plt.imshow(np.isclose(H[center_mnn][:num_harmonics], cf[:,None], tolerance).T, cmap='Greys', 
                     interpolation='none', aspect='auto')
    plt.xlabel('Pitch (MIDI note number)')
    plt.ylabel('n-th Harmonic (n)')
    plt.show()
In [14]:
midi_harmonics()
[Figure: plot showing which harmonics of MIDI note 60 fall close to a MIDI center frequency; pitch (MIDI note number) on the x-axis, harmonic number on the y-axis]
In [15]:
np.where(np.isclose(H[60][:16], cf[:,None], 1e-02))
Out[15]:
(array([ 60,  72,  79,  84,  88,  91,  96,  98, 100, 103, 107, 108]),
 array([ 0,  1,  2,  3,  4,  5,  7,  8,  9, 11, 14, 15]))

Specifically, the frequencies assigned to the MIDI note numbers can be thought of as approximations of simpler mathematical relationships that would "ideally" be used, and which are related to the harmonic series. For example, consider the relation between the center frequencies of C4 (= MIDI note number 60) and G4 (= MIDI note number 67). G4 is 7 equal-tempered semitones above C4; in music theory, we call that interval a perfect fifth.

In [16]:
cf[60], cf[67]
Out[16]:
(261.6255653005986, 391.99543598174927)
In [17]:
cf[60]/cf[67]
Out[17]:
0.6674199270850172

This ratio is very close to 2/3, the ratio between the second and third partials of the harmonic series.

Let's use this integer ratio and multiply the frequency generating the lower sound (C4) appropriately to produce a new frequency. Let's call that frequency the center frequency of the note a pure perfect fifth above C4.

In [18]:
cf[60] * (3/2)
Out[18]:
392.43834795089793

Write a function check_perfect which takes as input a MIDI note number, and returns the difference in Hertz between the frequency of the pitch an equal-tempered perfect fifth above the given note and that of the pitch a pure perfect fifth above it.

In [ ]:
def check_perfect(mnn):
    """Difference between pure and ET intervals

    Args:
        mnn (int): MIDI note number

    Returns:
        d (scalar): Difference in Hertz between frequency
          of ET perfect fifth above and pure perfect fifth
          above given MIDI note number 

    """
    # vvvvvvvvvvvvvvvvvvvvv    
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^
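
One possible sketch, assuming your f_pitch from above: the equal-tempered fifth is 7 semitones up, and the pure fifth is the 3/2 ratio.

In [ ]:
# A possible sketch: ET fifth = 7 semitones up, pure fifth = 3/2 frequency ratio
def check_perfect_sketch(mnn):
    return f_pitch(mnn + 7) - f_pitch(mnn) * (3 / 2)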
In [20]:
checked = check_perfect(np.arange(60, 72))

There is one more step to perform, which will demonstrate that these frequency differences are perceptually equivalent.

2 Making sounds¶

2.1 Synthesizing sine tones using trigonometric functions¶

Recall that we defined a simple sinusoid $g: \mathbb{R} \to \mathbb{R}$ as $g(t) := A\,\sin(2\pi(\omega t - \varphi))$

Write a function generate_sinusoid(dur, Fs, amp, freq, phase) that returns a NumPy array containing the values of a sampled version of this sinusoid. Fs is the sample rate.

It may be counter-intuitive to think about sampling in this context, as we are not measuring any real-life, continuously varying audio signal using e.g. a microphone. But we can think of the CT-signal as specified by $g(t)$ above, and of the array that we want (which contains the mapping from $n$ to $g(nT)$, i.e. the DT-signal) as being filled by equidistant $T$-sampling, where the usual relationship $T = 1/F_s$ holds.

In [21]:
def generate_sinusoid(dur, Fs, amp, freq, phase):
    """Generation of sinusoid

    Args:
        dur (float): Duration (in seconds) 
        Fs (scalar): Sampling rate 
        amp (float): Amplitude of sinusoid
        freq (float): Frequency of sinusoid (in Hz)
        phase (float): Phase of sinusoid (in radians)

    Returns:
        x (np.ndarray): Signal
        t (np.ndarray): Time axis (in seconds)

    """
    num_samples = int(Fs * dur)
    t = np.arange(num_samples) / Fs
    x = amp * np.sin(2*np.pi*(freq*t-phase))
    return x, t

We can look at the result of this function using matplotlib and friends:

In [22]:
x0, t0 = generate_sinusoid(dur=2, Fs=512, amp=1, freq=10, phase=0)
x1, t1 = generate_sinusoid(dur=2, Fs=512, amp=0.2, freq=105, phase=(np.pi))

plt.plot(t0, x0)
plt.show()
[Figure: two seconds of a 10 Hz sinusoid plotted against time]

2.2 Synthesizing sine tones using the exponential function¶

We know from lecture that we can also write down sinusoids using the exponential function, defined as $\exp(i \gamma) := \cos(\gamma) + i \sin(\gamma)$, where $i^2 = -1$.

How would you rewrite generate_sinusoid to use the exponential function to produce an identical result? You only need to change one line.

Hint: Compute the required signal using the polar form, and recover the coordinate corresponding to the relevant part using .real or .imag, as appropriate

In [ ]:
def generate_sinusoid_exp(dur, Fs, amp, freq, phase):
    """Generation of sinusoid using exponential function

    Args:
        dur (float): Duration (in seconds) 
        Fs (scalar): Sampling rate 
        amp (float): Amplitude of sinusoid
        freq (float): Frequency of sinusoid (in Hz)
        phase (float): Phase of sinusoid (in radians)

    Returns:
        x (np.ndarray): Signal
        t (np.ndarray): Time axis (in seconds)

    """
    # vvvvvvvvvvvvvvvvvvvvv
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^
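
One possible sketch, which differs from generate_sinusoid only in the line that computes x: the imaginary part of $A\exp(i\,2\pi(\omega t - \varphi))$ recovers $A\sin(2\pi(\omega t - \varphi))$.

In [ ]:
# A possible sketch: take the imaginary part of the complex exponential
def generate_sinusoid_exp_sketch(dur, Fs, amp, freq, phase):
    num_samples = int(Fs * dur)
    t = np.arange(num_samples) / Fs
    x = (amp * np.exp(1j * 2 * np.pi * (freq * t - phase))).imag
    return x, t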

We now have (at least) two options if we want to listen to the sounds that these signals correspond to. The first option is to use the soundfile library to save the NumPy array to disk in a well-defined file format.

Once we've done that we can go and fetch it from our environment (on NCC, return to the "Files" tab).

It is essential that you lower the volume before you listen to any files you generate using techniques like this. NumPy arrays do not care about your hearing.

In [24]:
x, t = generate_sinusoid(dur=2, Fs=8000, amp=0.1, freq=220, phase=0)
soundfile.write('out.wav',data=x, samplerate=8000)

Alternatively, we can listen to the sound we have just written to disk, without leaving the notebook, using an HTML5 audio component.

In [25]:
ipd.Audio('out.wav')
Out[25]:
[embedded audio player]

Even better, we can listen to the sound of any NumPy array without saving it to disk at all, inlining the player in the notebook as follows:

In [26]:
ipd.Audio(x, rate=8000)
Out[26]:
[embedded audio player]

This is because the widget happily accepts NumPy arrays.

If we do not give the audio widget a sample rate, it will not know "how fast" (in real time) to traverse the array. If we give it an incorrect sample rate, it will not play back correctly. Try some different values for rate.

What relationship holds between the sounds you hear, the sample rate with which the sinusoid is originally produced, and the sample rate that you tell the playback widget about?

Why do you think we did not need to tell the player widget the sample rate when we pointed it to the file on disk? Note that you can run shell commands from within notebooks using the ! shell escape (formerly the %sc magic).

In [27]:
!which file
/usr/bin/file
In [28]:
!file 'out.wav'
out.wav: RIFF (little-endian) data, WAVE audio, Microsoft PCM, 16 bit, mono 8000 Hz

2.3 Synthesizing a 12-tone equal tempered chromatic scale¶

Write a function chromatic_scale combining the implementations above to produce a sonification of the 12-tone equal tempered piano key steps (i.e. semitones) between start_mnn and end_mnn inclusive.

In [ ]:
def chromatic_scale(dur=2, start_mnn=69, end_mnn=81, Fs=8000):
    """Sonification of the steps of the chromatic scale 
          between two MIDI note numbers, inclusive.

    Args:
        dur (float): Total duration (in seconds) of the sonification
        start_mnn (int): Starting pitch (in MIDI note number)
        end_mnn (int): Ending pitch (in MIDI note number)
        Fs (scalar): Sampling rate 

    Returns:
        x (np.ndarray): Signal
        t (np.ndarray): Time axis (in seconds)

    """
    # vvvvvvvvvvvvvvvvvvvvv   
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^
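
One possible sketch, assuming your f_pitch and the generate_sinusoid function above: one short sinusoid per semitone, concatenated so that the total duration is dur.

In [ ]:
# A possible sketch: one equal-length sinusoid per semitone, concatenated
def chromatic_scale_sketch(dur=2, start_mnn=69, end_mnn=81, Fs=8000):
    mnns = np.arange(start_mnn, end_mnn + 1)
    note_dur = dur / len(mnns)
    tones = [generate_sinusoid(note_dur, Fs, 0.1, f_pitch(m), 0)[0] for m in mnns]
    x = np.concatenate(tones)
    t = np.arange(len(x)) / Fs
    return x, t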

2.4 Synthesizing a random tune¶

In [ ]:
def random_tune(dur=2, num_tones=8, vocabulary=range(0, 128), Fs=1200):
    """Produce a random tune.
    
    Args:
        dur (float): Total duration (in seconds) of the tune
        num_tones (int): Total number of tones in tune
        vocabulary (Iterable[int]): The permissible notes that may appear 
            in the tune (in MIDI note number)
        Fs (scalar): Sampling rate 

    Returns:
        x (np.ndarray): Signal
        t (np.ndarray): Time axis (in seconds)

    """
    # vvvvvvvvvvvvvvvvvvvvv
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^
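
One possible sketch, using random.choices from the standard library to draw notes uniformly from the vocabulary (pass weights to bias the draw), and reusing the chromatic-scale approach above:

In [ ]:
import random

# A possible sketch: draw num_tones notes from the vocabulary and concatenate tones
def random_tune_sketch(dur=2, num_tones=8, vocabulary=range(0, 128), Fs=1200):
    mnns = random.choices(list(vocabulary), k=num_tones)
    note_dur = dur / num_tones
    tones = [generate_sinusoid(note_dur, Fs, 0.1, f_pitch(m), 0)[0] for m in mnns]
    x = np.concatenate(tones)
    t = np.arange(len(x)) / Fs
    return x, t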
In [31]:
x1, t1 = random_tune(8, 32, [6, 32, 90], 22050)
x2, t2 = random_tune(8, 32, [78, 76, 74], 22050)

ipd.Audio((x1 + x2)/2, rate=22050)
Out[31]:
[embedded audio player]

These are the first steps towards automatic music composition systems. Play around with the parameters, and the probability distribution that you use to select notes from the vocabulary. What happens if you ask for several hundred notes per second?

You can provide weights which influence the likelihood of the selection of a note using the random.choices function in the Python standard library. What would be required to make these sequences yet more musically interesting/plausible?

2.5 Synthesizing richer tones¶

In [32]:
def generate_rich(dur, Fs, specification):
    """Generate a rich tone out of simple sinusoids.

    Args:
        dur (float): Duration (in seconds) 
        Fs (scalar): Sampling rate 
        specification: (Iterable[Iterable[float, float, float]]): Specification 
          of the rich tone as a list of
          simultaneous components:
            amplitude (float): Amplitude of sinusoid
            freq (float): Frequency of sinusoid (in Hz)
            phase (float): Phase of sinusoid (in radians)

    Returns:
        x (np.ndarray): Signal
        t (np.ndarray): Time axis (in seconds)

    """
    num_samples = int(Fs * dur)
    t = np.arange(num_samples) / Fs
    x = np.zeros(num_samples)
    for amp, freq, phase in specification:
        x_comp, _ = generate_sinusoid(dur=dur, Fs=Fs, amp=amp, freq=freq, phase=phase)
        x += x_comp
    # Normalise by the peak absolute value so the mixture stays within [-1, 1]
    return x / np.max(np.abs(x)), t
In [33]:
NUM_COMPONENTS = 16

amplitudes = np.log2(np.linspace(2, 16, num=NUM_COMPONENTS))
amplitudes = amplitudes/np.max(amplitudes)

frequencies = (np.arange(1, 17)) * 440 + np.random.randint(-1, 1, size=NUM_COMPONENTS)

phases = np.zeros((NUM_COMPONENTS))
In [34]:
xr, tr = generate_rich(2, 8000, [spec for spec in zip(amplitudes, frequencies, phases)])
In [35]:
ipd.Audio(xr, rate=8000)
Out[35]:
[embedded audio player]

3 A (very) brief orientation in Librosa¶

librosa is a useful Python package (developed in the first instance by Brian McFee, working with Daniel Ellis, as a Python port of Ellis's MATLAB code) that we can use to read .wav files into a Python object, which brings with it useful features.

McFee, Brian, Colin Raffel, Dawen Liang, Daniel PW Ellis, Matt McVicar, Eric Battenberg, and Oriol Nieto. ā€œlibrosa: Audio and music signal analysis in Python.ā€ In Proceedings of the 14th Python in Science Conference, pp. 18-25. 2015.

More than that, it is a comprehensive Python package for music and audio analysis. It provides the building blocks necessary to create music information retrieval systems.

librosa users benefit from its clear documentation, and it is used by researchers, educators, and engineers alike. It usefully provides citations to the original papers or conference presentations that describe many of the methods it implements. Some of these are by now long-established methods, which may not be the first choice in production or state-of-the-art systems.

3.1 Loading an audio file¶

Audio files are relatively straightforward, though there is a panoply of different digital formats available for storing audio. We focus on lossless formats in this submodule, specifically the .wav (Waveform Audio File Format/WAVE) format.

Lossless, in this context, means that no techniques have been applied to reduce the file size of the audio representation other than a specific choice of sampling rate and quantization parameters (including bit depth), which are a necessary part of sampling.

WAVE files come in a variety of flavours, but we will not be concerned with these differences. librosa interprets the relevant information in the file format to produce a tuple (x, sr), where x is a NumPy array. What do you think sr is?

In [36]:
xs, Fs = librosa.load('out.wav')

3.2 Visualising an audio file¶

In [37]:
def show_waveform(x, Fs):
    """Plot the waveform of a signal against time.

    Args:
        x (np.ndarray): Signal
        Fs (scalar): Sampling rate 

    Returns:
        nothing
    """
    t = np.arange(len(x)) / Fs
    plt.figure()
    plt.plot(t, x)
    plt.xlabel('Time (seconds)')
    plt.ylabel('Amplitude')
    plt.show()
In [38]:
show_waveform(generate_sinusoid(1, 512, 0.2, 20, 2)[0], 512)
[Figure: waveform of a 20 Hz sinusoid, amplitude against time in seconds]
In [39]:
y, sr = librosa.load(librosa.util.example('trumpet'), duration=10)
In [40]:
ipd.Audio(y, rate=sr)
Out[40]:
[embedded audio player]
In [41]:
show_waveform(y, sr)
[Figure: waveform of the trumpet excerpt]

Conveniently enough, we do not need to write our own plotting code, as librosa provides some convenience functions to do so. For example, librosa.display.waveshow supports stereo signals (something we don't have time to cover).

In [42]:
librosa.display.waveshow(y, sr=sr)
Out[42]:
<librosa.display.AdaptiveWaveplot at 0x7f8dc520c7f0>
[Figure: librosa.display.waveshow plot of the trumpet excerpt]
In [43]:
librosa.display.waveshow(y[:100], sr=sr, marker='.')
Out[43]:
<librosa.display.AdaptiveWaveplot at 0x7f8dc5091fa0>
[Figure: the first 100 samples of the trumpet excerpt, plotted with sample markers]

However, it (evidently) uses matplotlib under the hood, so you can adapt or extend it as necessary, for example to build up a figure from multiple subplots using the ax= parameter.

3.3 Estimating fundamental frequency by peak finding¶

Let's have a closer look at the waveform plot of the trumpet recording. We know that for simple sounds we can measure the distance from peak to peak to compute the frequency of a signal that might generate it, and we can do something similar here.

In [44]:
snippet = y[3000:3500]
librosa.display.waveshow(snippet, sr=sr)
Out[44]:
<librosa.display.AdaptiveWaveplot at 0x7f8dc52d47c0>
[Figure: waveform of the 500-sample trumpet snippet]

We are ultimately trying to estimate the fundamental frequency of the note that we hear, which corresponds to the sinusoidal component that contributes most prominently to our sense of what the pitch of the sound is. This is only really viable for very straightforward sounds. The difficulty of this approach in settings where, for example, multiple instruments are playing at once is what motivates analysis in the frequency domain, using the Fourier transform.

We can use a librosa function called peak_pick, which implements a simple peak-finding algorithm. You should invoke it with the following parameters: librosa.util.peak_pick(x, pre_max=25, post_max=25, pre_avg=25, post_avg=25, delta=0.1, wait=10).

Write a function estimate_frequency(x, Fs) that uses peak picking to estimate the frequency of the most significant periodic component in the signal, returning this in Hertz (Hz).

In [ ]:
def estimate_frequency(x, Fs):
    """Provide a rough estimate of the frequency

    Args:
        x (np.ndarray): Signal
        Fs (scalar): Sampling rate 

    Returns:
        f_estimate (float): Estimate of the frequency (in Hz) based
          on computing distances between detected peaks.
    """
    # vvvvvvvvvvvvvvvvvvvvv
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^
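
One possible sketch: find peaks with the suggested parameters, take the average spacing between consecutive peaks (in samples) as the period, and convert it to Hertz.

In [ ]:
# A possible sketch: average peak-to-peak spacing in samples, converted to Hz
def estimate_frequency_sketch(x, Fs):
    peaks = librosa.util.peak_pick(x, pre_max=25, post_max=25, pre_avg=25,
                                   post_avg=25, delta=0.1, wait=10)
    period_samples = np.mean(np.diff(peaks))   # samples per cycle, on average
    return Fs / period_samples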
In [46]:
estimate_frequency(snippet, Fs=sr)
Out[46]:
621.8004338394794
In [47]:
ipd.Audio(snippet, rate=sr)
Out[47]:
[embedded audio player]
In [48]:
x_est, t_est = generate_sinusoid(dur=2, Fs=16000, amp=1, freq=622.75, phase=0)
ipd.Audio(x_est, rate=16000)
Out[48]:
[embedded audio player]

3.4 Programmatic editing of sound files¶

At this point we are used to the idea that sample indexes into arrays give us access to audio data, which we can use to reason about the phenomena they represent. We have also been introduced to the idea that we can compute simple features (e.g. an estimate of frequency) over small chunks of audio data.

This last section deals briefly with the librosa.effects.remix function, and then shows how detected beat locations can be used to segment audio files into smaller chunks.

We examine how to compute very simple features for these segments. Finally, we reorder these segments and listen to the result. This can be a useful strategy for exploring a musical dataset or for stimulating creative sound editing. For example, we can compute some low level feature and sort the segments by this feature. Or, we can start to "mosaic" very short segments, from a variety of sound sources, together into a single recording: a kind of musical collage.

First, we need a recording with a prominent beat. The beat is what we tap or clap along to; the beat is regular and is perceptible as such in a band of about 30-300 bpm.

But in this example there is much else besides the musical articulations of the beat (such as the low kick drum): other, faster-moving drum rhythms, and bass guitar notes that are higher in pitch and also more numerous in their onsets.

In [49]:
drum_x, drum_Fs = librosa.load(librosa.example('choice'))
ipd.Audio(drum_x, rate=drum_Fs)
Out[49]:
[embedded audio player]

Next, we use librosa.beat.beat_track, a function which takes a signal and returns an estimate of the tempo of the track (essentially the frequency of the beat), together with an array of locations where the estimated beats fall, expressed in terms of frames, samples, or time.

This is typical of librosa, which often provides facilities to convert between sample indices and times, given the correct sampling rate. For more details, see the documentation for this function.

In [50]:
tempo, beats_t = librosa.beat.beat_track(y=drum_x, sr=drum_Fs, units='time')
In [51]:
beats_t
Out[51]:
array([ 0.06965986,  0.48761905,  0.92879819,  1.36997732,  1.81115646,
        2.22911565,  2.69351474,  3.13469388,  3.57587302,  4.01705215,
        4.45823129,  4.89941043,  5.34058957,  5.78176871,  6.22294785,
        6.66412698,  7.10530612,  7.54648526,  7.9876644 ,  8.42884354,
        8.87002268,  9.31120181,  9.75238095, 10.19356009, 10.63473923,
       11.05269841, 11.49387755, 11.95827664, 12.39945578, 12.84063492,
       13.28181406, 13.7229932 , 14.16417234, 14.60535147, 15.02331066,
       15.48770975, 15.92888889, 16.37006803, 16.81124717, 17.2524263 ,
       17.69360544, 18.11156463, 18.55274376, 19.01714286, 19.458322  ,
       19.89950113, 20.34068027, 20.78185941, 21.22303855, 21.66421769,
       22.08217687, 22.54657596, 22.9877551 , 23.40571429])

We can use matplotlib to visualise the temporal location of the detected events on top of the waveform plot. The below shows an idiomatic use of librosa's plotting capabilities. Note that ax.legend() and the label parameter can be used to clearly state the source of the data being plotted, and that the axes are correctly and clearly labeled.

In [52]:
fig, ax = plt.subplots(figsize=(18,5))

librosa.display.waveshow(drum_x, ax=ax, label='Waveform (choice.wav)')

ax.vlines(beats_t, ymin=np.min(drum_x), ymax=np.max(drum_x), 
          color='red', label='Detected beats\n(librosa.beat.beat_track)')

ax.legend()

plt.show()
[Figure: waveform of the excerpt with detected beats marked as vertical red lines]

The last piece of the puzzle involves manipulating the original audio so as to reorder chunks of samples ("frames"). You could implement this yourself (please try this if you have time), or you can use the librosa.effects.remix facility, which consumes an audio array and a list of intervals (each a start and end index) and returns a new audio array, remixed by reordering the source according to that list of intervals.

Write a function reverse_by_beat which, given a musical track with a prominent beat, will return the track "reversed" by beat, with the individual beats in the original track appearing in reverse order.

In [ ]:
def reverse_by_beat(x, Fs):
    """Reverse a music track by-beat, by doing beat detection,
         segmenting the original track into frames, and
         reordering the segments in reverse order.

    Args:
        x (np.ndarray): Signal
        Fs (scalar): Sampling rate 

    Returns:
        x_reversed (np.ndarray): Remixed music signal.
    """
    # vvvvvvvvvvvvvvvvvvvvv
    # Put your code here!
    # ^^^^^^^^^^^^^^^^^^^^^
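
One possible sketch: detect the beats in samples, turn consecutive beat positions into (start, end) intervals, reverse the list of intervals, and hand it to librosa.effects.remix.

In [ ]:
# A possible sketch: beat-synchronous intervals, reversed, then remixed
def reverse_by_beat_sketch(x, Fs):
    _, beats = librosa.beat.beat_track(y=x, sr=Fs, units='samples')
    boundaries = np.concatenate(([0], beats, [len(x)]))
    intervals = np.column_stack((boundaries[:-1], boundaries[1:]))
    return librosa.effects.remix(x, intervals[::-1])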
In [54]:
ipd.Audio(reverse_by_beat(drum_x, drum_Fs), rate=drum_Fs)
Out[54]:
[embedded audio player]

And just so we are perfectly clear, this is what the same excerpt sounds like when reversed on a samplewise basis (i.e. reading the audio file from back to front).

In [55]:
ipd.Audio(drum_x[::-1], rate=drum_Fs)
Out[55]:
[embedded audio player]

Now think about other ways to provide an ordering on the intervals that could be used in a programmatic remix, or other ways/criteria that could be used to identify segmentations of a signal. Have a look, for example, at librosa.onset.onset_detect, which will trigger much more frequently (and irregularly) than the beat detector.

Can you use your implementation of estimate_frequency to "sort" these segments by pitch? A rough sketch of one way to do this follows. Next week, we will define more complex features to describe the pitch and harmonic content of musical sounds (drawing on spectrogram representations). If you are interested in learning more, take a look at the contents of librosa.feature.
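
The sketch below assumes you have implemented estimate_frequency from section 3.3; it reuses the beat-synchronous intervals idea and plays the segments in order of their estimated frequency.

In [ ]:
# A rough sketch (assumes estimate_frequency from section 3.3 is implemented):
# order the beat-synchronous segments by their estimated frequency
_, beats = librosa.beat.beat_track(y=drum_x, sr=drum_Fs, units='samples')
boundaries = np.concatenate(([0], beats, [len(drum_x)]))
intervals = np.column_stack((boundaries[:-1], boundaries[1:]))
freqs = [estimate_frequency(drum_x[start:end], drum_Fs) for start, end in intervals]
sorted_intervals = intervals[np.argsort(freqs)]
ipd.Audio(librosa.effects.remix(drum_x, sorted_intervals), rate=drum_Fs)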

Recall the MusicMappr application I presented in the first lecture (https://fatsmcgee.github.io/MusicMappr/). You can combine feature extraction and clustering (e.g. using sklearn or your own ideas) to determine the sequence in which segments are played. Or, you could use some other technique to minimise/maximise some cost function, which in turn depends on the structure of the audio. Have a look at this re-implementation of The Eternal Jukebox by Paul Lamere, which he wrote up in 2012 (https://musicmachinery.com/2012/11/12/the-infinite-jukebox/).

In [56]:
dir(librosa.feature)
Out[56]:
['chroma_cens',
 'chroma_cqt',
 'chroma_stft',
 'chroma_vqt',
 'delta',
 'fourier_tempogram',
 'inverse',
 'melspectrogram',
 'mfcc',
 'poly_features',
 'rms',
 'spectral_bandwidth',
 'spectral_centroid',
 'spectral_contrast',
 'spectral_flatness',
 'spectral_rolloff',
 'stack_memory',
 'tempo',
 'tempogram',
 'tempogram_ratio',
 'tonnetz',
 'zero_crossing_rate']