# Spaces: Runtime error
from math import log2, pow

import gradio as gr
import numpy as np
from gradio.media import get_audio
from scipy.fftpack import fft
# Reference tuning: concert pitch A4 is fixed at 440 Hz.
A4 = 440
# C0 sits 4.75 octaves (57 semitones) below A4; get_pitch counts semitones
# upward from this frequency.
C0 = A4 * pow(2, -4.75)
# Pitch-class names indexed by semitone offset above C (0 = C ... 11 = B).
name = ["C", "C#", "D", "D#", "E", "F", "F#", "G", "G#", "A", "A#", "B"]
def get_pitch(freq):
    """Return the name of the pitch class closest to a frequency.

    The frequency is converted to a whole number of equal-tempered semitones
    above ``C0`` and reduced modulo 12, so the octave is discarded and only
    the note name remains.

    Args:
        freq: Frequency in hertz; must be a positive number.

    Returns:
        The matching entry of ``name`` (for example ``"A"`` for 440 Hz).

    Raises:
        ValueError: If ``freq`` is zero, negative or NaN.
    """
    # `not freq > 0` (rather than `freq <= 0`) also rejects NaN, which would
    # otherwise surface as an unrelated-looking error from log2/round.
    if not freq > 0:
        raise ValueError(
            f"freq must be a positive frequency in Hz, got {freq!r}"
        )
    semitones_above_c0 = round(12 * log2(freq / C0))
    return name[semitones_above_c0 % 12]
def main_note(audio):
    """Estimate how a clip's spectral magnitude is spread over pitch classes.

    The clip is Fourier-transformed, every positive-frequency bin below the
    Nyquist frequency is assigned to its nearest pitch class (same mapping as
    ``get_pitch``: semitones above ``C0`` modulo 12), and the bin magnitudes
    are summed per pitch class and normalised so the returned shares add up
    to 1.

    Args:
        audio: ``(rate, samples)`` pair - the sample rate in Hz and the sample
            array. For a 2-D array only the first column is analysed (the
            first channel, assuming a ``(n_samples, n_channels)`` layout).
            ``None`` (nothing recorded) is accepted.

    Returns:
        Dict mapping pitch-class name to its share of the total magnitude as
        a plain ``float``. Only pitch classes that received at least one
        frequency bin are present. An empty dict is returned when there is
        nothing to analyse: no audio, fewer than four samples, or silence.
    """
    if audio is None:
        return {}

    rate, samples = audio
    samples = np.asarray(samples)
    if samples.ndim == 2:
        samples = samples[:, 0]

    n_samples = len(samples)
    half = n_samples // 2
    # Bins 1 .. half-1 are the usable positive frequencies; bin 0 is the DC
    # offset, which carries no pitch.
    if half < 2:
        return {}

    # Only ratios are reported, so the usual 2/N amplitude scaling is omitted.
    magnitudes = np.abs(fft(samples)[1:half])
    total = magnitudes.sum()
    # DC is excluded from the total as well, so the shares sum to 1.
    # `not total > 0` also covers a NaN total.
    if not total > 0:
        return {}

    # FFT bin k corresponds to k * rate / N hertz.
    freqs = np.arange(1, half) * (rate / n_samples)
    pitch_index = np.rint(12 * np.log2(freqs / C0)).astype(int) % 12

    n_pitches = len(name)
    shares = np.bincount(pitch_index, weights=magnitudes, minlength=n_pitches)
    shares = shares / total
    populated = np.bincount(pitch_index, minlength=n_pitches) > 0
    return {name[i]: float(shares[i]) for i in np.flatnonzero(populated)}
# Web UI: record from the microphone, run main_note on the clip, and show the
# four strongest pitch classes as a label with confidences.
demo = gr.Interface(
    fn=main_note,
    inputs=gr.Audio(sources=["microphone"]),
    outputs=gr.Label(num_top_classes=4),
    examples=[
        [get_audio("recording1.wav")],
        [get_audio("cantina.wav")],
    ],
    api_name="predict",
)

# Start the server only when run as a script, not when imported.
if __name__ == "__main__":
    demo.launch()