|
import gradio as gr |
|
import numpy as np |
|
import matplotlib.pyplot as plt |
|
from matplotlib.animation import FuncAnimation |
|
import io |
|
import librosa |
|
import tempfile |
|
|
|
def extract_waveform_animation(audio_file, window_seconds=5): |
|
y, sr = librosa.load(audio_file, sr=None) |
|
duration = librosa.get_duration(y=y, sr=sr) |
|
|
|
fig, ax = plt.subplots() |
|
line, = ax.plot([], [], lw=2) |
|
window_length = int(window_seconds * sr) |
|
|
|
|
|
first_window = y[:window_length] |
|
x_vals = np.linspace(0, duration, num=len(y)) |
|
ax.set_axis_off() |
|
|
|
def init(): |
|
ax.set_xlim(0, window_seconds) |
|
ax.set_ylim(np.min(y), np.max(y)) |
|
return line, |
|
|
|
def update(frame): |
|
|
|
start = frame * sr |
|
end = start + window_length |
|
window = y[start:end] |
|
|
|
|
|
ax.set_xlim(frame, frame + window_seconds) |
|
|
|
|
|
line.set_data(x_vals[start:end], window) |
|
return line, |
|
|
|
total_frames = int(duration) |
|
ani = FuncAnimation(fig, update, frames=range(total_frames), |
|
init_func=init, interval=7, blit=False) |
|
|
|
with tempfile.NamedTemporaryFile(delete=False, suffix='.mp4') as tmpfile: |
|
ani.save(tmpfile.name, writer='ffmpeg', fps=1) |
|
video_path = tmpfile.name |
|
|
|
return video_path |
|
|
|
|
|
iface = gr.Interface( |
|
fn=extract_waveform_animation, |
|
inputs=[ |
|
gr.Audio(type="filepath"), |
|
gr.Slider(1, 10, value=5, step=1, label="Window Size (seconds)") |
|
], |
|
outputs=gr.Video(), |
|
description="Scroll through audio waveform with a moving window." |
|
) |
|
|
|
if __name__ == "__main__": |
|
iface.launch() |