import tempfile

import librosa
import numpy as np
from pytube import YouTube


def download_youtube_audio(url, sr=44100):
    """Download the audio track of a YouTube video and return it as samples.

    The first audio-only stream reported by pytube is downloaded into a
    temporary directory, decoded with librosa, and the temporary file is
    removed again before returning.

    Args:
        url: URL of the YouTube video.
        sr: Target sample rate passed to ``librosa.load``. Defaults to
            44100, matching the previous hard-coded value.

    Returns:
        A NumPy array with the channel axis last (the transpose of what
        ``librosa.load(..., mono=False)`` returns). A single-channel
        recording is duplicated so the result has two identical channels.

    Raises:
        ValueError: If the video exposes no audio-only stream.
    """
    yt = YouTube(url)
    stream = yt.streams.filter(only_audio=True).first()
    if stream is None:
        # .first() yields None on an empty query; fail with a clear message
        # instead of an AttributeError on ``None.download``.
        raise ValueError(f"No audio-only stream available for {url!r}")

    # Download into a throwaway directory so repeated calls neither litter
    # the working directory nor collide on file names.
    with tempfile.TemporaryDirectory() as tmp_dir:
        filename = stream.download(output_path=tmp_dir)
        # The decoded array is fully in memory once load() returns, so the
        # file can be deleted as soon as the ``with`` block exits.
        audio, _ = librosa.load(filename, sr=sr, mono=False)

    if audio.ndim == 1:
        # Mono input comes back 1-D; duplicate it into two channels.
        audio = np.stack([audio, audio])
    return audio.T