{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# PyTorch VGGish" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "%reload_ext autoreload\n", "%autoreload 2\n", "%matplotlib inline" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "import os" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "from local.torch_basics import *\n", "from local.test import *\n", "from local.basics import *\n", "from local.data.all import *\n", "from local.vision.core import *\n", "from local.notebook.showdoc import show_doc\n", "from local.audio.core import *\n", "from local.audio.augment import *\n", "from local.vision.learner import *\n", "from local.vision.models.xresnet import *\n", "from local.metrics import *\n", "from local.callback.schedule import *\n", "import torchaudio\n", "from IPython.display import Audio, display" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# Locations of the ESC-50 dataset, all derived from the configured data path.\n", "# The download/extract step (last line of this cell) is left disabled, so the\n", "# archive is expected to be extracted already.\n", "#def arc_extract(fname, dest): Archive(fname).extractall(dest)\n", "URLs.ESC50 = 'https://github.com/karoldvl/ESC-50/archive/master.zip'\n", "pESC50 = Config()['data_path'] / 'ESC-50/ESC-50-master'\n", "PATH_AUDIO = pESC50/\"audio\"\n", "PATH_CSV = pESC50/\"meta/esc50.csv\"\n", "# Fail early with an actionable message: without the download step the metadata\n", "# CSV does not exist on a fresh machine and read_csv would fail without saying why.\n", "if not os.path.exists(PATH_CSV):\n", "    raise FileNotFoundError(\"ESC-50 metadata not found at \" + str(PATH_CSV) + \"; download and extract \" + URLs.ESC50 + \" so that \" + str(pESC50) + \" exists\")\n", "DF = pd.read_csv(PATH_CSV)\n", "#untar_data(URLs.ESC50, fname=str(pESC50)+'.zip', dest=pESC50, extract_func=arc_extract)" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# Build an AudioGetter with recurse=True and apply it to the ESC-50 root;\n", "# the result is kept in files_ESC50 (presumably the list of audio files - TODO confirm).\n", "x = AudioGetter(\"\", recurse=True, folders=None)\n", "files_ESC50 = x(pESC50)\n", "#original_aud = AudioItem.create(files_ESC50[0])" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | filename | \n", "fold | \n", "target | \n", "category | \n", "esc10 | \n", "src_file | \n", "take | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "1-100032-A-0.wav | \n", "1 | \n", "0 | \n", "dog | \n", "True | \n", "100032 | \n", "A | \n", "
1 | \n", "1-100038-A-14.wav | \n", "1 | \n", "14 | \n", "chirping_birds | \n", "False | \n", "100038 | \n", "A | \n", "
2 | \n", "1-100210-A-36.wav | \n", "1 | \n", "36 | \n", "vacuum_cleaner | \n", "False | \n", "100210 | \n", "A | \n", "
3 | \n", "1-100210-B-36.wav | \n", "1 | \n", "36 | \n", "vacuum_cleaner | \n", "False | \n", "100210 | \n", "B | \n", "
4 | \n", "1-101296-A-19.wav | \n", "1 | \n", "19 | \n", "thunderstorm | \n", "False | \n", "101296 | \n", "A | \n", "