{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Scraping and Parsing: EAD XML Finding Aids from the Library of Congress" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import os\n", "from urllib.request import urlopen\n", "from bs4 import BeautifulSoup\n", "import subprocess" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "## Create the 'LOC_Metadata' directory (if it does not already exist) and make it the current working directory.\n", "## os.makedirs(..., exist_ok=True) is used instead of the shell `!mkdir` so that re-running this cell\n", "## neither prints a 'File exists' error nor fails when the parent directory is missing.\n", "\n", "METADATA_DIR = '/sharedfolder/LOC_Metadata'\n", "\n", "os.makedirs(METADATA_DIR, exist_ok=True)\n", "\n", "os.chdir(METADATA_DIR)" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "\n", " \n", " \n", " \n", "
\n", " \n", "