@Davey-Hughes
Last active December 22, 2021 19:27
Download CO Covid Outbreak File

Notes

  • if __name__ == '__main__' is just a convention to create a main() entry point for the code
  • Command line arguments can easily be added by importing sys and using the sys.argv list
  • argparse can also be used for richer argument handling (see the sketch after these notes)
  • This basic version uses wget to download the file it finds. More arguments can be passed to wget through the existing subprocess.run() call (see the first sketch after the wget script)
  • wget has some helpful options that may be worth considering, depending on preference:
    • --no-clobber or -nc skips the download if a file with the same name already exists
    • -N (timestamping) re-downloads, and overwrites, an existing file only when the remote copy is newer
    • -O can be used to specify the output file name, which is useful if a standardized name is required (such as one based on the current date)
  • curl can be used instead of the requests library (see the second sketch after the wget script)
  • For the pandas version, while testing it is better to download the file once and read the local copy, rather than fetching it from the URL on every run (see the sketch after the pandas script)
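As an illustration of the argument notes above, here is a minimal argparse sketch; the --output and --quiet options are invented for this example and are not part of the original gist.

import argparse
import sys


def parse_args():
    parser = argparse.ArgumentParser(description='Download the CO COVID outbreak file')

    # hypothetical options, purely for illustration
    parser.add_argument('-o', '--output', help='save the spreadsheet under this name')
    parser.add_argument('-q', '--quiet', action='store_true', help='suppress wget output')

    # argparse reads sys.argv[1:] by default; passed explicitly here to show the link
    return parser.parse_args(sys.argv[1:])


if __name__ == '__main__':
    args = parse_args()
    print(args.output, args.quiet)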
wget version

import subprocess

import requests
from bs4 import BeautifulSoup

CO_COVID_URL = 'https://covid19.colorado.gov/covid19-outbreak-data'


def main():
    # download the page source
    page = requests.get(CO_COVID_URL)

    # parse the page with beautiful soup's HTML parser
    soup = BeautifulSoup(page.text, 'html.parser')

    # find the first element with class 'file-link'
    file_class = soup.find(class_='file-link')

    # get the href of the <a> tag inside that element
    file_href = file_class.find('a', href=True)['href']

    # download the file using the wget command line utility
    subprocess.run(['wget', file_href], check=True)


if __name__ == '__main__':
    main()
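A sketch of extending the subprocess.run() call with the wget options mentioned in the notes; the date-based output name is only one possible convention, and file_href stands in for the link parsed above.

from datetime import date
import subprocess

# placeholder for the link parsed out of the page above
file_href = 'https://example.com/outbreaks.xlsx'

# name the download after the current date, e.g. co_outbreaks_2021-12-22.xlsx
out_name = f'co_outbreaks_{date.today().isoformat()}.xlsx'

# -O sets the output file name; --no-clobber could be used instead of -O to skip
# the download entirely when a file with the same name already exists
subprocess.run(['wget', '-O', out_name, file_href], check=True)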
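And a sketch of fetching the page with curl instead of the requests library; only the page download changes, the BeautifulSoup parsing stays the same.

import subprocess

from bs4 import BeautifulSoup

CO_COVID_URL = 'https://covid19.colorado.gov/covid19-outbreak-data'

# -s silences curl's progress meter; capture_output collects the HTML from stdout
page = subprocess.run(['curl', '-s', CO_COVID_URL],
                      capture_output=True, text=True, check=True)

soup = BeautifulSoup(page.stdout, 'html.parser')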
pandas version

import requests
from bs4 import BeautifulSoup
import pandas as pd

CO_COVID_URL = 'https://covid19.colorado.gov/covid19-outbreak-data'


def main():
    # download the page source
    page = requests.get(CO_COVID_URL)

    # parse the page with beautiful soup's HTML parser
    soup = BeautifulSoup(page.text, 'html.parser')

    # find the first element with class 'file-link'
    file_class = soup.find(class_='file-link')

    # get the href of the <a> tag inside that element
    file_href = file_class.find('a', href=True)['href']

    # load every sheet from the URL into a dict of pandas dataframes
    file = pd.read_excel(file_href, sheet_name=None)

    # print a preview of each sheet
    print(file)


if __name__ == '__main__':
    main()
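For the testing note above, a sketch that reads a previously downloaded copy instead of fetching the spreadsheet on every run; the local file name is an assumption, and pandas needs an Excel engine such as openpyxl installed to read .xlsx files.

import pandas as pd

# assumed name of a copy downloaded once, e.g. with the wget version above
LOCAL_COPY = 'covid19_outbreaks.xlsx'

# sheet_name=None returns a dict mapping sheet names to dataframes
sheets = pd.read_excel(LOCAL_COPY, sheet_name=None)

for name, df in sheets.items():
    print(name)
    print(df.head())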