shaddyshad · May 1, 2020 09:38
diff --git a/main.py b/main.py
 import re 
 import requests
 from bs4 import BeautifulSoup

 def extract_images(site):
    """Download the JPG, GIF and PNG images referenced by a page's <img> tags.

    The page at ``site`` is fetched and parsed with BeautifulSoup. Every
    ``<img>`` tag that has a ``src`` is resolved against ``site``; when the
    resolved URL's path ends in ``<name>.jpg``, ``.gif`` or ``.png`` the image
    is downloaded and written to the current working directory under that
    name. Images that share a file name overwrite one another.

    Args:
        site: URL of the page to scan for images.

    Returns:
        None. Progress and skipped images are reported with ``print``.
    """
    # Local import: keeps this function self-contained without touching the
    # file's import block.
    from urllib.parse import urljoin, urlparse

    # Last path segment ending in a supported extension; built once instead
    # of on every loop iteration. (\w already covers "_".)
    pattern = re.compile(r'/([\w-]+[.](jpg|gif|png))$')

    response = requests.get(site)
    soup = BeautifulSoup(response.text, 'html.parser')

    for img in soup.find_all('img'):
        # <img> tags without a src (e.g. lazy-loaded ones) used to raise
        # KeyError; skip them instead.
        src = img.get('src')
        if not src:
            continue

        # urljoin leaves absolute URLs untouched and resolves relative,
        # root-relative and protocol-relative ones against the page URL,
        # ignoring any fragment or file part of ``site``.
        url = urljoin(site, src)

        # Match on the path only, so a query string or fragment after the
        # file name does not hide the extension.
        filename = pattern.search(urlparse(url).path)
        if not filename:
            print("No filename {}".format(src))
            continue

        print(url)

        # Download before opening the file so a failed request does not
        # leave an empty or bogus image on disk.
        image = requests.get(url)
        if not image.ok:
            print("Download failed ({}) {}".format(image.status_code, url))
            continue

        with open(filename.group(1), 'wb') as f:
            f.write(image.content)


 if __name__ == "__main__":
    # Script entry point: download the images of the hard-coded page below.
    site = "https://heartofvegasslots.com/#="
    extract_images(site)
	import re
	import requests
	from bs4 import BeautifulSoup

	def extract_images(site):
	    """Download the JPG, GIF and PNG images referenced by a page's <img> tags.

	    The page at ``site`` is fetched and parsed with BeautifulSoup. Every
	    ``<img>`` tag that has a ``src`` is resolved against ``site``; when the
	    resolved URL's path ends in ``<name>.jpg``, ``.gif`` or ``.png`` the
	    image is downloaded and written to the current working directory under
	    that name. Images that share a file name overwrite one another.

	    Args:
	        site: URL of the page to scan for images.

	    Returns:
	        None. Progress and skipped images are reported with ``print``.
	    """
	    # Local import: keeps this function self-contained without touching
	    # the file's import block.
	    from urllib.parse import urljoin, urlparse

	    # Last path segment ending in a supported extension. The alternation
	    # uses plain "|" (the escaped "\|" matched literal pipe characters),
	    # and the pattern is built once instead of on every iteration.
	    pattern = re.compile(r'/([\w-]+[.](jpg|gif|png))$')

	    response = requests.get(site)
	    soup = BeautifulSoup(response.text, 'html.parser')

	    for img in soup.find_all('img'):
	        # <img> tags without a src (e.g. lazy-loaded ones) used to raise
	        # KeyError; skip them instead.
	        src = img.get('src')
	        if not src:
	            continue

	        # urljoin leaves absolute URLs untouched and resolves relative,
	        # root-relative and protocol-relative ones against the page URL,
	        # ignoring any fragment or file part of ``site``.
	        url = urljoin(site, src)

	        # Match on the path only, so a query string or fragment after the
	        # file name does not hide the extension.
	        filename = pattern.search(urlparse(url).path)
	        if not filename:
	            print("No filename {}".format(src))
	            continue

	        print(url)

	        # Download before opening the file so a failed request does not
	        # leave an empty or bogus image on disk.
	        image = requests.get(url)
	        if not image.ok:
	            print("Download failed ({}) {}".format(image.status_code, url))
	            continue

	        with open(filename.group(1), 'wb') as f:
	            f.write(image.content)


	if __name__ == "__main__":
	    # Script entry point: download the images of the hard-coded page below.
	    site = "https://heartofvegasslots.com/#="

	    extract_images(site)