Added 'Python/asciifarts_scrapper.py'

2024-12-10 20:39:02 +01:00
parent 253a4d7529
commit 9ddf68f653
1 changed files with 33 additions and 0 deletions
--- a/Python/asciifarts_scrapper.py
+++ b/Python/asciifarts_scrapper.py
@ -0,0 +1,33 @@
 import requests
 import bs4
 import re
 base_url = "http://www.asciiartfarts.com/"
 hub_url  = "http://www.asciiartfarts.com/number.html"
 out_dir  = "out/"
 hub = bs4.BeautifulSoup(requests.get(hub_url).text, 'html.parser')
 href_list = set()
 for a in hub.find('ul').find('li').find_all('a'):
 	try: href = a['href']
 	except: continue
 	if re.match(r'\d+.html', href):
 		href_list.add(href)
 #print(href_list)
 for h in href_list:
 	page = bs4.BeautifulSoup(requests.get(base_url + h).text, 'html.parser')
 	name = (page
 			.find('h1')
 			.text.split(':')[1]
 			.strip()
 			.replace(' ', '_')
 			.replace('/', '_')
 			+ '.ascii'
 	)
 	ascii_art = page.find_all('pre')[1].text
 	print(name)
 	with open(out_dir + name, 'w') as f: f.write(ascii_art)