diff --git a/requirements.txt b/requirements.txt index 6baa507f..f053885b 100644 --- a/requirements.txt +++ b/requirements.txt @@ -3,3 +3,4 @@ feedparser lxml Pillow datetime +beautifulsoup4 \ No newline at end of file diff --git a/spoilers.py b/spoilers.py index f4be14f0..d0d5c5f5 100644 --- a/spoilers.py +++ b/spoilers.py @@ -12,6 +12,9 @@ import datetime import urllib import json import xml.dom.minidom +from bs4 import BeautifulSoup as BS +from bs4 import Comment + def scrape_mtgs(url): return requests.get(url, headers={'Cache-Control':'no-cache', 'Pragma':'no-cache', 'Expires': 'Thu, 01 Jan 1970 00:00:00 GMT'}).text @@ -1146,3 +1149,81 @@ def add_headers(mtgjson, setinfos): if 'blockname' in setinfos: mtgjson2['block'] = setinfos['blockname'] return mtgjson2 + +def get_mythic_cards(url='http://mythicspoiler.com/ixa/', mtgjson=False): #mtgjson is optional, will ignore cards found if passed + cards = {'cards':[]} + r = requests.get(url) + soup = BS(r.text, "html.parser") + cardurls = soup.find_all('a', 'card') + urllist = [] + for cardurl in cardurls: + try: + urllist.append(url + str(cardurl).split("href=\"")[1].split('">