Bug fix museodelprado.es URL

This commit is contained in:
Edward Betts 2019-09-27 14:17:07 +01:00
parent d7df704327
commit 541443df02

View file

@@ -3,7 +3,7 @@ import lxml.html
import os
import re
re_url = re.compile(r'www.museodelprado.es/en/.*/([^/]+)$')
re_url = re.compile(r'www.museodelprado.es/(.+)$')
def get_html(url):
catalog_id = re_url.search(url).group(1).replace('/', '_')