diff --git a/scripts/extractors/generic.py b/scripts/extractors/generic.py index 5715ee0..c1bdd0f 100644 --- a/scripts/extractors/generic.py +++ b/scripts/extractors/generic.py @@ -128,6 +128,10 @@ def extract (url, page=None, network=False, verbosity=3, args={}): feed = extract_from_page (page, verbosity, url, args) if not feed is None: if feed.startswith("/"): - domain = url[:url.find("/",url.find("//")+2)] + index = url.find("/",url.find("//")+2) + if index == -1: + domain = url + else: + domain = url[:index] feed = domain + feed return feed diff --git a/scripts/extractors/tumblr.py b/scripts/extractors/tumblr.py index 0476945..351e2e3 100644 --- a/scripts/extractors/tumblr.py +++ b/scripts/extractors/tumblr.py @@ -12,8 +12,12 @@ if platform.endswith(".py"): def extract_from_url (url, verbosity): # split into domain and path index = url.find("/",url.find("//")+2) - domain = url[:index] - path = url[index:] + if index == -1: + domain = url + path = "/" + else: + domain = url[:index] + path = url[index:] primary_domain = { "https://tumblr.com",