diff --git a/src/extractors/generic.py b/src/extractors/generic.py index c4e6a88..03e42d8 100644 --- a/src/extractors/generic.py +++ b/src/extractors/generic.py @@ -36,11 +36,12 @@ def try_common_paths (verbosity, url, args): for path in common_paths: page,response_code = download (platform, url + '/' + path, args, verbosity, True) if response_code == 200: - # TODO: verify it is a valid RSS feed - # Some pages serve response 200 for invalid pages - - # assume we found a feed - return url + '/' + path + # basic check that it looks like an RSS or Atom file + if "