Preserve the order of URLs fetched from a page -- especially important for anthologies.

This commit is contained in:
Jim Miller 2015-06-09 13:08:56 -05:00
parent 390c661a88
commit 69d1ce6c01

View file

@@ -117,7 +117,7 @@ def get_urls_from_html(data,url=None,configuration=None,normalize=False,restrict
def get_urls_from_text(data,configuration=None,normalize=False): def get_urls_from_text(data,configuration=None,normalize=False):
urls = collections.OrderedDict(list) urls = collections.OrderedDict()
data=unicode(data) data=unicode(data)
if not configuration: if not configuration: