Don't remove the query string when uniquifying links

This commit is contained in:
Nick Sweeting 2018-04-17 03:54:59 -04:00
parent 542b1d14f6
commit 0099849df9

View file

@@ -33,7 +33,7 @@ without_query = lambda url: url.split('?', 1)[0]
 without_hash = lambda url: url.split('#', 1)[0]
 without_path = lambda url: url.split('/', 1)[0]
 domain = lambda url: without_hash(without_query(without_path(without_scheme(url))))
-base_url = lambda url: without_query(without_scheme(url))
+base_url = lambda url: without_scheme(url) # uniq base url used to dedupe links
 short_ts = lambda ts: ts.split('.')[0]