mirror of
https://github.com/pirate/ArchiveBox.git
synced 2025-09-01 10:23:38 +02:00
fix parsing links from stdin with whitespace
This commit is contained in:
@@ -262,6 +262,7 @@ def parse_plain_text(text_file):
    urls = re.findall(URL_REGEX, line)

    for url in urls:
        url = url.strip()
        info = {
            'url': url,
            'domain': domain(url),
Reference in New Issue
Block a user