diff --git a/utils.py b/utils.py index 9febca5..c7b9722 100644 --- a/utils.py +++ b/utils.py @@ -160,7 +160,7 @@ def clean_title(title): if found: line = line[found.end():] line = unlabeled_link_pattern.sub(r'\1', line) - line = line.replace('\t', ' ') + line = line.replace('\t', ' ').replace('\r', '') cleaned.append(line) title = ' '.join(cleaned).strip() return title @@ -225,7 +225,7 @@ def prefix_links(src, prefix):   def strip_invalid(src): - return src.replace('\x00', '') + return src.replace('\x00', '').replace('\r', '')   def shorten_text(text, n):