Added some more non-ASCII characters to be translated.

4 years ago · 3c57ea22e8
parent 92204ca22c
commit 3c57ea22e8
1 changed file with 2 additions and 1 deletion
--- a/asl_articles/utils.py
+++ b/asl_articles/utils.py
@@ -86,7 +86,8 @@ def clean_html( val, allow_tags=None, safe_attrs=None ): #pylint: disable=too-ma
    val = replace_chars( val, '"', [ "\u00ab", "\u00bb", "\u201c", "\u201d", "\u201e", "\u201f" ] )
    val = replace_chars( val, "'", [ "\u2018", "\u2019", "\u201a", "\u201b", "\u2039", "\u203a" ] )
    val = replace_chars( val, r"\1 - \2", [ re.compile( r"(\S+)\u2014(\S+)" ) ] )
-    val = replace_chars( val, "-", [ "\u2014" ] )
+    val = replace_chars( val, "-", [ "\u2013", "\u2014" ] )
+    val = replace_chars( val, "...", [ "\u2026" ] )

    # FUDGE! lxml replaces HTML entities with their actual character :-/ It's possible to stop it from doing this,
    # by passing in an ElementTree, which gives us an ElementTree back, and we can then control how it is serialized