Merge pull request #1828 from andreacorbellini/chr-to-unichr

Use unichr() instead of chr() with Python 2.
2025-10-15 20:28:56 +02:00 · 2015-09-23 09:00:09 -07:00 · 2015-09-23 09:00:09 -07:00 · 72ee73f886
commit 72ee73f886
parent b152aba6c6 c255a35800
2 changed files with 14 additions and 2 deletions
--- a/pelican/tests/test_utils.py
+++ b/pelican/tests/test_utils.py
@@ -190,6 +190,18 @@ class TestUtils(LoggedTestCase):
        self.assertEqual(
            utils.truncate_html_words("cafeti&eacute;re " * 100, 20),
            "cafeti&eacute;re " * 20 + '...')
        self.assertEqual(
            utils.truncate_html_words("&int;dx " * 100, 20),
            "&int;dx " * 20 + '...')
        # Words with HTML character references inside and outside
        # the ASCII range.
        self.assertEqual(
            utils.truncate_html_words("&#xe9; " * 100, 20),
            "&#xe9; " * 20 + '...')
        self.assertEqual(
            utils.truncate_html_words("&#x222b;dx " * 100, 20),
            "&#x222b;dx " * 20 + '...')
    def test_process_translations(self):
        # create a bunch of articles
--- a/pelican/utils.py
+++ b/pelican/utils.py
@@ -512,14 +512,14 @@ class _HTMLWordTruncator(HTMLParser):
        except KeyError:
            self.handle_ref('')
        else:
-            self.handle_ref(chr(codepoint))
+            self.handle_ref(six.unichr(codepoint))
    def handle_charref(self, name):
        if name.startswith('x'):
            codepoint = int(name[1:], 16)
        else:
            codepoint = int(name)
-        self.handle_ref(chr(codepoint))
+        self.handle_ref(six.unichr(codepoint))
 def truncate_html_words(s, num, end_text='...'):