pelican-theme/pelican/tests/test_importer.py

# -*- coding: utf-8 -*-
from __future__ import print_function, unicode_literals

import locale
import os
import re
from codecs import open

from pelican.settings import DEFAULT_CONFIG
from pelican.tests.support import (mute, skipIfNoExecutable, temporary_folder,
                                   unittest)
from pelican.tools.pelican_import import (blogger2fields, build_header,
                                          build_markdown_header,
                                          decode_wp_content,
                                          download_attachments, fields2pelican,
                                          get_attachments, wp2fields)
from pelican.utils import path_to_file_url, slugify

CUR_DIR = os.path.abspath(os.path.dirname(__file__))
BLOGGER_XML_SAMPLE = os.path.join(CUR_DIR, 'content', 'bloggerexport.xml')
WORDPRESS_XML_SAMPLE = os.path.join(CUR_DIR, 'content', 'wordpressexport.xml')
WORDPRESS_ENCODED_CONTENT_SAMPLE = os.path.join(CUR_DIR,
                                                'content',
                                                'wordpress_content_encoded')
WORDPRESS_DECODED_CONTENT_SAMPLE = os.path.join(CUR_DIR,
                                                'content',
                                                'wordpress_content_decoded')

try:
    from bs4 import BeautifulSoup
except ImportError:
    BeautifulSoup = False  # NOQA

try:
    import bs4.builder._lxml as LXML
except ImportError:
    LXML = False


@skipIfNoExecutable(['pandoc', '--version'])
@unittest.skipUnless(BeautifulSoup, 'Needs BeautifulSoup module')
class TestBloggerXmlImporter(unittest.TestCase):
    """Check the fields ``blogger2fields`` yields for BLOGGER_XML_SAMPLE.

    The tests read each yielded entry by position: index 0 is the title,
    2 the filename, 7 the status and 8 the kind.
    """

    def setUp(self):
        # Remember the current locale so tearDown can put it back, then run
        # the import under the 'C' locale.
        self.old_locale = locale.setlocale(locale.LC_ALL)
        locale.setlocale(locale.LC_ALL, str('C'))
        self.posts = list(blogger2fields(BLOGGER_XML_SAMPLE))

    def tearDown(self):
        locale.setlocale(locale.LC_ALL, self.old_locale)

    def test_recognise_kind_and_title(self):
        """Check that importer only outputs pages, articles and comments,
        that these are correctly identified and that titles are correct.
        """
        # Group the titles by kind in a single pass over the entries.
        titles_by_kind = {}
        for entry in self.posts:
            titles_by_kind.setdefault(entry[8], set()).add(entry[0])

        self.assertEqual({'page', 'article', 'comment'}, set(titles_by_kind))
        self.assertEqual({'Test page', 'Test page 2'},
                         titles_by_kind['page'])
        self.assertEqual({'Black as Egypt\'s Night', 'The Steel Windpipe'},
                         titles_by_kind['article'])
        self.assertEqual({'Mishka, always a pleasure to read your '
                          'adventures!...'},
                         titles_by_kind['comment'])

    def test_recognise_status_with_correct_filename(self):
        """Check that importer outputs only statuses 'published' and 'draft',
        that these are correctly identified and that filenames are correct.
        """
        # Group the filenames by status in a single pass over the entries.
        filenames_by_status = {}
        for entry in self.posts:
            filenames_by_status.setdefault(entry[7], set()).add(entry[2])

        self.assertEqual({'published', 'draft'}, set(filenames_by_status))

        # draft filenames are id-based
        self.assertEqual({'page-4386962582497458967',
                          'post-1276418104709695660'},
                         filenames_by_status['draft'])

        # published filenames are url-based, except comments
        self.assertEqual({'the-steel-windpipe',
                          'test-page',
                          'post-5590533389087749201'},
                         filenames_by_status['published'])


@skipIfNoExecutable(['pandoc', '--version'])
@unittest.skipUnless(BeautifulSoup, 'Needs BeautifulSoup module')
class TestWordpressXmlImporter(unittest.TestCase):
    """Tests for importing the sample WordPress export.

    ``self.posts`` is the result of ``wp2fields(WORDPRESS_XML_SAMPLE)`` and
    ``self.custposts`` the result of the same call with ``True`` as second
    argument.  Every entry is unpacked in these tests as the 10-tuple
    ``(title, content, fname, date, author, categ, tags, status, kind,
    in_markup)``; positional access uses the same order (0 is the title,
    2 the filename, 5 the categories, 8 the kind).
    """

    # Kinds that these tests do not count as custom post types.
    _STANDARD_KINDS = ('article', 'page')

    def setUp(self):
        # Remember the current locale so tearDown can put it back, then run
        # the import under the 'C' locale.
        self.old_locale = locale.setlocale(locale.LC_ALL)
        locale.setlocale(locale.LC_ALL, str('C'))
        self.posts = list(wp2fields(WORDPRESS_XML_SAMPLE))
        self.custposts = list(wp2fields(WORDPRESS_XML_SAMPLE, True))

    def tearDown(self):
        locale.setlocale(locale.LC_ALL, self.old_locale)

    @staticmethod
    def _read_file(path):
        """Return the content of ``path`` decoded as UTF-8."""
        with open(path, encoding='utf-8') as infile:
            return infile.read()

    def _posts_titled(self, prefix):
        """Return the entries of ``self.posts`` whose title starts with
        ``prefix``."""
        return [post for post in self.posts if post[0].startswith(prefix)]

    def _custom_posts(self):
        """Return the entries of ``self.custposts`` that are neither
        articles nor pages."""
        return [post for post in self.custposts
                if post[8] not in self._STANDARD_KINDS]

    def test_ignore_empty_posts(self):
        """ Check that every imported post has a non-blank title """
        self.assertTrue(self.posts)
        for (title, content, fname, date, author,
             categ, tags, status, kind, in_markup) in self.posts:
            self.assertTrue(title.strip())

    def test_recognise_page_kind(self):
        """ Check that we recognise pages in wordpress, as opposed to posts """
        self.assertTrue(self.posts)
        # Collect (title, filename) of the posts recognised as page
        pages_data = [
            (title, fname)
            for (title, content, fname, date, author,
                 categ, tags, status, kind, in_markup) in self.posts
            if kind == 'page']
        self.assertEqual([('Page', 'contact'), ('Empty Page', 'empty')],
                         pages_data)

    def test_dirpage_directive_for_page_kind(self):
        silent_f2p = mute(True)(fields2pelican)
        test_post = self._posts_titled("Empty Page")
        with temporary_folder() as temp:
            fname = list(silent_f2p(test_post, 'markdown',
                                    temp, dirpage=True))[0]
            self.assertTrue(fname.endswith('pages%sempty.md' % os.path.sep))

    def test_dircat(self):
        silent_f2p = mute(True)(fields2pelican)
        # Only posts with at least one category are checked; the first
        # category gives the expected directory name.
        test_posts = [post for post in self.posts if post[5]]
        with temporary_folder() as temp:
            fnames = list(silent_f2p(test_posts, 'markdown',
                                     temp, dircat=True))
        subs = DEFAULT_CONFIG['SLUG_REGEX_SUBSTITUTIONS']
        for index, post in enumerate(test_posts):
            category = slugify(post[5][0], regex_subs=subs)
            filename = os.path.join(category, post[2] + '.md')
            out_name = fnames[index]
            self.assertTrue(out_name.endswith(filename), out_name)

    def test_unless_custom_post_all_items_should_be_pages_or_posts(self):
        self.assertTrue(self.posts)
        unexpected = [
            (title, fname)
            for (title, content, fname, date, author,
                 categ, tags, status, kind, in_markup) in self.posts
            if kind not in self._STANDARD_KINDS]
        self.assertEqual([], unexpected)

    def test_recognise_custom_post_type(self):
        self.assertTrue(self.custposts)
        cust_data = [
            (title, kind)
            for (title, content, fname, date, author,
                 categ, tags, status, kind, in_markup) in self.custposts
            if kind not in self._STANDARD_KINDS]
        self.assertEqual(
            [('A custom post in category 4', 'custom1'),
             ('A custom post in category 5', 'custom1'),
             ('A 2nd custom post type also in category 5', 'custom2')],
            cust_data)

    def test_custom_posts_put_in_own_dir(self):
        silent_f2p = mute(True)(fields2pelican)
        test_posts = self._custom_posts()
        with temporary_folder() as temp:
            fnames = list(silent_f2p(test_posts, 'markdown',
                                     temp, wp_custpost=True))
        for index, post in enumerate(test_posts):
            # Expected location: <kind>/<filename>.md
            filename = os.path.join(post[8], post[2] + '.md')
            out_name = fnames[index]
            self.assertTrue(out_name.endswith(filename), out_name)

    def test_custom_posts_put_in_own_dir_and_catagory_sub_dir(self):
        silent_f2p = mute(True)(fields2pelican)
        test_posts = self._custom_posts()
        with temporary_folder() as temp:
            fnames = list(silent_f2p(test_posts, 'markdown', temp,
                                     wp_custpost=True, dircat=True))
        subs = DEFAULT_CONFIG['SLUG_REGEX_SUBSTITUTIONS']
        for index, post in enumerate(test_posts):
            # Expected location: <kind>/<slug of first category>/<filename>.md
            category = slugify(post[5][0], regex_subs=subs)
            filename = os.path.join(post[8], category, post[2] + '.md')
            out_name = fnames[index]
            self.assertTrue(out_name.endswith(filename), out_name)

    def test_wp_custpost_true_dirpage_false(self):
        # pages should only be put in their own directory when dirpage = True
        silent_f2p = mute(True)(fields2pelican)
        test_posts = [post for post in self.custposts if post[8] == 'page']
        with temporary_folder() as temp:
            fnames = list(silent_f2p(test_posts, 'markdown', temp,
                                     wp_custpost=True, dirpage=False))
        # Compare each page with its own output filename (the index has to
        # advance with the loop, otherwise only fnames[0] is ever checked).
        for index, post in enumerate(test_posts):
            filename = os.path.join('pages', post[2] + '.md')
            out_name = fnames[index]
            self.assertFalse(out_name.endswith(filename), out_name)

    def test_can_toggle_raw_html_code_parsing(self):
        silent_f2p = mute(True)(fields2pelican)

        with temporary_folder() as temp:

            def has_iframe(markup, **options):
                """Tell whether any file written for ``markup`` contains
                an ``<iframe`` tag."""
                written = silent_f2p(self.posts, markup, temp, **options)
                return any('<iframe' in self._read_file(f) for f in written)

            self.assertTrue(has_iframe('markdown'))
            self.assertFalse(has_iframe('markdown', strip_raw=True))
            # no effect in rst
            self.assertFalse(has_iframe('rst'))
            self.assertFalse(has_iframe('rst', strip_raw=True))

    def test_decode_html_entities_in_titles(self):
        test_posts = [post for post
                      in self.posts if post[2] == 'html-entity-test']
        self.assertEqual(len(test_posts), 1)

        title = test_posts[0][0]
        # Compare against the decoded title; assertTrue(title, text) would
        # only use the text as failure message and accept any non-empty
        # title.
        self.assertEqual(title, "A normal post with some <html> entities in "
                                "the title. You can't miss them.")
        self.assertNotIn('&', title)

    def test_decode_wp_content_returns_empty(self):
        """ Check that given an empty string we return an empty string."""
        self.assertEqual(decode_wp_content(""), "")

    def test_decode_wp_content(self):
        """ Check that we can decode a wordpress content string."""
        with open(WORDPRESS_ENCODED_CONTENT_SAMPLE, 'r') as encoded_file:
            encoded_content = encoded_file.read()
        with open(WORDPRESS_DECODED_CONTENT_SAMPLE, 'r') as decoded_file:
            decoded_content = decoded_file.read()
        self.assertEqual(
            decode_wp_content(encoded_content, br=False),
            decoded_content)

    def test_preserve_verbatim_formatting(self):
        silent_f2p = mute(True)(fields2pelican)
        test_post = self._posts_titled("Code in List")
        with temporary_folder() as temp:
            md = [self._read_file(f)
                  for f in silent_f2p(test_post, 'markdown', temp)][0]
            self.assertTrue(re.search(r'\s+a = \[1, 2, 3\]', md))
            self.assertTrue(re.search(r'\s+b = \[4, 5, 6\]', md))

            # Each match starts with the whitespace preceding the statement,
            # so the keyword offset reflects how far the line is indented.
            for_line = re.search(r'\s+for i in zip\(a, b\):', md).group(0)
            print_line = re.search(r'\s+print i', md).group(0)
            self.assertLess(for_line.rindex('for'),
                            print_line.rindex('print'))

    def test_code_in_list(self):
        silent_f2p = mute(True)(fields2pelican)
        test_post = self._posts_titled("Code in List")
        with temporary_folder() as temp:
            md = [self._read_file(f)
                  for f in silent_f2p(test_post, 'markdown', temp)][0]
            sample_line = re.search(r'-   This is a code sample', md).group(0)
            code_line = re.search(r'\s+a = \[1, 2, 3\]', md).group(0)
            self.assertLess(sample_line.rindex('This'), code_line.rindex('a'))

    def test_dont_use_smart_quotes(self):
        silent_f2p = mute(True)(fields2pelican)
        test_post = self._posts_titled("Post with raw data")
        with temporary_folder() as temp:
            md = [self._read_file(f)
                  for f in silent_f2p(test_post, 'markdown', temp)][0]
            escaped_quotes = re.search(r'\\[\'"“”‘’]', md)
            self.assertIsNone(escaped_quotes)


class TestBuildHeader(unittest.TestCase):
    """Check the text returned by ``build_header`` and
    ``build_markdown_header``."""

    def test_build_header(self):
        self.assertEqual(
            build_header('test', None, None, None, None, None),
            'test\n####\n\n')

    def test_build_header_with_fields(self):
        # Positional arguments shared by both header builders.
        args = [
            'Test Post',
            '2014-11-04',
            'Alexis Métaireau',
            ['Programming'],
            ['Pelican', 'Python'],
            'test-post',
        ]

        rst_lines = (
            'Test Post',
            '#########',
            ':date: 2014-11-04',
            ':author: Alexis Métaireau',
            ':category: Programming',
            ':tags: Pelican, Python',
            ':slug: test-post',
            '\n',
        )
        md_lines = (
            'Title: Test Post',
            'Date: 2014-11-04',
            'Author: Alexis Métaireau',
            'Category: Programming',
            'Tags: Pelican, Python',
            'Slug: test-post',
            '\n',
        )

        self.assertEqual(build_header(*args), '\n'.join(rst_lines))
        self.assertEqual(build_markdown_header(*args), '\n'.join(md_lines))

    def test_build_header_with_east_asian_characters(self):
        result = build_header(
            'これは広い幅の文字だけで構成されたタイトルです',
            None, None, None, None, None)

        # The underline is expected to be twice as long as the title.
        wanted = ('これは広い幅の文字だけで構成されたタイトルです\n'
                  '##############################################'
                  '\n\n')
        self.assertEqual(result, wanted)

    def test_galleries_added_to_header(self):
        result = build_header(
            'test', None, None, None, None, None,
            attachments=['output/test1', 'output/test2'])
        wanted = ('test\n####\n'
                  ':attachments: output/test1, '
                  'output/test2\n\n')
        self.assertEqual(result, wanted)

    def test_galleries_added_to_markdown_header(self):
        result = build_markdown_header(
            'test', None, None, None, None, None,
            attachments=['output/test1', 'output/test2'])
        self.assertEqual(
            result,
            'Title: test\nAttachments: output/test1, output/test2\n\n')


@unittest.skipUnless(BeautifulSoup, 'Needs BeautifulSoup module')
@unittest.skipUnless(LXML, 'Needs lxml module')
class TestWordpressXMLAttachements(unittest.TestCase):
    """Tests for ``get_attachments`` on WORDPRESS_XML_SAMPLE and for
    ``download_attachments``.

    ``self.attachments`` is used as a mapping from a post name (or ``None``)
    to an indexable collection of attachment URLs.
    """

    def setUp(self):
        # Remember the current locale so tearDown can put it back, then run
        # the import under the 'C' locale.
        self.old_locale = locale.setlocale(locale.LC_ALL)
        locale.setlocale(locale.LC_ALL, str('C'))
        self.attachments = get_attachments(WORDPRESS_XML_SAMPLE)

    def tearDown(self):
        locale.setlocale(locale.LC_ALL, self.old_locale)

    def test_recognise_attachments(self):
        self.assertTrue(self.attachments)
        # assertEqual reports the actual number of keys on failure.
        self.assertEqual(3, len(self.attachments))

    def test_attachments_associated_with_correct_post(self):
        self.assertTrue(self.attachments)
        for post in self.attachments:
            urls = self.attachments[post]
            if post is None:
                expected = ('https://upload.wikimedia.org/wikipedia/commons/'
                            'thumb/2/2c/Pelican_lakes_entrance02.jpg/'
                            '240px-Pelican_lakes_entrance02.jpg')
                self.assertEqual(urls[0], expected)
            elif post == 'with-excerpt':
                expected_invalid = ('http://thisurlisinvalid.notarealdomain/'
                                    'not_an_image.jpg')
                expected_pelikan = ('http://en.wikipedia.org/wiki/'
                                    'File:Pelikan_Walvis_Bay.jpg')
                self.assertEqual(urls[0], expected_invalid)
                self.assertEqual(urls[1], expected_pelikan)
            elif post == 'with-tags':
                expected_invalid = 'http://thisurlisinvalid.notarealdomain'
                self.assertEqual(urls[0], expected_invalid)
            else:
                self.fail('all attachments should match to a '
                          'filename or None, {}'
                          .format(post))

    def test_download_attachments(self):
        # Build the path from components so it uses the platform separator,
        # like the expected suffix asserted below.
        real_file = os.path.join(CUR_DIR, 'content', 'article.rst')
        good_url = path_to_file_url(real_file)
        bad_url = 'http://localhost:1/not_a_file.txt'
        silent_da = mute()(download_attachments)
        with temporary_folder() as temp:
            locations = list(silent_da(temp, [good_url, bad_url]))
            # Only one location is expected back for the two URLs.
            self.assertEqual(1, len(locations))
            directory = locations[0]
            self.assertTrue(
                directory.endswith(os.path.join('content', 'article.rst')),
                directory)
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								# -*- coding: utf-8 -*-
 								from __future__ import print_function, unicode_literals
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								import locale
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								import os
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								import re
-												Fix for tests that were broken in #1607

											
										
										
											2015-02-10 20:59:57 -05:00
+								from codecs import open
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
-												control slug substitutions from settings with regex

											
										
										
											2018-08-07 17:35:16 +02:00
+								from pelican.settings import DEFAULT_CONFIG
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								from pelican.tests.support import (mute, skipIfNoExecutable, temporary_folder,
 								                                   unittest)
-												add blogger importer

											
										
										
											2018-08-07 14:06:46 +02:00
+								from pelican.tools.pelican_import import (blogger2fields, build_header,
 								                                          build_markdown_header,
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                                          decode_wp_content,
 								                                          download_attachments, fields2pelican,
 								                                          get_attachments, wp2fields)
 								from pelican.utils import path_to_file_url, slugify
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
+								CUR_DIR = os.path.abspath(os.path.dirname(__file__))
-												add blogger importer

											
										
										
											2018-08-07 14:06:46 +02:00
+								BLOGGER_XML_SAMPLE = os.path.join(CUR_DIR, 'content', 'bloggerexport.xml')
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								WORDPRESS_XML_SAMPLE = os.path.join(CUR_DIR, 'content', 'wordpressexport.xml')
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								WORDPRESS_ENCODED_CONTENT_SAMPLE = os.path.join(CUR_DIR,
 								                                                'content',
 								                                                'wordpress_content_encoded')
 								WORDPRESS_DECODED_CONTENT_SAMPLE = os.path.join(CUR_DIR,
 								                                                'content',
 								                                                'wordpress_content_decoded')
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
-												skip unless deps are installed in tests

											
										
										
											2012-06-10 21:56:06 +02:00
+								try:
-												Port pelican to python 3.

Stays compatible with 2.x series, thanks to an unified codebase.

											
										
										
											2013-01-11 02:57:43 +01:00
+								    from bs4 import BeautifulSoup
-												skip unless deps are installed in tests

											
										
										
											2012-06-10 21:56:06 +02:00
+								except ImportError:
 								    BeautifulSoup = False  # NOQA
-												add skips for tests relying on dev_requirements modules

											
										
										
											2015-04-11 22:45:31 +02:00
+								try:
 								    import bs4.builder._lxml as LXML
 								except ImportError:
 								    LXML = False
-												add blogger importer

											
										
										
											2018-08-07 14:06:46 +02:00
+								@skipIfNoExecutable(['pandoc', '--version'])
 								@unittest.skipUnless(BeautifulSoup, 'Needs BeautifulSoup module')
 								class TestBloggerXmlImporter(unittest.TestCase):
 								    def setUp(self):
 								        self.old_locale = locale.setlocale(locale.LC_ALL)
 								        locale.setlocale(locale.LC_ALL, str('C'))
 								        self.posts = list(blogger2fields(BLOGGER_XML_SAMPLE))
 								    def tearDown(self):
 								        locale.setlocale(locale.LC_ALL, self.old_locale)
 								    def test_recognise_kind_and_title(self):
 								        """Check that importer only outputs pages, articles and comments,
 								        that these are correctly identified and that titles are correct.
 								        """
 								        kinds = {x[8] for x in self.posts}
 								        self.assertEqual({'page', 'article', 'comment'}, kinds)
 								        page_titles = {x[0] for x in self.posts if x[8] == 'page'}
 								        self.assertEqual({'Test page', 'Test page 2'}, page_titles)
 								        article_titles = {x[0] for x in self.posts if x[8] == 'article'}
 								        self.assertEqual({'Black as Egypt\'s Night', 'The Steel Windpipe'},
 								                         article_titles)
 								        comment_titles = {x[0] for x in self.posts if x[8] == 'comment'}
 								        self.assertEqual({'Mishka, always a pleasure to read your '
 								                          'adventures!...'},
 								                         comment_titles)
 								    def test_recognise_status_with_correct_filename(self):
 								        """Check that importerer outputs only statuses 'published' and 'draft',
 								        that these are correctly identified and that filenames are correct.
 								        """
 								        statuses = {x[7] for x in self.posts}
 								        self.assertEqual({'published', 'draft'}, statuses)
 								        draft_filenames = {x[2] for x in self.posts if x[7] == 'draft'}
 								        # draft filenames are id-based
 								        self.assertEqual({'page-4386962582497458967',
 								                          'post-1276418104709695660'}, draft_filenames)
 								        published_filenames = {x[2] for x in self.posts if x[7] == 'published'}
 								        # published filenames are url-based, except comments
 								        self.assertEqual({'the-steel-windpipe',
 								                          'test-page',
 								                          'post-5590533389087749201'}, published_filenames)
-												refactor the check of executable for unit tests

pandoc was checked directly with a `os.system` call, and the output with version
and copyright of pandoc was displayed when running tests.

- replace the pandoc check with the `skipIfNoExecutable` function.
- in `skipIfNoExecutable`, the `valid_exit_code` is not needed, the executable
  is not found if an `OSError` exception is catched.

											
										
										
											2012-10-25 22:43:58 +02:00
+								@skipIfNoExecutable(['pandoc', '--version'])
 								@unittest.skipUnless(BeautifulSoup, 'Needs BeautifulSoup module')
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								class TestWordpressXmlImporter(unittest.TestCase):
 								    def setUp(self):
-												Make sure locale is what we want before/after the tests

The locale is a global state, and it was not properly reset to
whatever it was before the unitttest possibly changed it.
This is now fixed.

Not restoring the locale led to weird issues: depending on
the order chosen by "python -m unittest discover" to run
the unit tests, some tests would apparently randomly fail
due to the locale not being what was expected.

For example, test_period_in_timeperiod_archive would
call mock('posts/1970/ 1月/index.html',...) instead of
expected mock('posts/1970/Jan/index.html',...) and fail.

											
										
										
											2014-04-15 16:36:29 +02:00
+								        self.old_locale = locale.setlocale(locale.LC_ALL)
 								        locale.setlocale(locale.LC_ALL, str('C'))
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								        self.posts = list(wp2fields(WORDPRESS_XML_SAMPLE))
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								        self.custposts = list(wp2fields(WORDPRESS_XML_SAMPLE, True))
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
-												Make sure locale is what we want before/after the tests

The locale is a global state, and it was not properly reset to
whatever it was before the unitttest possibly changed it.
This is now fixed.

Not restoring the locale led to weird issues: depending on
the order chosen by "python -m unittest discover" to run
the unit tests, some tests would apparently randomly fail
due to the locale not being what was expected.

For example, test_period_in_timeperiod_archive would
call mock('posts/1970/ 1月/index.html',...) instead of
expected mock('posts/1970/Jan/index.html',...) and fail.

											
										
										
											2014-04-15 16:36:29 +02:00
+								    def tearDown(self):
 								        locale.setlocale(locale.LC_ALL, self.old_locale)
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								    def test_ignore_empty_posts(self):
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								        self.assertTrue(self.posts)
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        for (title, content, fname, date, author,
 								             categ, tags, status, kind, format) in self.posts:
 								                self.assertTrue(title.strip())
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
-												Import wordpress pages to pages/ subdir with --dir-page option

When importing from Wordpress, the --dir-page directive (disabled by
default) automatically adds files to the pages/ when they are recognised
as pages, as opposed to posts.

											
										
										
											2013-04-19 23:06:59 +01:00
+								    def test_recognise_page_kind(self):
 								        """ Check that we recognise pages in wordpress, as opposed to posts """
 								        self.assertTrue(self.posts)
 								        # Collect (title, filename, kind) of non-empty posts recognised as page
 								        pages_data = []
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        for (title, content, fname, date, author,
 								             categ, tags, status, kind, format) in self.posts:
 								                if kind == 'page':
 								                    pages_data.append((title, fname))
-												Import wordpress pages to pages/ subdir with --dir-page option

When importing from Wordpress, the --dir-page directive (disabled by
default) automatically adds files to the pages/ when they are recognised
as pages, as opposed to posts.

											
										
										
											2013-04-19 23:06:59 +01:00
+								        self.assertEqual(2, len(pages_data))
 								        self.assertEqual(('Page', 'contact'), pages_data[0])
 								        self.assertEqual(('Empty Page', 'empty'), pages_data[1])
 								    def test_dirpage_directive_for_page_kind(self):
 								        silent_f2p = mute(True)(fields2pelican)
 								        test_post = filter(lambda p: p[0].startswith("Empty Page"), self.posts)
 								        with temporary_folder() as temp:
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								            fname = list(silent_f2p(test_post, 'markdown',
 								                                    temp, dirpage=True))[0]
-												Import wordpress pages to pages/ subdir with --dir-page option

When importing from Wordpress, the --dir-page directive (disabled by
default) automatically adds files to the pages/ when they are recognised
as pages, as opposed to posts.

											
										
										
											2013-04-19 23:06:59 +01:00
+								            self.assertTrue(fname.endswith('pages%sempty.md' % os.path.sep))
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								    def test_dircat(self):
 								        silent_f2p = mute(True)(fields2pelican)
 								        test_posts = []
 								        for post in self.posts:
 								            # check post kind
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								            if len(post[5]) > 0:  # Has a category
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								                test_posts.append(post)
 								        with temporary_folder() as temp:
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								            fnames = list(silent_f2p(test_posts, 'markdown',
 								                                     temp, dircat=True))
-												control slug substitutions from settings with regex

											
										
										
											2018-08-07 17:35:16 +02:00
+								        subs = DEFAULT_CONFIG['SLUG_REGEX_SUBSTITUTIONS']
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								        index = 0
 								        for post in test_posts:
 								            name = post[2]
-												control slug substitutions from settings with regex

											
										
										
											2018-08-07 17:35:16 +02:00
+								            category = slugify(post[5][0], regex_subs=subs)
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								            name += '.md'
 								            filename = os.path.join(category, name)
 								            out_name = fnames[index]
 								            self.assertTrue(out_name.endswith(filename))
 								            index += 1
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								    def test_unless_custom_post_all_items_should_be_pages_or_posts(self):
 								        self.assertTrue(self.posts)
 								        pages_data = []
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        for (title, content, fname, date, author, categ,
 								             tags, status, kind, format) in self.posts:
 								                if kind == 'page' or kind == 'article':
 								                    pass
 								                else:
 								                    pages_data.append((title, fname))
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								        self.assertEqual(0, len(pages_data))
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								    def test_recognise_custom_post_type(self):
 								        self.assertTrue(self.custposts)
 								        cust_data = []
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        for (title, content, fname, date, author, categ,
 								             tags, status, kind, format) in self.custposts:
 								                if kind == 'article' or kind == 'page':
 								                    pass
 								                else:
 								                    cust_data.append((title, kind))
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								        self.assertEqual(3, len(cust_data))
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        self.assertEqual(
 								            ('A custom post in category 4', 'custom1'),
 								            cust_data[0])
 								        self.assertEqual(
 								            ('A custom post in category 5', 'custom1'),
 								            cust_data[1])
 								        self.assertEqual(
 								            ('A 2nd custom post type also in category 5', 'custom2'),
 								            cust_data[2])
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								    def test_custom_posts_put_in_own_dir(self):
 								        silent_f2p = mute(True)(fields2pelican)
 								        test_posts = []
 								        for post in self.custposts:
 								            # check post kind
-												Fix for tests that were broken in #1607

											
										
										
											2015-02-10 20:59:57 -05:00
+								            if post[8] == 'article' or post[8] == 'page':
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								                pass
 								            else:
 								                test_posts.append(post)
 								        with temporary_folder() as temp:
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								            fnames = list(silent_f2p(test_posts, 'markdown',
 								                                     temp, wp_custpost=True))
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								        index = 0
 								        for post in test_posts:
 								            name = post[2]
-												Fix for tests that were broken in #1607

											
										
										
											2015-02-10 20:59:57 -05:00
+								            kind = post[8]
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								            name += '.md'
 								            filename = os.path.join(kind, name)
 								            out_name = fnames[index]
 								            self.assertTrue(out_name.endswith(filename))
 								            index += 1
 								    def test_custom_posts_put_in_own_dir_and_catagory_sub_dir(self):
 								        silent_f2p = mute(True)(fields2pelican)
 								        test_posts = []
 								        for post in self.custposts:
 								            # check post kind
-												Fix for tests that were broken in #1607

											
										
										
											2015-02-10 20:59:57 -05:00
+								            if post[8] == 'article' or post[8] == 'page':
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								                pass
 								            else:
 								                test_posts.append(post)
 								        with temporary_folder() as temp:
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
+								            fnames = list(silent_f2p(test_posts, 'markdown', temp,
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                                     wp_custpost=True, dircat=True))
-												control slug substitutions from settings with regex

											
										
										
											2018-08-07 17:35:16 +02:00
+								        subs = DEFAULT_CONFIG['SLUG_REGEX_SUBSTITUTIONS']
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								        index = 0
 								        for post in test_posts:
 								            name = post[2]
-												Fix for tests that were broken in #1607

											
										
										
											2015-02-10 20:59:57 -05:00
+								            kind = post[8]
-												control slug substitutions from settings with regex

											
										
										
											2018-08-07 17:35:16 +02:00
+								            category = slugify(post[5][0], regex_subs=subs)
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								            name += '.md'
 								            filename = os.path.join(kind, category, name)
 								            out_name = fnames[index]
 								            self.assertTrue(out_name.endswith(filename))
 								            index += 1
 								    def test_wp_custpost_true_dirpage_false(self):
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        # pages should only be put in their own directory when dirpage = True
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								        silent_f2p = mute(True)(fields2pelican)
 								        test_posts = []
 								        for post in self.custposts:
 								            # check post kind
-												Fix for tests that were broken in #1607

											
										
										
											2015-02-10 20:59:57 -05:00
+								            if post[8] == 'page':
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								                test_posts.append(post)
 								        with temporary_folder() as temp:
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
+								            fnames = list(silent_f2p(test_posts, 'markdown', temp,
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                                     wp_custpost=True, dirpage=False))
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								        index = 0
 								        for post in test_posts:
 								            name = post[2]
 								            name += '.md'
 								            filename = os.path.join('pages', name)
 								            out_name = fnames[index]
 								            self.assertFalse(out_name.endswith(filename))
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								    def test_can_toggle_raw_html_code_parsing(self):
-												remove unittest2 and fix various warnings in py3

											
										
										
											2013-04-13 16:36:05 -04:00
+								        def r(f):
-												Fix for tests that were broken in #1607

											
										
										
											2015-02-10 20:59:57 -05:00
+								            with open(f, encoding='utf-8') as infile:
-												remove unittest2 and fix various warnings in py3

											
										
										
											2013-04-13 16:36:05 -04:00
+								                return infile.read()
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								        silent_f2p = mute(True)(fields2pelican)
 								        with temporary_folder() as temp:
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								            rst_files = (r(f) for f
 								                         in silent_f2p(self.posts, 'markdown', temp))
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								            self.assertTrue(any('<iframe' in rst for rst in rst_files))
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								            rst_files = (r(f) for f
 								                         in silent_f2p(self.posts, 'markdown',
 								                                       temp, strip_raw=True))
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								            self.assertFalse(any('<iframe' in rst for rst in rst_files))
 								            # no effect in rst
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								            rst_files = (r(f) for f in silent_f2p(self.posts, 'rst', temp))
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								            self.assertFalse(any('<iframe' in rst for rst in rst_files))
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								            rst_files = (r(f) for f in silent_f2p(self.posts, 'rst', temp,
-												pandoc is optional

											
										
										
											2012-06-10 13:27:36 +02:00
+								                         strip_raw=True))
-												Added strip raw option to wordpress xml importer

											
										
										
											2012-05-13 23:37:33 +02:00
+								            self.assertFalse(any('<iframe' in rst for rst in rst_files))
-												Decode HTML entities in titles on WP import

											
										
										
											2012-11-03 21:55:56 +10:00
 								    def test_decode_html_entities_in_titles(self):
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        test_posts = [post for post
 								                      in self.posts if post[2] == 'html-entity-test']
-												tests: Avoid hidden logic with better .assert*() method choices

We'll get better failure messages if we use an assertion method that
understands the comparison we're trying to make.  If you make the
comparison by hand and assertTrue(), you don't get much constructive
feedback ;).

											
										
										
											2013-06-12 14:52:23 -04:00
+								        self.assertEqual(len(test_posts), 1)
-												flake8-ed the tests

											
										
										
											2013-03-03 19:44:57 -08:00
-												Decode HTML entities in titles on WP import

											
										
										
											2012-11-03 21:55:56 +10:00
+								        post = test_posts[0]
 								        title = post[0]
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        self.assertTrue(title, "A normal post with some <html> entities in "
 								                               "the title. You can't miss them.")
-												tests: Avoid hidden logic with better .assert*() method choices

We'll get better failure messages if we use an assertion method that
understands the comparison we're trying to make.  If you make the
comparison by hand and assertTrue(), you don't get much constructive
feedback ;).

											
										
										
											2013-06-12 14:52:23 -04:00
+								        self.assertNotIn('&', title)
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
 								    def test_decode_wp_content_returns_empty(self):
 								        """ Check that given an empty string we return an empty string."""
 								        self.assertEqual(decode_wp_content(""), "")
 								    def test_decode_wp_content(self):
 								        """ Check that we can decode a wordpress content string."""
 								        with open(WORDPRESS_ENCODED_CONTENT_SAMPLE, 'r') as encoded_file:
 								            encoded_content = encoded_file.read()
 								            with open(WORDPRESS_DECODED_CONTENT_SAMPLE, 'r') as decoded_file:
 								                decoded_content = decoded_file.read()
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                self.assertEqual(
 								                    decode_wp_content(encoded_content, br=False),
 								                    decoded_content)
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
 								    def test_preserve_verbatim_formatting(self):
-												remove unittest2 and fix various warnings in py3

											
										
										
											2013-04-13 16:36:05 -04:00
+								        def r(f):
-												Fix for tests that were broken in #1607

											
										
										
											2015-02-10 20:59:57 -05:00
+								            with open(f, encoding='utf-8') as infile:
-												remove unittest2 and fix various warnings in py3

											
										
										
											2013-04-13 16:36:05 -04:00
+								                return infile.read()
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								        silent_f2p = mute(True)(fields2pelican)
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        test_post = filter(
 								            lambda p: p[0].startswith("Code in List"),
 								            self.posts)
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								        with temporary_folder() as temp:
 								            md = [r(f) for f in silent_f2p(test_post, 'markdown', temp)][0]
 								            self.assertTrue(re.search(r'\s+a = \[1, 2, 3\]', md))
 								            self.assertTrue(re.search(r'\s+b = \[4, 5, 6\]', md))
 								            for_line = re.search(r'\s+for i in zip\(a, b\):', md).group(0)
 								            print_line = re.search(r'\s+print i', md).group(0)
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								            self.assertTrue(
 								                for_line.rindex('for') < print_line.rindex('print'))
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
 								    def test_code_in_list(self):
-												remove unittest2 and fix various warnings in py3

											
										
										
											2013-04-13 16:36:05 -04:00
+								        def r(f):
-												Fix for tests that were broken in #1607

											
										
										
											2015-02-10 20:59:57 -05:00
+								            with open(f, encoding='utf-8') as infile:
-												remove unittest2 and fix various warnings in py3

											
										
										
											2013-04-13 16:36:05 -04:00
+								                return infile.read()
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								        silent_f2p = mute(True)(fields2pelican)
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        test_post = filter(
 								            lambda p: p[0].startswith("Code in List"),
 								            self.posts)
-												Added WordPress content decoding to importer

											
										
										
											2013-03-25 15:28:53 -04:00
+								        with temporary_folder() as temp:
 								            md = [r(f) for f in silent_f2p(test_post, 'markdown', temp)][0]
 								            sample_line = re.search(r'-   This is a code sample', md).group(0)
 								            code_line = re.search(r'\s+a = \[1, 2, 3\]', md).group(0)
 								            self.assertTrue(sample_line.rindex('This') < code_line.rindex('a'))
-												Handle east asian character column width in the importer

Fixes #682
Closes #923

											
										
										
											2013-10-08 09:46:40 +01:00
-												Add pandoc2 support to pelican-import. Fix #2255

Specific options are passed to pandoc2 in order to get results similar to
those of pandoc1:

- Disable smart quotes from the markdown output.

- Enable raw parsing from html.

											
										
										
											2018-06-26 18:47:42 +02:00
+								    def test_dont_use_smart_quotes(self):
 								        def r(f):
 								            with open(f, encoding='utf-8') as infile:
 								                return infile.read()
 								        silent_f2p = mute(True)(fields2pelican)
 								        test_post = filter(
 								            lambda p: p[0].startswith("Post with raw data"),
 								            self.posts)
 								        with temporary_folder() as temp:
 								            md = [r(f) for f in silent_f2p(test_post, 'markdown', temp)][0]
 								            escaped_quotes = re.search(r'\\[\'"“”‘’]', md)
 								            self.assertFalse(escaped_quotes)
-												Handle east asian character column width in the importer

Fixes #682
Closes #923

											
										
										
											2013-10-08 09:46:40 +01:00
 								class TestBuildHeader(unittest.TestCase):
 								    def test_build_header(self):
 								        header = build_header('test', None, None, None, None, None)
 								        self.assertEqual(header, 'test\n####\n\n')
-												Add tests for Pelican and pelican_import tool

Added tests to ensure that:
- THEME and deprecated *_DIR settings result in the expected configurations
- Post headers are formatted correctly in both Markdown and reStructuredText
- Files specified in IGNORE_FILES setting are properly ignored
- Generator.get_files()'s `paths` argument is backwards-compatible with strings

											
										
										
											2014-11-03 21:00:09 -08:00
+								    def test_build_header_with_fields(self):
 								        header_data = [
 								            'Test Post',
 								            '2014-11-04',
 								            'Alexis Métaireau',
 								            ['Programming'],
 								            ['Pelican', 'Python'],
 								            'test-post',
 								        ]
 								        expected_docutils = '\n'.join([
 								            'Test Post',
 								            '#########',
 								            ':date: 2014-11-04',
 								            ':author: Alexis Métaireau',
 								            ':category: Programming',
 								            ':tags: Pelican, Python',
 								            ':slug: test-post',
 								            '\n',
 								        ])
 								        expected_md = '\n'.join([
 								            'Title: Test Post',
 								            'Date: 2014-11-04',
 								            'Author: Alexis Métaireau',
 								            'Category: Programming',
 								            'Tags: Pelican, Python',
 								            'Slug: test-post',
 								            '\n',
 								        ])
 								        self.assertEqual(build_header(*header_data), expected_docutils)
 								        self.assertEqual(build_markdown_header(*header_data), expected_md)
-												Handle east asian character column width in the importer

Fixes #682
Closes #923

											
										
										
											2013-10-08 09:46:40 +01:00
+								    def test_build_header_with_east_asian_characters(self):
 								        header = build_header('これは広い幅の文字だけで構成されたタイトルです',
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                              None, None, None, None, None)
-												Handle east asian character column width in the importer

Fixes #682
Closes #923

											
										
										
											2013-10-08 09:46:40 +01:00
 								        self.assertEqual(header,
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                         ('これは広い幅の文字だけで構成されたタイトルです\n'
 								                          '##############################################'
 								                          '\n\n'))
-												Handle east asian character column width in the importer

Fixes #682
Closes #923

											
										
										
											2013-10-08 09:46:40 +01:00
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								    def test_galleries_added_to_header(self):
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								        header = build_header('test', None, None, None, None, None,
 								                              attachments=['output/test1', 'output/test2'])
 								        self.assertEqual(header, ('test\n####\n'
 								                                  ':attachments: output/test1, '
 								                                  'output/test2\n\n'))
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
 								    def test_galleries_added_to_markdown_header(self):
 								        header = build_markdown_header('test', None, None, None, None, None,
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                                       attachments=['output/test1',
 								                                                    'output/test2'])
 								        self.assertEqual(
 								            header,
 								            'Title: test\nAttachments: output/test1, output/test2\n\n')
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
-												Add tests for Pelican and pelican_import tool

Added tests to ensure that:
- THEME and deprecated *_DIR settings result in the expected configurations
- Post headers are formatted correctly in both Markdown and reStructuredText
- Files specified in IGNORE_FILES setting are properly ignored
- Generator.get_files()'s `paths` argument is backwards-compatible with strings

											
										
										
											2014-11-03 21:00:09 -08:00
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
+								@unittest.skipUnless(BeautifulSoup, 'Needs BeautifulSoup module')
-												add skips for tests relying on dev_requirements modules

											
										
										
											2015-04-11 22:45:31 +02:00
+								@unittest.skipUnless(LXML, 'Needs lxml module')
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
+								class TestWordpressXMLAttachements(unittest.TestCase):
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								    def setUp(self):
-												Make sure locale is what we want before/after the tests

The locale is a global state, and it was not properly reset to
whatever it was before the unitttest possibly changed it.
This is now fixed.

Not restoring the locale led to weird issues: depending on
the order chosen by "python -m unittest discover" to run
the unit tests, some tests would apparently randomly fail
due to the locale not being what was expected.

For example, test_period_in_timeperiod_archive would
call mock('posts/1970/ 1月/index.html',...) instead of
expected mock('posts/1970/Jan/index.html',...) and fail.

											
										
										
											2014-04-15 16:36:29 +02:00
+								        self.old_locale = locale.setlocale(locale.LC_ALL)
 								        locale.setlocale(locale.LC_ALL, str('C'))
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								        self.attachments = get_attachments(WORDPRESS_XML_SAMPLE)
-												multiple authors implemented

											
										
										
											2013-07-05 01:08:45 +02:00
-												Make sure locale is what we want before/after the tests

The locale is global state, and it was not properly reset to
whatever it was before the unit tests possibly changed it.
This is now fixed.

Not restoring the locale led to weird issues: depending on
the order chosen by "python -m unittest discover" to run
the unit tests, some tests would apparently randomly fail
due to the locale not being what was expected.

For example, test_period_in_timeperiod_archive would
call mock('posts/1970/ 1月/index.html',...) instead of
expected mock('posts/1970/Jan/index.html',...) and fail.

											
										
										
											2014-04-15 16:36:29 +02:00
+								    def tearDown(self):
 								        locale.setlocale(locale.LC_ALL, self.old_locale)
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								    def test_recognise_attachments(self):
 								        self.assertTrue(self.attachments)
 								        self.assertTrue(len(self.attachments.keys()) == 3)
 								    def test_attachments_associated_with_correct_post(self):
 								        self.assertTrue(self.attachments)
 								        for post in self.attachments.keys():
 								            if post is None:
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                expected = ('https://upload.wikimedia.org/wikipedia/commons/'
 								                            'thumb/2/2c/Pelican_lakes_entrance02.jpg/'
 								                            '240px-Pelican_lakes_entrance02.jpg')
 								                self.assertEqual(self.attachments[post][0], expected)
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								            elif post == 'with-excerpt':
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                expected_invalid = ('http://thisurlisinvalid.notarealdomain/'
 								                                    'not_an_image.jpg')
 								                expected_pelikan = ('http://en.wikipedia.org/wiki/'
 								                                    'File:Pelikan_Walvis_Bay.jpg')
 								                self.assertEqual(self.attachments[post][0], expected_invalid)
 								                self.assertEqual(self.attachments[post][1], expected_pelikan)
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								            elif post == 'with-tags':
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                expected_invalid = ('http://thisurlisinvalid.notarealdomain')
 								                self.assertEqual(self.attachments[post][0], expected_invalid)
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
+								            else:
-												fulfil pep8 standard

											
										
										
											2015-06-16 09:25:09 +02:00
+								                self.fail('all attachments should match to a '
 								                          'filename or None, {}'
 								                          .format(post))
-												Extra functionality for pelican-import for wordpress imports

											
										
										
											2014-01-10 16:09:29 +00:00
 								    def test_download_attachments(self):
 								        """Check download_attachments with one file URL and one bad URL.

 								        A file URL built from content/article.rst and a URL on localhost
 								        port 1 are passed together; the test expects exactly one location
 								        back, and that location must end in content/article.rst.
 								        """
 								        article_path = os.path.join(CUR_DIR, 'content/article.rst')
 								        urls = [
 								            path_to_file_url(article_path),
 								            'http://localhost:1/not_a_file.txt',
 								        ]
 								        # mute() wraps the callable -- presumably to silence its output
 								        # while the bad URL is attempted; confirm in tests.support.
 								        quiet_download = mute()(download_attachments)
 								        expected_tail = os.path.join('content', 'article.rst')
 								        with temporary_folder() as workdir:
 								            saved = list(quiet_download(workdir, urls))
 								            # Only one of the two URLs is expected to produce a location.
 								            self.assertEqual(1, len(saved))
 								            saved_path = saved[0]
 								            # The path itself is the failure message, to ease debugging.
 								            self.assertTrue(saved_path.endswith(expected_tail), saved_path)