cpython/Lib/test/test_source_encoding.py

# -*- coding: koi8-r -*-

import unittest
from test.support import TESTFN, unlink, unload, rmtree, script_helper, captured_stdout
import importlib
import os
import sys
import subprocess
import tempfile

class MiscSourceEncodingTest(unittest.TestCase):

    def test_pep263(self):
        self.assertEqual(
            "<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>".encode("utf-8"),
            b'\xd0\x9f\xd0\xb8\xd1\x82\xd0\xbe\xd0\xbd'
        )
        self.assertEqual(
            "\<EFBFBD>".encode("utf-8"),
            b'\\\xd0\x9f'
        )

    def test_compilestring(self):
        # see #1882
        c = compile(b"\n# coding: utf-8\nu = '\xc3\xb3'\n", "dummy", "exec")
        d = {}
        exec(c, d)
        self.assertEqual(d['u'], '\xf3')

    def test_issue2301(self):
        try:
            compile(b"# coding: cp932\nprint '\x94\x4e'", "dummy", "exec")
        except SyntaxError as v:
            self.assertEqual(v.text, "print '\u5e74'\n")
        else:
            self.fail()

    def test_issue4626(self):
        c = compile("# coding=latin-1\n\u00c6 = '\u00c6'", "dummy", "exec")
        d = {}
        exec(c, d)
        self.assertEqual(d['\xc6'], '\xc6')

    def test_issue3297(self):
        c = compile("a, b = '\U0001010F', '\\U0001010F'", "dummy", "exec")
        d = {}
        exec(c, d)
        self.assertEqual(d['a'], d['b'])
        self.assertEqual(len(d['a']), len(d['b']))
        self.assertEqual(ascii(d['a']), ascii(d['b']))

    def test_issue7820(self):
        # Ensure that check_bom() restores all bytes in the right order if
        # check_bom() fails in pydebug mode: a buffer starts with the first
        # byte of a valid BOM, but next bytes are different

        # one byte in common with the UTF-16-LE BOM
        self.assertRaises(SyntaxError, eval, b'\xff\x20')

        # two bytes in common with the UTF-8 BOM
        self.assertRaises(SyntaxError, eval, b'\xef\xbb\x20')

    def test_20731(self):
        sub = subprocess.Popen([sys.executable,
                        os.path.join(os.path.dirname(__file__),
                                     'coding20731.py')],
                        stderr=subprocess.PIPE)
        err = sub.communicate()[1]
        self.assertEqual(sub.returncode, 0)
        self.assertNotIn(b'SyntaxError', err)

    def test_error_message(self):
        compile(b'# -*- coding: iso-8859-15 -*-\n', 'dummy', 'exec')
        compile(b'\xef\xbb\xbf\n', 'dummy', 'exec')
        compile(b'\xef\xbb\xbf# -*- coding: utf-8 -*-\n', 'dummy', 'exec')
        with self.assertRaisesRegex(SyntaxError, 'fake'):
            compile(b'# -*- coding: fake -*-\n', 'dummy', 'exec')
        with self.assertRaisesRegex(SyntaxError, 'iso-8859-15'):
            compile(b'\xef\xbb\xbf# -*- coding: iso-8859-15 -*-\n',
                    'dummy', 'exec')
        with self.assertRaisesRegex(SyntaxError, 'BOM'):
            compile(b'\xef\xbb\xbf# -*- coding: iso-8859-15 -*-\n',
                    'dummy', 'exec')
        with self.assertRaisesRegex(SyntaxError, 'fake'):
            compile(b'\xef\xbb\xbf# -*- coding: fake -*-\n', 'dummy', 'exec')
        with self.assertRaisesRegex(SyntaxError, 'BOM'):
            compile(b'\xef\xbb\xbf# -*- coding: fake -*-\n', 'dummy', 'exec')

    def test_bad_coding(self):
        module_name = 'bad_coding'
        self.verify_bad_module(module_name)

    def test_bad_coding2(self):
        module_name = 'bad_coding2'
        self.verify_bad_module(module_name)

    def verify_bad_module(self, module_name):
        self.assertRaises(SyntaxError, __import__, 'test.' + module_name)

        path = os.path.dirname(__file__)
        filename = os.path.join(path, module_name + '.py')
        with open(filename, "rb") as fp:
            bytes = fp.read()
        self.assertRaises(SyntaxError, compile, bytes, filename, 'exec')

    def test_exec_valid_coding(self):
        d = {}
        exec(b'# coding: cp949\na = "\xaa\xa7"\n', d)
        self.assertEqual(d['a'], '\u3047')

    def test_file_parse(self):
        # issue1134: all encodings outside latin-1 and utf-8 fail on
        # multiline strings and long lines (>512 columns)
        unload(TESTFN)
        filename = TESTFN + ".py"
        f = open(filename, "w", encoding="cp1252")
        sys.path.insert(0, os.curdir)
        try:
            with f:
                f.write("# -*- coding: cp1252 -*-\n")
                f.write("'''A short string\n")
                f.write("'''\n")
                f.write("'A very long string %s'\n" % ("X" * 1000))

            importlib.invalidate_caches()
            __import__(TESTFN)
        finally:
            del sys.path[0]
            unlink(filename)
            unlink(filename + "c")
            unlink(filename + "o")
            unload(TESTFN)
            rmtree('__pycache__')

    def test_error_from_string(self):
        # See http://bugs.python.org/issue6289
        input = "# coding: ascii\n\N{SNOWMAN}".encode('utf-8')
        with self.assertRaises(SyntaxError) as c:
            compile(input, "<string>", "exec")
        expected = "'ascii' codec can't decode byte 0xe2 in position 16: " \
                   "ordinal not in range(128)"
        self.assertTrue(c.exception.args[0].startswith(expected),
                        msg=c.exception.args[0])


class AbstractSourceEncodingTest:
    # Mixin holding the encoding-detection scenarios.  A concrete subclass
    # supplies check_script_output(src, expected), which is handed the
    # script bytes and the bytes the script is expected to print.
    #
    # Every scenario prints ascii() of a string literal made of the bytes
    # C3 A4.  Read as UTF-8 that is U+00E4; read as ISO-8859-15 it is
    # U+00C3 followed by U+20AC.

    _PRINT_STMT = b'print(ascii("\xc3\xa4"))\n'
    _READ_AS_UTF8 = br"'\xe4'"
    _READ_AS_ISO8859_15 = br"'\xc3\u20ac'"

    def test_default_coding(self):
        # Neither cookie nor BOM.
        self.check_script_output(self._PRINT_STMT, self._READ_AS_UTF8)

    def test_first_coding_line(self):
        # Cookie on line 1.
        script = b'#coding:iso8859-15\n' + self._PRINT_STMT
        self.check_script_output(script, self._READ_AS_ISO8859_15)

    def test_second_coding_line(self):
        # Cookie on line 2, after a plain comment line.
        script = b'#\n' + b'#coding:iso8859-15\n' + self._PRINT_STMT
        self.check_script_output(script, self._READ_AS_ISO8859_15)

    def test_third_coding_line(self):
        # Only first two lines are tested for a magic comment.
        script = b'#\n' + b'#\n' + b'#coding:iso8859-15\n' + self._PRINT_STMT
        self.check_script_output(script, self._READ_AS_UTF8)

    def test_double_coding_line(self):
        # If the first line matches the second line is ignored.
        script = (b'#coding:iso8859-15\n' + b'#coding:latin1\n'
                  + self._PRINT_STMT)
        self.check_script_output(script, self._READ_AS_ISO8859_15)

    def test_double_coding_same_line(self):
        # Two cookies on one line: the expected output is the ISO-8859-15
        # reading, i.e. the first cookie is the one that counts.
        script = b'#coding:iso8859-15 coding:latin1\n' + self._PRINT_STMT
        self.check_script_output(script, self._READ_AS_ISO8859_15)

    def test_first_non_utf8_coding_line(self):
        # The cookie line itself carries a byte (A4) that is not valid UTF-8.
        script = b'#coding:iso-8859-15 \xa4\n' + self._PRINT_STMT
        self.check_script_output(script, self._READ_AS_ISO8859_15)

    def test_second_non_utf8_coding_line(self):
        # Same as above, with the cookie on line 2 after an empty line.
        script = b'\n' + b'#coding:iso-8859-15 \xa4\n' + self._PRINT_STMT
        self.check_script_output(script, self._READ_AS_ISO8859_15)

    def test_utf8_bom(self):
        # UTF-8 BOM and no cookie.
        script = b'\xef\xbb\xbf' + self._PRINT_STMT
        self.check_script_output(script, self._READ_AS_UTF8)

    def test_utf8_bom_and_utf8_coding_line(self):
        # UTF-8 BOM together with an agreeing utf-8 cookie.
        script = b'\xef\xbb\xbf#coding:utf-8\n' + self._PRINT_STMT
        self.check_script_output(script, self._READ_AS_UTF8)


class BytesSourceEncodingTest(AbstractSourceEncodingTest, unittest.TestCase):
    # Runs every inherited scenario in-process by handing the script bytes
    # directly to exec() and capturing what it prints.

    def check_script_output(self, src, expected):
        with captured_stdout() as captured:
            exec(src)
        # Encode first and strip afterwards, so both the stripping and the
        # comparison are done on bytes.
        printed = captured.getvalue().encode('latin1')
        self.assertEqual(printed.rstrip(), expected)


class FileSourceEncodingTest(AbstractSourceEncodingTest, unittest.TestCase):
    # Runs every inherited scenario by writing the script bytes to a file
    # in a temporary directory and executing that file with
    # script_helper.assert_python_ok().

    def check_script_output(self, src, expected):
        with tempfile.TemporaryDirectory() as workdir:
            script_path = os.path.join(workdir, 'test.py')
            with open(script_path, 'wb') as script_file:
                script_file.write(src)
            # Must run before the temporary directory is removed.
            result = script_helper.assert_python_ok(script_path)
        self.assertEqual(result.out.rstrip(), expected)


# Run the tests in this module when the file is executed as a script.
if __name__ == "__main__":
    unittest.main()
-												Merged revisions 69576,69579-69580,69589,69619-69620,69633,69703-69704,69728-69730 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r69576 | georg.brandl | 2009-02-13 04:56:50 -0600 (Fri, 13 Feb 2009) | 1 line

  #1661108: note that urlsafe encoded string can contain "=".
........
  r69579 | georg.brandl | 2009-02-13 05:06:59 -0600 (Fri, 13 Feb 2009) | 2 lines

  Fix warnings GCC emits where the argument of PyErr_Format is a single variable.
........
  r69580 | georg.brandl | 2009-02-13 05:10:04 -0600 (Fri, 13 Feb 2009) | 2 lines

  Fix warnings GCC emits where the argument of PyErr_Format is a single variable.
........
  r69589 | martin.v.loewis | 2009-02-13 14:11:34 -0600 (Fri, 13 Feb 2009) | 2 lines

  Move amd64 properties further to the top, so that they override
  the linker options correctly.
........
  r69619 | benjamin.peterson | 2009-02-14 11:00:51 -0600 (Sat, 14 Feb 2009) | 1 line

  this needn't be a shebang line
........
  r69620 | georg.brandl | 2009-02-14 11:01:36 -0600 (Sat, 14 Feb 2009) | 1 line

  #5179: don't leak PIPE fds when child execution fails.
........
  r69633 | hirokazu.yamamoto | 2009-02-15 03:19:48 -0600 (Sun, 15 Feb 2009) | 1 line

  Fixed typo.
........
  r69703 | raymond.hettinger | 2009-02-16 16:42:54 -0600 (Mon, 16 Feb 2009) | 3 lines

  Issue 5229: Documentation for super() neglects to say what super() actually does
........
  r69704 | raymond.hettinger | 2009-02-16 17:00:25 -0600 (Mon, 16 Feb 2009) | 1 line

  Add explanation for super(type1, type2).
........
  r69728 | georg.brandl | 2009-02-17 18:22:55 -0600 (Tue, 17 Feb 2009) | 2 lines

  #5297: fix example.
........
  r69729 | georg.brandl | 2009-02-17 18:25:13 -0600 (Tue, 17 Feb 2009) | 2 lines

  #5296: sequence -> iterable.
........
  r69730 | georg.brandl | 2009-02-17 18:31:36 -0600 (Tue, 17 Feb 2009) | 2 lines

  #5268: mention VMSError.
........

											
										
										
											2009-02-19 12:22:03 +08:00
+								# -*- coding: koi8-r -*-
-												Merged revisions 69617 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r69617 | benjamin.peterson | 2009-02-14 10:51:03 -0600 (Sat, 14 Feb 2009) | 1 line

  we're no longer using CVS, so this doesn't have to be binary
........

											
										
										
											2009-02-15 01:00:16 +08:00
 								import unittest
-												Added new tests for detecting Python source code encoding.

											
										
										
											2016-03-21 04:29:40 +08:00
+								from test.support import TESTFN, unlink, unload, rmtree, script_helper, captured_stdout
-												Issue #18048: Merge test_pep263.py and test_coding.py into test_source_encoding.py.

											
										
										
											2013-06-13 15:08:00 +08:00
+								import importlib
 								import os
 								import sys
-												Merge with 3.3

											
										
										
											2014-02-28 22:43:36 +08:00
+								import subprocess
-												Added new tests for detecting Python source code encoding.

											
										
										
											2016-03-21 04:29:40 +08:00
+								import tempfile
-												Merged revisions 69617 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r69617 | benjamin.peterson | 2009-02-14 10:51:03 -0600 (Sat, 14 Feb 2009) | 1 line

  we're no longer using CVS, so this doesn't have to be binary
........

											
										
										
											2009-02-15 01:00:16 +08:00
-												Added new tests for detecting Python source code encoding.

											
										
										
											2016-03-21 04:29:40 +08:00
+								class MiscSourceEncodingTest(unittest.TestCase):
-												Merged revisions 69617 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r69617 | benjamin.peterson | 2009-02-14 10:51:03 -0600 (Sat, 14 Feb 2009) | 1 line

  we're no longer using CVS, so this doesn't have to be binary
........

											
										
										
											2009-02-15 01:00:16 +08:00
 								    def test_pep263(self):
 								        self.assertEqual(
 								            "<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>".encode("utf-8"),
 								            b'\xd0\x9f\xd0\xb8\xd1\x82\xd0\xbe\xd0\xbd'
 								        )
 								        self.assertEqual(
 								            "\<EFBFBD>".encode("utf-8"),
 								            b'\\\xd0\x9f'
 								        )
 								    def test_compilestring(self):
 								        # see #1882
 								        c = compile(b"\n# coding: utf-8\nu = '\xc3\xb3'\n", "dummy", "exec")
 								        d = {}
 								        exec(c, d)
 								        self.assertEqual(d['u'], '\xf3')
 								    def test_issue2301(self):
 								        try:
 								            compile(b"# coding: cp932\nprint '\x94\x4e'", "dummy", "exec")
 								        except SyntaxError as v:
-												#9424: Replace deprecated assert* methods in the Python test suite.

											
										
										
											2010-11-21 03:04:17 +08:00
+								            self.assertEqual(v.text, "print '\u5e74'\n")
-												Merged revisions 69617 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r69617 | benjamin.peterson | 2009-02-14 10:51:03 -0600 (Sat, 14 Feb 2009) | 1 line

  we're no longer using CVS, so this doesn't have to be binary
........

											
										
										
											2009-02-15 01:00:16 +08:00
+								        else:
 								            self.fail()
-												ignore the coding cookie in compile(), exec(), and eval() if the source is a string #4626

											
										
										
											2009-03-03 07:31:26 +08:00
+								    def test_issue4626(self):
 								        c = compile("# coding=latin-1\n\u00c6 = '\u00c6'", "dummy", "exec")
 								        d = {}
 								        exec(c, d)
-												#9424: Replace deprecated assert* methods in the Python test suite.

											
										
										
											2010-11-21 03:04:17 +08:00
+								        self.assertEqual(d['\xc6'], '\xc6')
-												ignore the coding cookie in compile(), exec(), and eval() if the source is a string #4626

											
										
										
											2009-03-03 07:31:26 +08:00
-												in wide builds, avoid storing high unicode characters from source code with surrogates

This is accomplished by decoding with utf-32 instead of utf-16 on all builds.
The patch is by Adam Olsen.

											
										
										
											2009-10-29 05:59:39 +08:00
+								    def test_issue3297(self):
 								        c = compile("a, b = '\U0001010F', '\\U0001010F'", "dummy", "exec")
 								        d = {}
 								        exec(c, d)
 								        self.assertEqual(d['a'], d['b'])
 								        self.assertEqual(len(d['a']), len(d['b']))
 								        self.assertEqual(ascii(d['a']), ascii(d['b']))
-												Merged revisions 78603 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r78603 | victor.stinner | 2010-03-03 00:20:02 +0100 (mer., 03 mars 2010) | 5 lines

  Issue #7820: The parser tokenizer restores all bytes in the right order if the BOM
  check fails.

  Fix an assertion in pydebug mode.
........

											
										
										
											2010-03-03 08:18:49 +08:00
+								    def test_issue7820(self):
 								        # Ensure that check_bom() restores all bytes in the right order if
 								        # check_bom() fails in pydebug mode: a buffer starts with the first
 								        # byte of a valid BOM, but next bytes are different
 								        # one byte in common with the UTF-16-LE BOM
 								        self.assertRaises(SyntaxError, eval, b'\xff\x20')
 								        # two bytes in common with the UTF-8 BOM
 								        self.assertRaises(SyntaxError, eval, b'\xef\xbb\x20')
-												Merge with 3.3

											
										
										
											2014-02-28 22:43:36 +08:00
+								    def test_20731(self):
-												Reindent

											
										
										
											2014-02-28 22:49:06 +08:00
+								        sub = subprocess.Popen([sys.executable,
-												Merge with 3.3

											
										
										
											2014-02-28 22:43:36 +08:00
+								                        os.path.join(os.path.dirname(__file__),
 								                                     'coding20731.py')],
 								                        stderr=subprocess.PIPE)
 								        err = sub.communicate()[1]
-												merge 3.3

											
										
										
											2014-03-01 23:34:22 +08:00
+								        self.assertEqual(sub.returncode, 0)
 								        self.assertNotIn(b'SyntaxError', err)
-												Merge with 3.3

											
										
										
											2014-02-28 22:43:36 +08:00
-												Issue #18038: SyntaxError raised during compilation sources with illegal
encoding now always contains an encoding name.

											
										
										
											2013-06-09 21:51:52 +08:00
+								    def test_error_message(self):
 								        compile(b'# -*- coding: iso-8859-15 -*-\n', 'dummy', 'exec')
 								        compile(b'\xef\xbb\xbf\n', 'dummy', 'exec')
 								        compile(b'\xef\xbb\xbf# -*- coding: utf-8 -*-\n', 'dummy', 'exec')
-												Stop using the deprecated unittest.TestCase.assertRaisesRegexp()

											
										
										
											2013-06-16 23:37:57 +08:00
+								        with self.assertRaisesRegex(SyntaxError, 'fake'):
-												Issue #18038: SyntaxError raised during compilation sources with illegal
encoding now always contains an encoding name.

											
										
										
											2013-06-09 21:51:52 +08:00
+								            compile(b'# -*- coding: fake -*-\n', 'dummy', 'exec')
-												Stop using the deprecated unittest.TestCase.assertRaisesRegexp()

											
										
										
											2013-06-16 23:37:57 +08:00
+								        with self.assertRaisesRegex(SyntaxError, 'iso-8859-15'):
-												Issue #18038: SyntaxError raised during compilation sources with illegal
encoding now always contains an encoding name.

											
										
										
											2013-06-09 21:51:52 +08:00
+								            compile(b'\xef\xbb\xbf# -*- coding: iso-8859-15 -*-\n',
 								                    'dummy', 'exec')
-												Stop using the deprecated unittest.TestCase.assertRaisesRegexp()

											
										
										
											2013-06-16 23:37:57 +08:00
+								        with self.assertRaisesRegex(SyntaxError, 'BOM'):
-												Issue #18038: SyntaxError raised during compilation sources with illegal
encoding now always contains an encoding name.

											
										
										
											2013-06-09 21:51:52 +08:00
+								            compile(b'\xef\xbb\xbf# -*- coding: iso-8859-15 -*-\n',
 								                    'dummy', 'exec')
-												Stop using the deprecated unittest.TestCase.assertRaisesRegexp()

											
										
										
											2013-06-16 23:37:57 +08:00
+								        with self.assertRaisesRegex(SyntaxError, 'fake'):
-												Issue #18038: SyntaxError raised during compilation sources with illegal
encoding now always contains an encoding name.

											
										
										
											2013-06-09 21:51:52 +08:00
+								            compile(b'\xef\xbb\xbf# -*- coding: fake -*-\n', 'dummy', 'exec')
-												Stop using the deprecated unittest.TestCase.assertRaisesRegexp()

											
										
										
											2013-06-16 23:37:57 +08:00
+								        with self.assertRaisesRegex(SyntaxError, 'BOM'):
-												Issue #18038: SyntaxError raised during compilation sources with illegal
encoding now always contains an encoding name.

											
										
										
											2013-06-09 21:51:52 +08:00
+								            compile(b'\xef\xbb\xbf# -*- coding: fake -*-\n', 'dummy', 'exec')
-												- Fix segfault with invalid coding.
- SF Bug #772896, unknown encoding results in MemoryError, which is not helpful

I will only backport the segfault fix.  I'll let Anthony decide if he wants
the other changes backported.  I will do the backport if asked.

											
										
										
											2005-10-02 09:48:49 +08:00
 								    def test_bad_coding(self):
 								        module_name = 'bad_coding'
-												Fix Bug #1378022, UTF-8 files with a leading BOM crashed the interpreter.

Needs backport.

											
										
										
											2005-12-18 13:29:30 +08:00
+								        self.verify_bad_module(module_name)
 								    def test_bad_coding2(self):
 								        module_name = 'bad_coding2'
 								        self.verify_bad_module(module_name)
 								    def verify_bad_module(self, module_name):
-												- Fix segfault with invalid coding.
- SF Bug #772896, unknown encoding results in MemoryError, which is not helpful

I will only backport the segfault fix.  I'll let Anthony decide if he wants
the other changes backported.  I will do the backport if asked.

											
										
										
											2005-10-02 09:48:49 +08:00
+								        self.assertRaises(SyntaxError, __import__, 'test.' + module_name)
 								        path = os.path.dirname(__file__)
 								        filename = os.path.join(path, module_name + '.py')
-												Merged revisions 79030-79032 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r79030 | florent.xicluna | 2010-03-17 20:05:04 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup in test_import and test_coding.
........
  r79031 | florent.xicluna | 2010-03-17 20:15:56 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup some test cases using check_warnings and check_py3k_warnings.
........
  r79032 | florent.xicluna | 2010-03-17 21:05:11 +0100 (mer, 17 mar 2010) | 2 lines

  Fix and check cgi module deprecation warnings.  Revert an unwanted rename in test_import.
........

											
										
										
											2010-03-18 04:29:51 +08:00
+								        with open(filename, "rb") as fp:
 								            bytes = fp.read()
-												ignore the coding cookie in compile(), exec(), and eval() if the source is a string #4626

											
										
										
											2009-03-03 07:31:26 +08:00
+								        self.assertRaises(SyntaxError, compile, bytes, filename, 'exec')
-												- Fix segfault with invalid coding.
- SF Bug #772896, unknown encoding results in MemoryError, which is not helpful

I will only backport the segfault fix.  I'll let Anthony decide if he wants
the other changes backported.  I will do the backport if asked.

											
										
										
											2005-10-02 09:48:49 +08:00
-												Fix problem when exec'ing a string with a coding

											
										
										
											2007-08-12 05:31:25 +08:00
+								    def test_exec_valid_coding(self):
 								        d = {}
-												Issue #18202: Fix minor bugs and cleanup test_source_encoding.py.

											
										
										
											2013-06-19 15:29:58 +08:00
+								        exec(b'# coding: cp949\na = "\xaa\xa7"\n', d)
 								        self.assertEqual(d['a'], '\u3047')
-												Fix problem when exec'ing a string with a coding

											
										
										
											2007-08-12 05:31:25 +08:00
-												Correction for issue1134: all source files with a coding spec, except latin-1
and utf-8, crashed when parsing a multiline string, or a line longer than 512
columns.

											
										
										
											2007-11-16 07:19:43 +08:00
+								    def test_file_parse(self):
 								        # issue1134: all encodings outside latin-1 and utf-8 fail on
 								        # multiline strings and long lines (>512 columns)
-												Merged revisions 79030-79032 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r79030 | florent.xicluna | 2010-03-17 20:05:04 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup in test_import and test_coding.
........
  r79031 | florent.xicluna | 2010-03-17 20:15:56 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup some test cases using check_warnings and check_py3k_warnings.
........
  r79032 | florent.xicluna | 2010-03-17 21:05:11 +0100 (mer, 17 mar 2010) | 2 lines

  Fix and check cgi module deprecation warnings.  Revert an unwanted rename in test_import.
........

											
										
										
											2010-03-18 04:29:51 +08:00
+								        unload(TESTFN)
-												Correct a failing test when test_import is run after test_coding:
be sure to import a fresh module by removing it from sys.modules

											
										
										
											2007-11-16 08:56:23 +08:00
+								        filename = TESTFN + ".py"
-												Issue #18202: Fix minor bugs and cleanup test_source_encoding.py.

											
										
										
											2013-06-19 15:29:58 +08:00
+								        f = open(filename, "w", encoding="cp1252")
 								        sys.path.insert(0, os.curdir)
-												Correction for issue1134: all source files with a coding spec, except latin-1
and utf-8, crashed when parsing a multiline string, or a line longer than 512
columns.

											
										
										
											2007-11-16 07:19:43 +08:00
+								        try:
-												Issue #18202: Fix minor bugs and cleanup test_source_encoding.py.

											
										
										
											2013-06-19 15:29:58 +08:00
+								            with f:
 								                f.write("# -*- coding: cp1252 -*-\n")
 								                f.write("'''A short string\n")
 								                f.write("'''\n")
 								                f.write("'A very long string %s'\n" % ("X" * 1000))
-												Correction for issue1134: all source files with a coding spec, except latin-1
and utf-8, crashed when parsing a multiline string, or a line longer than 512
columns.

											
										
										
											2007-11-16 07:19:43 +08:00
-												Fix an import race condition.

											
										
										
											2012-04-15 03:06:17 +08:00
+								            importlib.invalidate_caches()
-												Correct a failing test when test_import is run after test_coding:
be sure to import a fresh module by removing it from sys.modules

											
										
										
											2007-11-16 08:56:23 +08:00
+								            __import__(TESTFN)
-												Correction for issue1134: all source files with a coding spec, except latin-1
and utf-8, crashed when parsing a multiline string, or a line longer than 512
columns.

											
										
										
											2007-11-16 07:19:43 +08:00
+								        finally:
-												Issue #18202: Fix minor bugs and cleanup test_source_encoding.py.

											
										
										
											2013-06-19 15:29:58 +08:00
+								            del sys.path[0]
-												Merged revisions 79030-79032 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r79030 | florent.xicluna | 2010-03-17 20:05:04 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup in test_import and test_coding.
........
  r79031 | florent.xicluna | 2010-03-17 20:15:56 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup some test cases using check_warnings and check_py3k_warnings.
........
  r79032 | florent.xicluna | 2010-03-17 21:05:11 +0100 (mer, 17 mar 2010) | 2 lines

  Fix and check cgi module deprecation warnings.  Revert an unwanted rename in test_import.
........

											
										
										
											2010-03-18 04:29:51 +08:00
+								            unlink(filename)
 								            unlink(filename + "c")
-												Issue #18202: Fix minor bugs and cleanup test_source_encoding.py.

											
										
										
											2013-06-19 15:29:58 +08:00
+								            unlink(filename + "o")
-												Merged revisions 79030-79032 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r79030 | florent.xicluna | 2010-03-17 20:05:04 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup in test_import and test_coding.
........
  r79031 | florent.xicluna | 2010-03-17 20:15:56 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup some test cases using check_warnings and check_py3k_warnings.
........
  r79032 | florent.xicluna | 2010-03-17 21:05:11 +0100 (mer, 17 mar 2010) | 2 lines

  Fix and check cgi module deprecation warnings.  Revert an unwanted rename in test_import.
........

											
										
										
											2010-03-18 04:29:51 +08:00
+								            unload(TESTFN)
-												Issue #22390: Remove files created by tests

											
										
										
											2014-10-05 23:37:41 +08:00
+								            rmtree('__pycache__')
-												Correction for issue1134: all source files with a coding spec, except latin-1
and utf-8, crashed when parsing a multiline string, or a line longer than 512
columns.

											
										
										
											2007-11-16 07:19:43 +08:00
-												Merged revisions 73004,73439,73496,73509,73529,73564,73576-73577,73595-73596,73605 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r73004 | jeffrey.yasskin | 2009-05-28 22:44:31 -0500 (Thu, 28 May 2009) | 5 lines

  Fix nearly all compilation warnings under Apple gcc-4.0.  Tested with OPT="-g
  -Wall -Wstrict-prototypes -Werror" in both --with-pydebug mode and --without.
  There's still a batch of non-prototype warnings in Xlib.h that I don't know how
  to fix.
........
  r73439 | benjamin.peterson | 2009-06-15 19:29:31 -0500 (Mon, 15 Jun 2009) | 1 line

  don't mask encoding errors when decoding a string #6289
........
  r73496 | vinay.sajip | 2009-06-21 12:37:27 -0500 (Sun, 21 Jun 2009) | 1 line

  Issue #6314: logging.basicConfig() performs extra checks on the "level" argument.
........
  r73509 | amaury.forgeotdarc | 2009-06-22 14:33:48 -0500 (Mon, 22 Jun 2009) | 2 lines

  #4490 Fix sample code run by "python -m xml.sax.xmlreader"
........
  r73529 | r.david.murray | 2009-06-23 13:02:46 -0500 (Tue, 23 Jun 2009) | 4 lines

  Fix issue 5230 by having pydoc's safeimport check to see if the import
  error was thrown from itself in order to decide if the module can't be
  found.  Thanks to Lucas Prado Melo for collaborating on the fix and tests.
........
  r73564 | amaury.forgeotdarc | 2009-06-25 17:29:29 -0500 (Thu, 25 Jun 2009) | 6 lines

  #2016 Fix a crash in function call when the **kwargs dictionary is mutated
  during the function call setup.

  This even gives a slight speedup, probably because tuple allocation
  is faster than PyMem_NEW.
........
  r73576 | benjamin.peterson | 2009-06-26 18:37:06 -0500 (Fri, 26 Jun 2009) | 1 line

  document is_declared_global()
........
  r73577 | benjamin.peterson | 2009-06-27 09:16:23 -0500 (Sat, 27 Jun 2009) | 1 line

  link to extensive generator docs in the reference manual
........
  r73595 | ezio.melotti | 2009-06-27 18:45:39 -0500 (Sat, 27 Jun 2009) | 1 line

  stmt and setup can contain multiple statements, see #5896
........
  r73596 | ezio.melotti | 2009-06-27 19:07:45 -0500 (Sat, 27 Jun 2009) | 1 line

  Fixed a wrong apostrophe
........
  r73605 | georg.brandl | 2009-06-28 07:10:18 -0500 (Sun, 28 Jun 2009) | 1 line

  Remove stray pychecker directive.
........

											
										
										
											2009-06-29 01:22:03 +08:00
+								    def test_error_from_string(self):
 								        # See http://bugs.python.org/issue6289
 								        input = "# coding: ascii\n\N{SNOWMAN}".encode('utf-8')
-												Merged revisions 79030-79032 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r79030 | florent.xicluna | 2010-03-17 20:05:04 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup in test_import and test_coding.
........
  r79031 | florent.xicluna | 2010-03-17 20:15:56 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup some test cases using check_warnings and check_py3k_warnings.
........
  r79032 | florent.xicluna | 2010-03-17 21:05:11 +0100 (mer, 17 mar 2010) | 2 lines

  Fix and check cgi module deprecation warnings.  Revert an unwanted rename in test_import.
........

											
										
										
											2010-03-18 04:29:51 +08:00
+								        with self.assertRaises(SyntaxError) as c:
-												Merged revisions 73004,73439,73496,73509,73529,73564,73576-73577,73595-73596,73605 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r73004 | jeffrey.yasskin | 2009-05-28 22:44:31 -0500 (Thu, 28 May 2009) | 5 lines

  Fix nearly all compilation warnings under Apple gcc-4.0.  Tested with OPT="-g
  -Wall -Wstrict-prototypes -Werror" in both --with-pydebug mode and --without.
  There's still a batch of non-prototype warnings in Xlib.h that I don't know how
  to fix.
........
  r73439 | benjamin.peterson | 2009-06-15 19:29:31 -0500 (Mon, 15 Jun 2009) | 1 line

  don't mask encoding errors when decoding a string #6289
........
  r73496 | vinay.sajip | 2009-06-21 12:37:27 -0500 (Sun, 21 Jun 2009) | 1 line

  Issue #6314: logging.basicConfig() performs extra checks on the "level" argument.
........
  r73509 | amaury.forgeotdarc | 2009-06-22 14:33:48 -0500 (Mon, 22 Jun 2009) | 2 lines

  #4490 Fix sample code run by "python -m xml.sax.xmlreader"
........
  r73529 | r.david.murray | 2009-06-23 13:02:46 -0500 (Tue, 23 Jun 2009) | 4 lines

  Fix issue 5230 by having pydoc's safeimport check to see if the import
  error was thrown from itself in order to decide if the module can't be
  found.  Thanks to Lucas Prado Melo for collaborating on the fix and tests.
........
  r73564 | amaury.forgeotdarc | 2009-06-25 17:29:29 -0500 (Thu, 25 Jun 2009) | 6 lines

  #2016 Fix a crash in function call when the **kwargs dictionary is mutated
  during the function call setup.

  This even gives a slight speedup, probably because tuple allocation
  is faster than PyMem_NEW.
........
  r73576 | benjamin.peterson | 2009-06-26 18:37:06 -0500 (Fri, 26 Jun 2009) | 1 line

  document is_declared_global()
........
  r73577 | benjamin.peterson | 2009-06-27 09:16:23 -0500 (Sat, 27 Jun 2009) | 1 line

  link to extensive generator docs in the reference manual
........
  r73595 | ezio.melotti | 2009-06-27 18:45:39 -0500 (Sat, 27 Jun 2009) | 1 line

  stmt and setup can contain multiple statements, see #5896
........
  r73596 | ezio.melotti | 2009-06-27 19:07:45 -0500 (Sat, 27 Jun 2009) | 1 line

  Fixed a wrong apostrophe
........
  r73605 | georg.brandl | 2009-06-28 07:10:18 -0500 (Sun, 28 Jun 2009) | 1 line

  Remove stray pychecker directive.
........

											
										
										
											2009-06-29 01:22:03 +08:00
+								            compile(input, "<string>", "exec")
-												Merged revisions 79030-79032 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r79030 | florent.xicluna | 2010-03-17 20:05:04 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup in test_import and test_coding.
........
  r79031 | florent.xicluna | 2010-03-17 20:15:56 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup some test cases using check_warnings and check_py3k_warnings.
........
  r79032 | florent.xicluna | 2010-03-17 21:05:11 +0100 (mer, 17 mar 2010) | 2 lines

  Fix and check cgi module deprecation warnings.  Revert an unwanted rename in test_import.
........

											
										
										
											2010-03-18 04:29:51 +08:00
+								        expected = "'ascii' codec can't decode byte 0xe2 in position 16: " \
 								                   "ordinal not in range(128)"
-												Issue #18202: Fix minor bugs and cleanup test_source_encoding.py.

											
										
										
											2013-06-19 15:29:58 +08:00
+								        self.assertTrue(c.exception.args[0].startswith(expected),
 								                        msg=c.exception.args[0])
-												Merged revisions 79030-79032 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r79030 | florent.xicluna | 2010-03-17 20:05:04 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup in test_import and test_coding.
........
  r79031 | florent.xicluna | 2010-03-17 20:15:56 +0100 (mer, 17 mar 2010) | 2 lines

  Cleanup some test cases using check_warnings and check_py3k_warnings.
........
  r79032 | florent.xicluna | 2010-03-17 21:05:11 +0100 (mer, 17 mar 2010) | 2 lines

  Fix and check cgi module deprecation warnings.  Revert an unwanted rename in test_import.
........

											
										
										
											2010-03-18 04:29:51 +08:00
-												Merged revisions 73004,73439,73496,73509,73529,73564,73576-73577,73595-73596,73605 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk

........
  r73004 | jeffrey.yasskin | 2009-05-28 22:44:31 -0500 (Thu, 28 May 2009) | 5 lines

  Fix nearly all compilation warnings under Apple gcc-4.0.  Tested with OPT="-g
  -Wall -Wstrict-prototypes -Werror" in both --with-pydebug mode and --without.
  There's still a batch of non-prototype warnings in Xlib.h that I don't know how
  to fix.
........
  r73439 | benjamin.peterson | 2009-06-15 19:29:31 -0500 (Mon, 15 Jun 2009) | 1 line

  don't mask encoding errors when decoding a string #6289
........
  r73496 | vinay.sajip | 2009-06-21 12:37:27 -0500 (Sun, 21 Jun 2009) | 1 line

  Issue #6314: logging.basicConfig() performs extra checks on the "level" argument.
........
  r73509 | amaury.forgeotdarc | 2009-06-22 14:33:48 -0500 (Mon, 22 Jun 2009) | 2 lines

  #4490 Fix sample code run by "python -m xml.sax.xmlreader"
........
  r73529 | r.david.murray | 2009-06-23 13:02:46 -0500 (Tue, 23 Jun 2009) | 4 lines

  Fix issue 5230 by having pydoc's safeimport check to see if the import
  error was thrown from itself in order to decide if the module can't be
  found.  Thanks to Lucas Prado Melo for collaborating on the fix and tests.
........
  r73564 | amaury.forgeotdarc | 2009-06-25 17:29:29 -0500 (Thu, 25 Jun 2009) | 6 lines

  #2016 Fix a crash in function call when the **kwargs dictionary is mutated
  during the function call setup.

  This even gives a slight speedup, probably because tuple allocation
  is faster than PyMem_NEW.
........
  r73576 | benjamin.peterson | 2009-06-26 18:37:06 -0500 (Fri, 26 Jun 2009) | 1 line

  document is_declared_global()
........
  r73577 | benjamin.peterson | 2009-06-27 09:16:23 -0500 (Sat, 27 Jun 2009) | 1 line

  link to extensive generator docs in the reference manual
........
  r73595 | ezio.melotti | 2009-06-27 18:45:39 -0500 (Sat, 27 Jun 2009) | 1 line

  stmt and setup can contain multiple statements, see #5896
........
  r73596 | ezio.melotti | 2009-06-27 19:07:45 -0500 (Sat, 27 Jun 2009) | 1 line

  Fixed a wrong apostrophe
........
  r73605 | georg.brandl | 2009-06-28 07:10:18 -0500 (Sun, 28 Jun 2009) | 1 line

  Remove stray pychecker directive.
........

											
										
										
											2009-06-29 01:22:03 +08:00
-												Added new tests for detecting Python source code encoding.

											
										
										
											2016-03-21 04:29:40 +08:00
+								class AbstractSourceEncodingTest:
 								    def test_default_coding(self):
 								        src = (b'print(ascii("\xc3\xa4"))\n')
 								        self.check_script_output(src, br"'\xe4'")
 								    def test_first_coding_line(self):
 								        src = (b'#coding:iso8859-15\n'
 								               b'print(ascii("\xc3\xa4"))\n')
 								        self.check_script_output(src, br"'\xc3\u20ac'")
 								    def test_second_coding_line(self):
 								        src = (b'#\n'
 								               b'#coding:iso8859-15\n'
 								               b'print(ascii("\xc3\xa4"))\n')
 								        self.check_script_output(src, br"'\xc3\u20ac'")
 								    def test_third_coding_line(self):
 								        # Only first two lines are tested for a magic comment.
 								        src = (b'#\n'
 								               b'#\n'
 								               b'#coding:iso8859-15\n'
 								               b'print(ascii("\xc3\xa4"))\n')
 								        self.check_script_output(src, br"'\xe4'")
 								    def test_double_coding_line(self):
 								        # If the first line matches the second line is ignored.
 								        src = (b'#coding:iso8859-15\n'
 								               b'#coding:latin1\n'
 								               b'print(ascii("\xc3\xa4"))\n')
 								        self.check_script_output(src, br"'\xc3\u20ac'")
 								    def test_double_coding_same_line(self):
 								        src = (b'#coding:iso8859-15 coding:latin1\n'
 								               b'print(ascii("\xc3\xa4"))\n')
-												Issue #26581: Use the first coding cookie on a line, not the last one.

											
										
										
											2016-03-21 05:36:29 +08:00
+								        self.check_script_output(src, br"'\xc3\u20ac'")
-												Added new tests for detecting Python source code encoding.

											
										
										
											2016-03-21 04:29:40 +08:00
 								    def test_first_non_utf8_coding_line(self):
 								        src = (b'#coding:iso-8859-15 \xa4\n'
 								               b'print(ascii("\xc3\xa4"))\n')
 								        self.check_script_output(src, br"'\xc3\u20ac'")
 								    def test_second_non_utf8_coding_line(self):
 								        src = (b'\n'
 								               b'#coding:iso-8859-15 \xa4\n'
 								               b'print(ascii("\xc3\xa4"))\n')
 								        self.check_script_output(src, br"'\xc3\u20ac'")
 								    def test_utf8_bom(self):
 								        src = (b'\xef\xbb\xbfprint(ascii("\xc3\xa4"))\n')
 								        self.check_script_output(src, br"'\xe4'")
 								    def test_utf8_bom_and_utf8_coding_line(self):
 								        src = (b'\xef\xbb\xbf#coding:utf-8\n'
 								               b'print(ascii("\xc3\xa4"))\n')
 								        self.check_script_output(src, br"'\xe4'")
 								class BytesSourceEncodingTest(AbstractSourceEncodingTest, unittest.TestCase):
 								    # Runs the shared cases by handing the source bytes straight to exec().
 								    def check_script_output(self, src, expected):
 								        # Execute in-process while stdout is captured, then compare the
 								        # captured text (re-encoded as latin1 bytes) with *expected*.
 								        with captured_stdout() as stdout:
 								            exec(src)
 								        printed = stdout.getvalue().encode('latin1').rstrip()
 								        self.assertEqual(printed, expected)
 								class FileSourceEncodingTest(AbstractSourceEncodingTest, unittest.TestCase):
 								    # Runs the shared cases by writing the source to a file and executing
 								    # that file through script_helper.assert_python_ok().
 								    def check_script_output(self, src, expected):
 								        # The script lives in a temporary directory that is removed
 								        # when the with-block exits; the result object is kept.
 								        with tempfile.TemporaryDirectory() as workdir:
 								            script_path = os.path.join(workdir, 'test.py')
 								            with open(script_path, 'wb') as script_file:
 								                script_file.write(src)
 								            result = script_helper.assert_python_ok(script_path)
 								        actual = result.out.rstrip()
 								        self.assertEqual(actual, expected)
-												- Fix segfault with invalid coding.
- SF Bug #772896, unknown encoding results in MemoryError, which is not helpful

I will only backport the segfault fix.  I'll let Anthony decide if he wants
the other changes backported.  I will do the backport if asked.

											
										
										
											2005-10-02 09:48:49 +08:00
+								if __name__ == "__main__":
-												Issue #18048: Merge test_pep263.py and test_coding.py into test_source_encoding.py.

											
										
										
											2013-06-13 15:08:00 +08:00
+								    unittest.main()