# Test some Unicode file name semantics.
# We don't test many operations on files other than
# that their names can be used with Unicode characters.
| import os, glob, time, shutil | |
| import unicodedata | |
| import unittest | |
| from test.test_support import run_unittest, TESTFN_UNICODE | |
| from test.test_support import TESTFN_ENCODING, TESTFN_UNENCODABLE | |
# Work out a (unicode, encoded) pair of test file names that survive a
# round trip through TESTFN_ENCODING.  If no such pair can be found the
# whole module is skipped by raising unittest.SkipTest at import time.
try:
    TESTFN_ENCODED = TESTFN_UNICODE.encode(TESTFN_ENCODING)
except (UnicodeError, TypeError):
    # Either the file system encoding is None, or the file name
    # cannot be encoded in the file system encoding.
    raise unittest.SkipTest("No Unicode filesystem semantics on this platform.")

if TESTFN_ENCODED.decode(TESTFN_ENCODING) != TESTFN_UNICODE:
    # The file system encoding does not support Latin-1
    # (which test_support assumes), so try the file system
    # encoding instead.
    import sys
    try:
        TESTFN_UNICODE = unicode("@test-\xe0\xf2", sys.getfilesystemencoding())
        TESTFN_ENCODED = TESTFN_UNICODE.encode(TESTFN_ENCODING)
        if '?' in TESTFN_ENCODED:
            # MBCS will not report the error properly, so a '?' in the
            # encoded name is treated as an encoding failure here.
            raise UnicodeError("mbcs encoding problem")
    except (UnicodeError, TypeError):
        raise unittest.SkipTest("Cannot find a suitable filename.")

# Final sanity check: whichever name was picked above must round-trip.
if TESTFN_ENCODED.decode(TESTFN_ENCODING) != TESTFN_UNICODE:
    raise unittest.SkipTest("Cannot find a suitable filename.")
def remove_if_exists(filename):
    """Delete *filename*, silently doing nothing if it is not there.

    The unlink is attempted directly instead of being guarded by
    ``os.path.exists()``.  That avoids the window between the check and
    the unlink, and it also removes a dangling symbolic link, which
    ``os.path.exists()`` reports as missing because it follows the link.

    Raises:
        OSError: if the unlink fails for any reason other than the path
            being absent (for example when *filename* is a directory).
    """
    import errno  # local import keeps this helper self-contained

    try:
        os.unlink(filename)
    except OSError as exc:
        # ENOENT: nothing at that path.  ENOTDIR: a parent component is
        # not a directory.  In both cases os.path.exists() would have
        # returned False, so they remain a silent no-op.
        if exc.errno not in (errno.ENOENT, errno.ENOTDIR):
            raise
class TestUnicodeFiles(unittest.TestCase):
    """Check that file operations accept both Unicode and encoded names.

    Naming convention used by the methods below:

    * ``_do_*``   -- the actual checks; they generally assume the file
                     already exists.
    * ``_test_*`` -- "entry points with params": what the top-level
                     ``test_*`` methods would be if they could take
                     arguments.  They create the file, run the ``_do_*``
                     checks and clean up afterwards.
    * ``test_*``  -- unittest entry points; they simply call the
                     ``_test_*`` / ``_do_*`` helpers with each filename
                     combination we wish to test.
    """

    def _do_single(self, filename):
        """Do all the checks we can given only a single filename.

        The file named by *filename* should already exist.
        """
        abs_name = os.path.abspath(filename)

        # The file must be visible under both its given and absolute name.
        for name in (filename, abs_name):
            self.assertTrue(os.path.exists(name))
            self.assertTrue(os.path.isfile(name))
            self.assertTrue(os.access(name, os.R_OK))

        # 0o777 is accepted by Python 2.6+ as well as 3.x.
        os.chmod(filename, 0o777)
        os.utime(filename, None)
        now = time.time()
        os.utime(filename, (now, now))

        # Copy/rename etc tests using the same filename
        self._do_copyish(filename, filename)

        # Filename should appear in glob output.  Check for an empty
        # result first so a miss is reported as a test failure rather
        # than as an IndexError.
        matches = glob.glob(filename)
        self.assertTrue(matches, "glob() found no match for %r" % (filename,))
        self.assertEqual(abs_name, os.path.abspath(matches[0]))

        # basename should appear in listdir.
        path, base = os.path.split(abs_name)
        if isinstance(base, str):
            base = base.decode(TESTFN_ENCODING)
        file_list = os.listdir(path)
        # listdir() with a unicode arg may or may not return Unicode
        # objects, depending on the platform.
        if file_list and isinstance(file_list[0], str):
            file_list = [f.decode(TESTFN_ENCODING) for f in file_list]

        # Normalize the unicode strings, as round-tripping the name via the OS
        # may return a different (but equivalent) value.
        base = unicodedata.normalize("NFD", base)
        file_list = [unicodedata.normalize("NFD", f) for f in file_list]

        self.assertIn(base, file_list)

    def _do_equivalent(self, filename1, filename2):
        """Do as many "equivalency" checks as we can.

        That is, check that although the two filenames have different
        types, they refer to the same file.

        Only "filename1 against filename2" is checked here; the caller
        is assumed to call again with the arguments reversed.
        """
        self.assertIsNot(
            type(filename1), type(filename2),
            "No point checking equivalent filenames of the same type")
        # stat and lstat should return the same results.
        self.assertEqual(os.stat(filename1), os.stat(filename2))
        self.assertEqual(os.lstat(filename1), os.lstat(filename2))
        # Copy/rename etc tests using equivalent filename
        self._do_copyish(filename1, filename2)

    def _do_copyish(self, filename1, filename2):
        """Check that copy, move and rename work through either name.

        *filename1* must exist.  The two names are deliberately mixed:
        a file created via one name is checked or removed via the other.
        """
        # Should be able to rename the file using either name.
        self.assertTrue(os.path.isfile(filename1))  # must exist.
        os.rename(filename1, filename2 + ".new")
        self.assertTrue(os.path.isfile(filename1 + ".new"))
        os.rename(filename1 + ".new", filename2)
        self.assertTrue(os.path.isfile(filename2))

        shutil.copy(filename1, filename2 + ".new")
        os.unlink(filename1 + ".new")  # remove using equiv name.

        # And a couple of moves, one using each name.
        shutil.move(filename1, filename2 + ".new")
        self.assertFalse(os.path.exists(filename2))
        shutil.move(filename1 + ".new", filename2)
        self.assertTrue(os.path.exists(filename1))

        # Note - due to the implementation of shutil.move,
        # it tries a rename first.  This only fails on Windows when on
        # different file systems - and this test can't ensure that.
        # So we test the shutil.copy2 function, which is the thing most
        # likely to fail.
        shutil.copy2(filename1, filename2 + ".new")
        os.unlink(filename1 + ".new")

    def _do_directory(self, make_name, chdir_name, encoded):
        """Create a directory, chdir into it and verify the resulting cwd.

        make_name  -- name passed to os.mkdir() / os.rmdir().
        chdir_name -- name passed to os.chdir().
        encoded    -- true if *make_name* is an encoded (byte) string;
                      the cwd is then read with os.getcwd() and both
                      values are decoded with TESTFN_ENCODING before
                      being compared.  Otherwise os.getcwdu() is used.

        The original working directory is restored and the directory is
        removed again even if a check fails.
        """
        cwd = os.getcwd()
        # Start from a clean slate if an earlier run left the directory.
        if os.path.isdir(make_name):
            os.rmdir(make_name)
        os.mkdir(make_name)
        try:
            os.chdir(chdir_name)
            try:
                if not encoded:
                    cwd_result = os.getcwdu()
                    name_result = make_name
                else:
                    cwd_result = os.getcwd().decode(TESTFN_ENCODING)
                    name_result = make_name.decode(TESTFN_ENCODING)

                # Compare in a single normalization form.
                cwd_result = unicodedata.normalize("NFD", cwd_result)
                name_result = unicodedata.normalize("NFD", name_result)

                self.assertEqual(os.path.basename(cwd_result), name_result)
            finally:
                os.chdir(cwd)
        finally:
            os.rmdir(make_name)

    def _test_single(self, filename):
        """Run _do_single() on a file created first via open(), then os.open()."""
        remove_if_exists(filename)
        # Create an empty file with the builtin open().
        with open(filename, "w"):
            pass
        try:
            self._do_single(filename)
        finally:
            os.unlink(filename)
        self.assertFalse(os.path.exists(filename))

        # and again with os.open.
        fd = os.open(filename, os.O_CREAT)
        os.close(fd)
        try:
            self._do_single(filename)
        finally:
            os.unlink(filename)

    def _test_equivalent(self, filename1, filename2):
        """Create the file as *filename1* and run the equivalence checks."""
        remove_if_exists(filename1)
        self.assertFalse(os.path.exists(filename2))
        with open(filename1, "w"):
            pass
        try:
            self._do_equivalent(filename1, filename2)
        finally:
            os.unlink(filename1)

    # The test_* methods deliberately carry comments rather than
    # docstrings, so unittest's reported test descriptions stay unchanged.

    def test_single_files(self):
        # Each available flavour of the test file name, one at a time.
        self._test_single(TESTFN_ENCODED)
        self._test_single(TESTFN_UNICODE)
        if TESTFN_UNENCODABLE is not None:
            self._test_single(TESTFN_UNENCODABLE)

    def test_equivalent_files(self):
        # Both orderings, since _do_equivalent only checks one direction.
        self._test_equivalent(TESTFN_ENCODED, TESTFN_UNICODE)
        self._test_equivalent(TESTFN_UNICODE, TESTFN_ENCODED)

    def test_directories(self):
        # For all 'equivalent' combinations:
        #  Make dir with encoded, chdir with unicode, checkdir with encoded
        #  (or unicode/encoded/unicode, etc.)
        ext = ".dir"
        self._do_directory(TESTFN_ENCODED + ext, TESTFN_ENCODED + ext, True)
        self._do_directory(TESTFN_ENCODED + ext, TESTFN_UNICODE + ext, True)
        self._do_directory(TESTFN_UNICODE + ext, TESTFN_ENCODED + ext, False)
        self._do_directory(TESTFN_UNICODE + ext, TESTFN_UNICODE + ext, False)
        # Our directory name that can't use a non-unicode name.
        if TESTFN_UNENCODABLE is not None:
            self._do_directory(TESTFN_UNENCODABLE + ext,
                               TESTFN_UNENCODABLE + ext,
                               False)
def test_main():
    """Pass this module's name to test_support.run_unittest()."""
    this_module = __name__
    run_unittest(this_module)
# Call test_main() when this file is executed directly as a script.
if __name__ == "__main__":
    test_main()