test_unicode_file.py 5.8 KB
Newer Older
1 2 3
# Test some Unicode file name semantics.
# We don't test many operations on files, only that
# their names can be used with Unicode characters.
4
import os, glob, time, shutil
5
import unicodedata
6

7
import unittest
8
from test.support import (run_unittest, rmtree,
9
    TESTFN_ENCODING, TESTFN_UNICODE, TESTFN_UNENCODABLE, create_empty_file)
10

11 12 13 14 15 16 17
# Skip the whole module when the platform does not advertise Unicode file
# name support and the Unicode test name cannot be encoded either.
if not os.path.supports_unicode_filenames:
    try:
        TESTFN_UNICODE.encode(TESTFN_ENCODING)
    except (TypeError, UnicodeError):
        # Either the file system encoding is None, or the file name
        # cannot be encoded in the file system encoding.
        raise unittest.SkipTest(
            "No Unicode filesystem semantics on this platform.")
18

19 20 21
def remove_if_exists(filename):
    """Delete the file *filename*; do nothing if there is no such file.

    The unlink is attempted directly rather than guarded by
    os.path.exists().  That avoids a race between the check and the
    removal, and it also removes a dangling symbolic link, which
    os.path.exists() reports as missing.

    Any other failure (for example a permission error, or *filename*
    naming a directory) propagates as the OSError raised by os.unlink().
    """
    try:
        os.unlink(filename)
    except (FileNotFoundError, NotADirectoryError):
        # Nothing at that path (or a parent component is not a
        # directory), so there is nothing to remove.
        pass
22

23 24 25
class TestUnicodeFiles(unittest.TestCase):
    """Check that common file system calls accept Unicode file names.

    The '_do_' methods are the actual tests; they generally assume the
    file already exists.  The '_test_' methods are entry points that take
    parameters, and the 'test_' methods are what unittest runs.
    """

    # Do all the tests we can given only a single filename.  The file should
    # exist.
    def _do_single(self, filename):
        """Run every check that needs only one existing file name.

        *filename* must name an existing regular file.  The checks rename,
        copy and move it via _do_copyish(), which ends with the file back
        under its original name.
        """
        # The name must be usable both as given and as an absolute path.
        for name in (filename, os.path.abspath(filename)):
            self.assertTrue(os.path.exists(name))
            self.assertTrue(os.path.isfile(name))
            self.assertTrue(os.access(name, os.R_OK))
        os.chmod(filename, 0o777)
        os.utime(filename, None)
        os.utime(filename, (time.time(), time.time()))
        # Copy/rename etc tests using the same filename
        self._do_copyish(filename, filename)
        # Filename should appear in glob output.  Check for an empty result
        # first so a miss is reported as a test failure, not an IndexError.
        matches = glob.glob(filename)
        self.assertTrue(matches, "glob.glob() did not find %a" % filename)
        self.assertEqual(os.path.abspath(filename),
                         os.path.abspath(matches[0]))
        # basename should appear in listdir.
        path, base = os.path.split(os.path.abspath(filename))
        file_list = os.listdir(path)
        # Normalize the unicode strings, as round-tripping the name via the OS
        # may return a different (but equivalent) value.
        base = unicodedata.normalize("NFD", base)
        file_list = [unicodedata.normalize("NFD", f) for f in file_list]

        self.assertIn(base, file_list)

    # Tests that copy, move, etc one file to another.
    def _do_copyish(self, filename1, filename2):
        """Rename, copy and move a file, mixing *filename1* and *filename2*.

        The two arguments are expected to refer to the same file: every
        operation is performed through one name and verified through the
        other.  *filename1* must exist on entry, and the file is back under
        its original name on a normal return.
        """
        new1 = filename1 + ".new"
        new2 = filename2 + ".new"

        # Should be able to rename the file using either name.
        self.assertTrue(os.path.isfile(filename1))  # must exist.
        os.rename(filename1, new2)
        self.assertFalse(os.path.isfile(filename2))
        self.assertTrue(os.path.isfile(new1))
        os.rename(new1, filename2)
        self.assertFalse(os.path.isfile(new1))
        self.assertTrue(os.path.isfile(filename2))

        shutil.copy(filename1, new2)
        os.unlink(new1)  # remove using equiv name.
        # And a couple of moves, one using each name.
        shutil.move(filename1, new2)
        self.assertFalse(os.path.exists(filename2))
        self.assertTrue(os.path.exists(new1))
        shutil.move(new1, filename2)
        self.assertFalse(os.path.exists(new2))
        self.assertTrue(os.path.exists(filename1))
        # Note - due to the implementation of shutil.move,
        # it tries a rename first.  This only fails on Windows when on
        # different file systems - and this test can't ensure that.
        # So we test the shutil.copy2 function, which is the thing most
        # likely to fail.
        shutil.copy2(filename1, new2)
        self.assertTrue(os.path.isfile(new1))
        os.unlink(new1)
        self.assertFalse(os.path.exists(new2))

    def _do_directory(self, make_name, chdir_name):
        """Create directory *make_name*, enter it as *chdir_name*, and check
        that the base name of the resulting working directory equals
        *make_name* (compared after NFD normalization).

        A pre-existing directory called *make_name* is removed first.  The
        original working directory is restored and the new directory is
        removed again, even if a check fails.
        """
        cwd = os.getcwd()
        if os.path.isdir(make_name):
            rmtree(make_name)
        os.mkdir(make_name)
        try:
            os.chdir(chdir_name)
            try:
                # Normalize both sides, as round-tripping the name via the
                # OS may return a different (but equivalent) value.
                cwd_result = unicodedata.normalize("NFD", os.getcwd())
                name_result = unicodedata.normalize("NFD", make_name)

                self.assertEqual(os.path.basename(cwd_result), name_result)
            finally:
                os.chdir(cwd)
        finally:
            os.rmdir(make_name)

    # The '_test' functions are 'entry points with params' - ie, what the
    # top-level 'test' functions would be if they could take params
    def _test_single(self, filename):
        """Run the single-file checks on *filename* twice: once on a file
        made by create_empty_file() and once on a file made by os.open().
        """
        remove_if_exists(filename)
        create_empty_file(filename)
        self._check_and_remove(filename)
        # and again with os.open.
        fd = os.open(filename, os.O_CREAT)
        os.close(fd)
        self._check_and_remove(filename)

    def _check_and_remove(self, filename):
        """Run _do_single() on *filename*, then delete it and verify that
        it is gone.

        Cleanup is tolerant on purpose.  If a check fails halfway through a
        rename the file may exist only as '<filename>.new'; an unconditional
        os.unlink(filename) would then raise from the finally clause and be
        reported instead of the real failure, and the '.new' file would be
        left behind.
        """
        try:
            self._do_single(filename)
        finally:
            for leftover in (filename, filename + ".new"):
                remove_if_exists(leftover)
        self.assertFalse(os.path.exists(filename))

    # The 'test' functions are unittest entry points, and simply call our
    # _test functions with each of the filename combinations we wish to test
    def test_single_files(self):
        self._test_single(TESTFN_UNICODE)
        if TESTFN_UNENCODABLE is not None:
            self._test_single(TESTFN_UNENCODABLE)

    def test_directories(self):
        # Make a directory and chdir into it, passing the same name for both
        # steps, then check the name reported for the current directory.
        ext = ".dir"
        self._do_directory(TESTFN_UNICODE+ext, TESTFN_UNICODE+ext)
        # Our directory name that can't use a non-unicode name.
        if TESTFN_UNENCODABLE is not None:
            self._do_directory(TESTFN_UNENCODABLE+ext,
                               TESTFN_UNENCODABLE+ext)
139

140
def test_main():
    """Pass this module's name to run_unittest()."""
    run_unittest(__name__)
142

143 144
# Allow running this test module directly as a script.
if __name__ == "__main__":
    test_main()