plistlib.py 14.6 KB
Newer Older
1 2
"""plistlib.py -- a tool to generate and parse MacOSX .plist files.

The PropertyList (.plist) file format is a simple XML pickle supporting
basic object types, like dictionaries, lists, numbers and strings.
Usually the top level object is a dictionary.

To write out a plist file, use the writePlist(rootObject, pathOrFile)
function. 'rootObject' is the top level object, 'pathOrFile' is a
filename or a (writable) file object.

To parse a plist from a file, use the readPlist(pathOrFile) function,
with a file name or a (readable) file object as the only argument. It
returns the top level object (again, usually a dictionary).

To work with plist data in strings, you can use readPlistFromString()
and writePlistToString().

Values can be strings, integers, floats, booleans, tuples, lists,
dictionaries, Data or datetime.datetime objects. String values (including
dictionary keys) may be unicode strings -- they will be written out as
UTF-8.

The <data> plist type is supported through the Data class. This is a
thin wrapper around a Python string.

Generate Plist example:

    pl = dict(
        aString="Doodah",
        aList=["A", "B", 12, 32.1, [1, 2, 3]],
        aFloat=0.1,
        anInt=728,
        aDict=dict(
            anotherString="<hello & hi there!>",
            aUnicodeValue=u'M\xe4ssig, Ma\xdf',
            aTrueValue=True,
            aFalseValue=False,
        ),
        someData=Data("<binary gunk>"),
        someMoreData=Data("<lots of binary gunk>" * 10),
        aDate=datetime.datetime.fromtimestamp(time.mktime(time.gmtime())),
    )
    # unicode keys are possible, but a little awkward to use:
    pl[u'\xc5benraa'] = "That was a unicode key."
    writePlist(pl, fileName)

Parse Plist example:

    pl = readPlist(pathOrFile)
    print pl["aKey"]
"""


54
# Names exported by "from plistlib import *".
__all__ = [
    "readPlist", "writePlist", "readPlistFromString", "writePlistToString",
    "readPlistFromResource", "writePlistToResource",
    "Plist", "Data", "Dict"
]
# Note: the Plist and Dict classes have been deprecated.
60

61
import binascii
62 63
import datetime
from cStringIO import StringIO
64
import re
65

66

67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
def readPlist(pathOrFile):
    """Read a .plist file. 'pathOrFile' may either be a file name or a
    (readable) file object. Return the unpacked root object (which
    usually is a dictionary).

    When a file name is given, the file is opened here and is always
    closed again, even if parsing raises. A file object passed in by
    the caller is never closed.
    """
    didOpen = 0
    if isinstance(pathOrFile, (str, unicode)):
        pathOrFile = open(pathOrFile)
        didOpen = 1
    try:
        p = PlistParser()
        rootObject = p.parse(pathOrFile)
    finally:
        # Only close what we opened ourselves.
        if didOpen:
            pathOrFile.close()
    return rootObject


def writePlist(rootObject, pathOrFile):
    """Write 'rootObject' to a .plist file. 'pathOrFile' may either be a
    file name or a (writable) file object.

    When a file name is given, the file is opened here and is always
    closed again, even if writing raises (e.g. TypeError for a value of
    an unsupported type). A file object passed in by the caller is never
    closed.
    """
    didOpen = 0
    if isinstance(pathOrFile, (str, unicode)):
        pathOrFile = open(pathOrFile, "w")
        didOpen = 1
    try:
        writer = PlistWriter(pathOrFile)
        writer.writeln("<plist version=\"1.0\">")
        writer.writeValue(rootObject)
        writer.writeln("</plist>")
    finally:
        # Only close what we opened ourselves.
        if didOpen:
            pathOrFile.close()
97 98


99 100 101 102 103 104 105 106 107 108 109 110 111 112
def readPlistFromString(data):
    """Parse the plist document held in the string 'data' and return
    its root object.
    """
    # Wrap the string in a file-like object so readPlist() can consume it.
    stream = StringIO(data)
    return readPlist(stream)


def writePlistToString(rootObject):
    """Serialize 'rootObject' as a plist document and return the
    resulting string.
    """
    # Let writePlist() write into an in-memory buffer, then hand back
    # everything that was written.
    buf = StringIO()
    writePlist(rootObject, buf)
    plistText = buf.getvalue()
    return plistText


113 114 115 116 117 118 119 120 121
def readPlistFromResource(path, restype='plst', resid=0):
    """Read plst resource from the resource fork of path.

    The resource of type 'restype' with id 'resid' is fetched from the
    resource fork of 'path' and its data is parsed with
    readPlistFromString(). Return the root object of the plist.
    """
    from Carbon.File import FSRef, FSGetResourceForkName
    from Carbon.Files import fsRdPerm
    from Carbon import Res
    fsRef = FSRef(path)
    resNum = Res.FSOpenResourceFile(fsRef, FSGetResourceForkName(), fsRdPerm)
    try:
        Res.UseResFile(resNum)
        plistData = Res.Get1Resource(restype, resid).data
    finally:
        # Close the resource file even when the lookup fails.
        Res.CloseResFile(resNum)
    return readPlistFromString(plistData)
125 126 127 128 129 130 131 132


def writePlistToResource(rootObject, path, restype='plst', resid=0):
    """Write 'rootObject' as a plst resource to the resource fork of path.

    An existing resource with the same 'restype' and 'resid' is removed
    first; the plist produced by writePlistToString() is then added
    under that type and id.
    """
    from Carbon.File import FSRef, FSGetResourceForkName
    from Carbon.Files import fsRdWrPerm
    from Carbon import Res
    # Serialize first, so an unsupported value fails before the resource
    # file is opened.
    plistData = writePlistToString(rootObject)
    fsRef = FSRef(path)
    resNum = Res.FSOpenResourceFile(fsRef, FSGetResourceForkName(), fsRdWrPerm)
    try:
        Res.UseResFile(resNum)
        try:
            Res.Get1Resource(restype, resid).RemoveResource()
        except Res.Error:
            # Nothing to replace: removal is best-effort.
            pass
        res = Res.Resource(plistData)
        res.AddResource(restype, resid, '')
        res.WriteResource()
    finally:
        # Close the resource file even when writing fails.
        Res.CloseResFile(resNum)


147 148
class DumbXMLWriter:

    """Minimal XML writer that emits one indented line per call.

    'file' is any object with a write() method. 'indentLevel' is the
    starting nesting depth and 'indent' the string written once per
    nesting level at the start of each line.
    """

    def __init__(self, file, indentLevel=0, indent="\t"):
        self.file = file
        self.stack = []     # names of the elements that are currently open
        self.indentLevel = indentLevel
        self.indent = indent

    def beginElement(self, element):
        """Write the opening tag for 'element' and indent what follows."""
        self.stack.append(element)
        self.writeln("<%s>" % element)
        self.indentLevel += 1

    def endElement(self, element):
        """Write the closing tag for 'element', which must be the most
        recently opened element.
        """
        assert self.indentLevel > 0
        # Pop outside of the assert statement: asserts are stripped under
        # "python -O", and the stack has to be unwound regardless.
        opened = self.stack.pop()
        assert opened == element
        self.indentLevel -= 1
        self.writeln("</%s>" % element)

    def simpleElement(self, element, value=None):
        """Write 'element' on a single line.

        With a value, the escaped and encoded value is written between
        an opening and a closing tag; without one, an empty-element tag
        is written.
        """
        if value is not None:
            value = _escapeAndEncode(value)
            self.writeln("<%s>%s</%s>" % (element, value, element))
        else:
            self.writeln("<%s/>" % element)

    def writeln(self, line):
        """Write 'line' at the current indentation, followed by a newline.
        An empty line is written without any indentation.
        """
        if line:
            self.file.write(self.indentLevel * self.indent + line + "\n")
        else:
            self.file.write("\n")
178 179


180 181 182 183 184
# Contents should conform to a subset of ISO 8601
# (in particular, YYYY '-' MM '-' DD 'T' HH ':' MM ':' SS 'Z'.  Smaller units may be omitted with
#  a loss of precision)
_dateParser = re.compile(r"(?P<year>\d\d\d\d)(?:-(?P<month>\d\d)(?:-(?P<day>\d\d)(?:T(?P<hour>\d\d)(?::(?P<minute>\d\d)(?::(?P<second>\d\d))?)?)?)?)?Z")

185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201
def _dateFromString(s):
    order = ('year', 'month', 'day', 'hour', 'minute', 'second')
    gd = _dateParser.match(s).groupdict()
    lst = []
    for key in order:
        val = gd[key]
        if val is None:
            break
        lst.append(int(val))
    return datetime.datetime(*lst)

def _dateToString(d):
    return '%04d-%02d-%02dT%02d:%02d:%02dZ' % (
        d.year, d.month, d.day,
        d.hour, d.minute, d.second
    )

202

203 204
# Regex to find any control chars, except for \t \n and \r
_controlCharPat = re.compile(
205 206
    r"[\x00\x01\x02\x03\x04\x05\x06\x07\x08\x0b\x0c\x0e\x0f"
    r"\x10\x11\x12\x13\x14\x15\x16\x17\x18\x19\x1a\x1b\x1c\x1d\x1e\x1f]")
207

208
def _escapeAndEncode(text):
209 210 211 212
    m = _controlCharPat.search(text)
    if m is not None:
        raise ValueError("strings can't contains control characters; "
                         "use plistlib.Data instead")
213 214 215 216
    text = text.replace("\r\n", "\n")       # convert DOS line endings
    text = text.replace("\r", "\n")         # convert Mac line endings
    text = text.replace("&", "&amp;")       # escape '&'
    text = text.replace("<", "&lt;")        # escape '<'
217
    text = text.replace(">", "&gt;")        # escape '>'
218
    return text.encode("utf-8")             # encode as UTF-8
219 220 221 222 223 224 225 226 227


PLISTHEADER = """\
<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE plist PUBLIC "-//Apple Computer//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
"""

class PlistWriter(DumbXMLWriter):

    """XML writer that knows how to serialize Python values as plist
    elements.
    """

    def __init__(self, file, indentLevel=0, indent="\t", writeHeader=1):
        # The header is written before any indentation is set up.
        if writeHeader:
            file.write(PLISTHEADER)
        DumbXMLWriter.__init__(self, file, indentLevel, indent)

    def writeValue(self, value):
        """Write 'value' as the plist element matching its type.

        Raises TypeError for a value of an unsupported type.
        """
        if isinstance(value, (str, unicode)):
            self.simpleElement("string", value)
        elif isinstance(value, bool):
            # must switch for bool before int, as bool is a
            # subclass of int...
            if value:
                self.simpleElement("true")
            else:
                self.simpleElement("false")
        elif isinstance(value, (int, long)):
            self.simpleElement("integer", "%d" % value)
        elif isinstance(value, float):
            self.simpleElement("real", repr(value))
        elif isinstance(value, dict):
            self.writeDict(value)
        elif isinstance(value, Data):
            self.writeData(value)
        elif isinstance(value, datetime.datetime):
            self.simpleElement("date", _dateToString(value))
        elif isinstance(value, (tuple, list)):
            self.writeArray(value)
        else:
            raise TypeError("unsupported type: %s" % type(value))

    def writeData(self, data):
        """Write the Data instance 'data' as a base64 <data> element."""
        self.beginElement("data")
        # The base64 lines are written at the same indentation as the
        # <data> tags themselves, so undo the indent of beginElement().
        self.indentLevel -= 1
        # Keep each output line within 76 columns, counting a tab in the
        # indent string as 8 columns.
        maxlinelength = 76 - len(self.indent.replace("\t", " " * 8) *
                                 self.indentLevel)
        for line in data.asBase64(maxlinelength).split("\n"):
            if line:
                self.writeln(line)
        self.indentLevel += 1
        self.endElement("data")

    def writeDict(self, d):
        """Write the dictionary 'd' as a <dict> element, with its items
        in sorted order.

        Raises TypeError if a key is not a string.
        """
        self.beginElement("dict")
        items = d.items()
        items.sort()
        for key, value in items:
            if not isinstance(key, (str, unicode)):
                raise TypeError("keys must be strings")
            self.simpleElement("key", key)
            self.writeValue(value)
        self.endElement("dict")

    def writeArray(self, array):
        """Write the sequence 'array' as an <array> element."""
        self.beginElement("array")
        for value in array:
            self.writeValue(value)
        self.endElement("array")
285 286


287
class _InternalDict(dict):
288

289 290 291
    # This class is needed while Dict is scheduled for deprecation:
    # we only need to warn when a *user* instantiates Dict or when
    # the "attribute notation for dict keys" is used.
292

293 294 295 296 297
    def __getattr__(self, attr):
        try:
            value = self[attr]
        except KeyError:
            raise AttributeError, attr
298 299 300
        from warnings import warn
        warn("Attribute access from plist dicts is deprecated, use d[key] "
             "notation instead", PendingDeprecationWarning)
301
        return value
302

303
    def __setattr__(self, attr, value):
304 305 306
        from warnings import warn
        warn("Attribute access from plist dicts is deprecated, use d[key] "
             "notation instead", PendingDeprecationWarning)
307
        self[attr] = value
308

309 310 311 312 313
    def __delattr__(self, attr):
        try:
            del self[attr]
        except KeyError:
            raise AttributeError, attr
314 315 316 317 318 319 320 321 322 323 324
        from warnings import warn
        warn("Attribute access from plist dicts is deprecated, use d[key] "
             "notation instead", PendingDeprecationWarning)

class Dict(_InternalDict):

    """This class has been deprecated. Use the builtin dict instead."""

    def __init__(self, **kwargs):
        from warnings import warn
        # stacklevel=2: report the warning at the line that instantiated
        # Dict rather than at this line.
        warn("The plistlib.Dict class is deprecated, use builtin dict instead",
             PendingDeprecationWarning, stacklevel=2)
        super(Dict, self).__init__(**kwargs)
325 326


327
class Plist(_InternalDict):

    """This class has been deprecated. Use readPlist() and writePlist()
    functions instead, together with regular dict objects.
    """

    def __init__(self, **kwargs):
        from warnings import warn
        # stacklevel=2: report the warning at the line that instantiated
        # Plist rather than at this line.
        warn("The Plist class is deprecated, use the readPlist() and "
             "writePlist() functions instead", PendingDeprecationWarning,
             stacklevel=2)
        super(Plist, self).__init__(**kwargs)

    def fromFile(cls, pathOrFile):
        """Deprecated. Use the readPlist() function instead."""
        rootObject = readPlist(pathOrFile)
        # Copy the parsed items into a fresh instance of 'cls'.
        plist = cls()
        plist.update(rootObject)
        return plist
    fromFile = classmethod(fromFile)

    def write(self, pathOrFile):
        """Deprecated. Use the writePlist() function instead."""
        writePlist(self, pathOrFile)
350 351


352 353 354 355 356 357 358 359 360
def _encodeBase64(s, maxlinelength=76):
    # copied from base64.encodestring(), with added maxlinelength argument
    maxbinsize = (maxlinelength//4)*3
    pieces = []
    for i in range(0, len(s), maxbinsize):
        chunk = s[i : i + maxbinsize]
        pieces.append(binascii.b2a_base64(chunk))
    return "".join(pieces)

361 362
class Data:

    """Wrapper for binary data."""

    def __init__(self, data):
        self.data = data

    def fromBase64(cls, data):
        """Alternate constructor: build an instance from base64 text."""
        # base64.decodestring just calls binascii.a2b_base64;
        # it seems overkill to use both base64 and binascii.
        return cls(binascii.a2b_base64(data))
    fromBase64 = classmethod(fromBase64)

    def asBase64(self, maxlinelength=76):
        """Return the wrapped data base64-encoded by _encodeBase64(),
        with 'maxlinelength' passed through.
        """
        return _encodeBase64(self.data, maxlinelength)

    def __cmp__(self, other):
        # Compare by payload against another instance or a plain string;
        # anything else gets an arbitrary ordering based on identity.
        if isinstance(other, self.__class__):
            return cmp(self.data, other.data)
        elif isinstance(other, str):
            return cmp(self.data, other)
        else:
            return cmp(id(self), id(other))

    def __repr__(self):
        return "%s(%s)" % (self.__class__.__name__, repr(self.data))
387 388 389 390


class PlistParser:

    """Expat-based parser that turns a plist XML document into Python
    objects.

    Each element is dispatched to a begin_<element> / end_<element>
    method when one exists; elements without a handler are ignored.
    """

    def __init__(self):
        self.stack = []         # containers (dicts/arrays) still being filled
        self.currentKey = None  # pending <key> for the next dict value
        self.root = None
        self.data = []          # character data of the current element

    def parse(self, fileobj):
        """Parse the plist document read from 'fileobj' and return its
        root object.
        """
        from xml.parsers.expat import ParserCreate
        parser = ParserCreate()
        parser.StartElementHandler = self.handleBeginElement
        parser.EndElementHandler = self.handleEndElement
        parser.CharacterDataHandler = self.handleData
        parser.ParseFile(fileobj)
        return self.root

    def handleBeginElement(self, element, attrs):
        # Start collecting character data afresh for every element.
        self.data = []
        handler = getattr(self, "begin_" + element, None)
        if handler is not None:
            handler(attrs)

    def handleEndElement(self, element):
        handler = getattr(self, "end_" + element, None)
        if handler is not None:
            handler()

    def handleData(self, data):
        # Character data may arrive in several pieces; getData() joins them.
        self.data.append(data)

    def addObject(self, value):
        """Store 'value' where it belongs: under the pending key of the
        innermost dict, as the root object, or appended to the innermost
        array.
        """
        if self.currentKey is not None:
            self.stack[-1][self.currentKey] = value
            self.currentKey = None
        elif not self.stack:
            # this is the root object
            self.root = value
        else:
            self.stack[-1].append(value)

    def getData(self):
        """Return the character data collected for the current element
        and reset the collection buffer.
        """
        data = "".join(self.data)
        # Encode to ASCII when possible; text that cannot be encoded is
        # returned as it was received.
        try:
            data = data.encode("ascii")
        except UnicodeError:
            pass
        self.data = []
        return data

    # element handlers

    def begin_dict(self, attrs):
        d = _InternalDict()
        self.addObject(d)
        self.stack.append(d)
    def end_dict(self):
        self.stack.pop()

    def end_key(self):
        self.currentKey = self.getData()

    def begin_array(self, attrs):
        a = []
        self.addObject(a)
        self.stack.append(a)
    def end_array(self):
        self.stack.pop()

    def end_true(self):
        self.addObject(True)
    def end_false(self):
        self.addObject(False)
    def end_integer(self):
        self.addObject(int(self.getData()))
    def end_real(self):
        self.addObject(float(self.getData()))
    def end_string(self):
        self.addObject(self.getData())
    def end_data(self):
        self.addObject(Data.fromBase64(self.getData()))
    def end_date(self):
        self.addObject(_dateFromString(self.getData()))