File: vdf.py

package info (click to toggle)
python-steamodd 5.0-1
links: PTS, VCS
area: main
in suites: forky, sid
size: 304 kB
sloc: python: 2,224; makefile: 162
file content (209 lines) | stat: -rw-r--r-- 5,655 bytes
"""
VDF (de)serialization
Copyright (c) 2010+, Anthony Garcia <anthony@lagg.me>
Distributed under the ISC License (see LICENSE)
"""

STRING = '"'
NODE_OPEN = '{'
NODE_CLOSE = '}'
BR_OPEN = '['
BR_CLOSE = ']'
COMMENT = '/'
CR = '\r'
LF = '\n'
SPACE = ' '
TAB = '\t'
WHITESPACE = set(' \t\r\n')

try:
    from collections import OrderedDict as odict
except ImportError:
    odict = dict


def _symtostr(line, i, token=STRING):
    opening = i + 1
    closing = 0

    ci = line.find(token, opening)
    while ci != -1:
        if line[ci - 1] != '\\':
            closing = ci
            break
        ci = line.find(token, ci + 1)

    finalstr = line[opening:closing]
    return finalstr, i + len(finalstr) + 1


def _unquotedtostr(line, i):
    ci = i
    _len = len(line)
    while ci < _len:
        if line[ci] in WHITESPACE:
            break
        ci += 1
    return line[i:ci], ci


def _parse(stream, ptr=0):
    i = ptr
    laststr = None
    lasttok = None
    lastbrk = None
    next_is_value = False
    deserialized = {}

    while i < len(stream):
        c = stream[i]

        if c == NODE_OPEN:
            next_is_value = False  # Make sure next string is interpreted as a key.

            if laststr in deserialized.keys():
                # If this key already exists then we need to make it a list and append the current value.
                if type(deserialized[laststr]) is not list:
                    # If the value already set is not a list, let's make it one.
                    deserialized[laststr] = [deserialized[laststr]]

                # Append the current value to the list
                _value, i = _parse(stream, i + 1)
                deserialized[laststr].append(_value)
            else:
                # Key is brand new!
                deserialized[laststr], i = _parse(stream, i + 1)
        elif c == NODE_CLOSE:
            return deserialized, i
        elif c == BR_OPEN:
            lastbrk, i = _symtostr(stream, i, BR_CLOSE)
        elif c == COMMENT:
            if (i + 1) < len(stream) and stream[i + 1] == '/':
                i = stream.find('\n', i)
        elif c == CR or c == LF:
            ni = i + 1
            if ni < len(stream) and stream[ni] == LF:
                i = ni
            if lasttok != LF:
                c = LF
        elif c != SPACE and c != TAB:
            string, i = (
                _symtostr if c == STRING else
                _unquotedtostr)(stream, i)
            if lasttok == STRING and next_is_value:
                if laststr in deserialized and lastbrk is not None:
                    # ignore this entry if it's the second bracketed expression
                    lastbrk = None
                else:
                    if laststr in deserialized.keys():
                        # If this key already exists then we're dealing with a list of items
                        if type(deserialized[laststr]) is not list:
                            # If the existing val is not a list, we need to cast it to one.
                            deserialized[laststr] = [deserialized[laststr]]

                        # Append current val to list
                        deserialized[laststr].append(string)
                    else:
                        # First occurence of laststr in deserialized.  Assign the value as normal
                        deserialized[laststr] = string

            # force c = STRING so that lasttok will be set properly
            c = STRING
            laststr = string
            next_is_value = not next_is_value
        else:
            c = lasttok

        lasttok = c
        i += 1

    return deserialized, i


def _run_parse_encoded(string):
    try:
        encoded = bytearray(string, "utf-16")
    except:
        encoded = bytearray(string)  # Already byte object?

    try:
        encoded = encoded.decode("ascii")
    except UnicodeDecodeError:
        try:
            encoded = encoded.decode("utf-8")
        except:
            encoded = encoded.decode("utf-16")
    except UnicodeEncodeError:
        pass  # Likely already decoded

    res, ptr = _parse(encoded)
    return res


def load(stream):
    """
    Deserializes `stream` containing VDF document to Python object.
    """
    return _run_parse_encoded(stream.read())


def loads(string):
    """
    Deserializes `string` containing VDF document to Python object.
    """
    return _run_parse_encoded(string)

indent = 0
mult = 2


def _i():
    return u' ' * (indent * mult)


def _dump(obj):
    nodefmt = u'\n' + _i() + '"{0}"\n' + _i() + '{{\n{1}' + _i() + '}}\n\n'
    podfmt = _i() + '"{0}" "{1}"\n'
    lstfmt = _i() + (' ' * mult) + '"{0}" "1"'
    global indent

    indent += 1

    nodes = []
    for k, v in obj.items():
        if isinstance(v, dict):
            nodes.append(nodefmt.format(k, _dump(v)))
        else:
            try:
                try:
                    v.isdigit
                    nodes.append(podfmt.format(k, v))
                except AttributeError:
                    lst = map(lstfmt.format, v)
                    nodes.append(nodefmt.format(k, u'\n'.join(lst) + '\n'))
            except TypeError:
                nodes.append(podfmt.format(k, v))

    indent -= 1

    return u''.join(nodes)


def _run_dump(obj):
    res = _dump(obj)
    return res.encode("utf-16")


def dump(obj, stream):
    """
    Serializes `obj` as VDF formatted stream to `stream` object, encoded as
    UTF-16 by default.
    """
    stream.write(_run_dump(obj))


def dumps(obj):
    """
    Serializes `obj` as VDF formatted string, encoded as UTF-16 by default.
    """
    return _run_dump(obj)