File: quote.py

package info (click to toggle)

python-flanker 0.9.15-1

links: PTS, VCS
area: main
in suites: forky, sid, trixie
size: 17,976 kB
sloc: python: 9,308; makefile: 4

file content (58 lines) | stat: -rw-r--r-- 1,643 bytes

import regex as re
import six
from six.moves import StringIO

from flanker.addresslib._parser.lexer import t_ATOM, t_FWSP

_RE_ATOM_PHRASE = re.compile(
    r'(({atom}|\.)+({fwsp}({atom}|\.)+)*)?'.format(atom=t_ATOM, fwsp=t_FWSP),
    re.MULTILINE | re.VERBOSE)


def smart_quote(s):
    """
    Quotes the input string but only if it contains at least one word that is
    not an rfc2822 atom. That is probably a little bit excessive but we better
    be safe then sorry.
    """
    if _contains_atoms_only(s):
        return s

    return '"' + s.replace('\\', '\\\\').replace('"', '\\"') + '"'


def smart_unquote(s):
    """
    Returns a string that is created from the input string by unquoting all
    quoted regions in there. If there are no quoted regions in the input string
    then output string is identical to the input string.
    """
    unquoted = StringIO()
    escaped_char = False
    is_quoted_section = False
    for c in s:
        if is_quoted_section:
            if escaped_char:
                escaped_char = False
            else:
                if c == '"':
                    is_quoted_section = False
                    continue
                elif c == '\\':
                    escaped_char = True
                    continue
        else:
            if c == '"':
                is_quoted_section = True
                continue

        unquoted.write(c)

    return unquoted.getvalue()


def _contains_atoms_only(s):
    if six.PY2 and isinstance(s, six.text_type):
        s = s.encode('utf-8')
    match_result = _RE_ATOM_PHRASE.match(s)
    return match_result and match_result.end(0) == len(s)