관리-도구

편집 파일: quoting.py

import re
from string import ascii_letters, ascii_lowercase, digits

# Lowercase ASCII letters as bytes, for membership tests on byte values.
BASCII_LOWERCASE = ascii_lowercase.encode('ascii')
# Every percent-escape in upper-case form, b'%00' through b'%FF'.
BPCT_ALLOWED = {'%{:02X}'.format(i).encode('ascii') for i in range(256)}
# Character classes named after the RFC 3986 grammar (section 2.2 / 2.3).
GEN_DELIMS = ":/?#[]@"
# Sub-delimiters minus the ones that carry meaning inside a query string.
SUB_DELIMS_WITHOUT_QS = "!$'()*,"
SUB_DELIMS = SUB_DELIMS_WITHOUT_QS + '+&=;'
RESERVED = GEN_DELIMS + SUB_DELIMS
UNRESERVED = ascii_letters + digits + '-._~'
# Characters that are emitted literally regardless of quoter options.
ALLOWED = UNRESERVED + SUB_DELIMS_WITHOUT_QS

# Matches exactly two upper-case hexadecimal digits.  The character class is
# limited to 0-9 and A-F so that pairs such as b'ZZ' are rejected up front
# instead of relying on a later int(..., 16) failure.
_IS_HEX = re.compile(rb'[0-9A-F]{2}')

class _PyQuoter:
    """Pure-Python percent-encoder that tolerates already-encoded input.

    Calling an instance with a ``str`` returns that string with every byte
    outside the safe set replaced by an upper-case ``%XX`` escape.  Escapes
    already present in the input are normalised to upper case; an escape
    that decodes to a safe, non-protected character is replaced by that
    character, and a ``%`` that does not start a valid escape is emitted
    as ``%25``.

    Keyword arguments:
        safe: extra characters that are emitted literally.
        protected: characters that are left as found -- a literal stays
            literal and an escaped one stays escaped.
        qs: query-string mode.  A space becomes ``+`` and the characters
            ``+&=;`` are no longer part of the default safe set.
    """

    def __init__(self, *, safe='', protected='', qs=False):
        self._safe = safe
        self._protected = protected
        self._qs = qs

    def __call__(self, val):
        """Return *val* percent-encoded.

        ``None`` is returned unchanged and ``''`` yields ``''``.

        Raises:
            TypeError: if *val* is neither ``None`` nor a ``str``.
            UnicodeEncodeError: if ``safe``/``protected`` contain
                non-ASCII characters (they are encoded as ASCII here).
        """
        if val is None:
            return None
        if not isinstance(val, str):
            raise TypeError("Argument should be str")
        if not val:
            return ''
        # Characters that cannot be encoded as UTF-8 (lone surrogates) are
        # dropped by errors='ignore'.
        val = val.encode('utf8', errors='ignore')
        length = len(val)
        ret = bytearray()
        # Bytes of the "%XX" escape currently being read; empty when idle.
        pct = bytearray()
        safe = self._safe + ALLOWED
        if not self._qs:
            safe += '+&=;'
        safe += self._protected
        bsafe = safe.encode('ascii')
        idx = 0
        while idx < length:
            ch = val[idx]
            idx += 1

            if pct:
                if ch in BASCII_LOWERCASE:
                    ch = ch - 32  # convert to uppercase
                pct.append(ch)
                if len(pct) == 3:  # pragma: no branch   # peephole optimizer
                    code = None
                    if _IS_HEX.match(pct[1:]):
                        try:
                            code = int(pct[1:].decode('ascii'), base=16)
                        except ValueError:
                            # The pattern let a non-hex pair through.
                            pass
                    if code is None:
                        # Not an escape: quote the "%" itself and re-read
                        # the two bytes after it as ordinary input.
                        ret.extend(b'%25')
                        pct.clear()
                        idx -= 2
                        continue

                    unquoted = chr(code)
                    if unquoted in safe and unquoted not in self._protected:
                        ret.append(code)
                    else:
                        ret.extend(pct)
                    pct.clear()

                # special case, if we have only one char after "%"
                elif len(pct) == 2 and idx == length:
                    ret.extend(b'%25')
                    pct.clear()
                    idx -= 1

                continue

            if ch == ord('%'):
                pct.append(ch)

                # special case if "%" is last char
                if idx == length:
                    ret.extend(b'%25')

                continue

            if self._qs and ch == ord(' '):
                ret.append(ord('+'))
                continue
            if ch in bsafe:
                ret.append(ch)
                continue

            ret.extend(('%{:02X}'.format(ch)).encode('ascii'))

        return ret.decode('ascii')

class _PyUnquoter:
    """Pure-Python percent-decoder.

    Calling an instance with a ``str`` returns that string with ``%XX``
    escapes decoded as UTF-8.  Input that is not a well-formed escape is
    never dropped and never raises: a ``%`` that is not followed by two
    hexadecimal digits is treated as an ordinary character, and escapes
    whose bytes are not valid UTF-8 are copied to the output unchanged.

    Keyword arguments:
        unsafe: characters that must stay percent-encoded in the result.
            A decoded character found here is re-encoded with the default
            quoter; a literal one is written as its UTF-8 ``%XX`` escapes.
        qs: query-string mode.  A literal ``+`` becomes a space (unless it
            is listed in ``unsafe``) and decoded ``+``, ``=``, ``&``, ``;``
            are re-encoded with the query-string quoter.
    """

    # Characters accepted as hex digits of an escape.  int(text, 16) alone
    # is too lenient: it also accepts signs, whitespace and non-ASCII digits.
    _HEX_DIGITS = frozenset('0123456789abcdefABCDEF')

    def __init__(self, *, unsafe='', qs=False):
        self._unsafe = unsafe
        self._qs = qs
        self._quoter = _Quoter()
        self._qs_quoter = _Quoter(qs=True)

    def __call__(self, val):
        """Return *val* with percent-escapes decoded.

        ``None`` is returned unchanged and ``''`` yields ``''``.

        Raises:
            TypeError: if *val* is neither ``None`` nor a ``str``.
        """
        if val is None:
            return None
        if not isinstance(val, str):
            raise TypeError("Argument should be str")
        if not val:
            return ''
        hex_digits = self._HEX_DIGITS
        ret = []
        # Bytes of the current run of consecutive escapes, and the literal
        # "%XX" text each byte came from (needed to echo undecodable ones).
        octets = bytearray()
        escapes = []
        idx = 0
        length = len(val)
        while idx < length:
            ch = val[idx]
            if ch == '%':
                pair = val[idx + 1:idx + 3]
                if (len(pair) == 2 and pair[0] in hex_digits
                        and pair[1] in hex_digits):
                    octets.append(int(pair, base=16))
                    escapes.append(val[idx:idx + 3])
                    idx += 3
                    continue
                # Otherwise fall through: the "%" is an ordinary character.
            idx += 1

            if octets:
                self._emit_run(octets, escapes, ret)

            if ch == '+':
                if not self._qs or ch in self._unsafe:
                    ret.append('+')
                else:
                    ret.append(' ')
                continue

            if ch in self._unsafe:
                # Two hex digits per UTF-8 octet; surrogatepass keeps lone
                # surrogates from raising.
                ret.extend(
                    '%{:02X}'.format(octet)
                    for octet in ch.encode('utf8', errors='surrogatepass')
                )
                continue

            ret.append(ch)

        if octets:
            self._emit_run(octets, escapes, ret)
        return ''.join(ret)

    def _requote(self, char):
        """Return the output form of one decoded character."""
        if self._qs and char in '+=&;':
            return self._qs_quoter(char)
        if char in self._unsafe:
            return self._quoter(char)
        return char

    def _emit_run(self, octets, escapes, out):
        """Decode a run of escape bytes into *out*, then empty the buffers.

        Valid UTF-8 stretches are decoded character by character; the bytes
        of each invalid or truncated sequence are written back as the
        escapes they came from.
        """
        # memoryview slices avoid copying the tail on every retry.
        data = memoryview(bytes(octets))
        end = len(data)
        pos = 0
        while pos < end:
            try:
                text = str(data[pos:], 'utf8')
                bad_from = bad_to = end
            except UnicodeDecodeError as exc:
                # start/end are offsets into the slice that was decoded.
                bad_from = pos + exc.start
                bad_to = pos + exc.end
                text = str(data[pos:bad_from], 'utf8')
            for char in text:
                out.append(self._requote(char))
            out.extend(escapes[bad_from:bad_to])
            pos = bad_to
        del octets[:]
        del escapes[:]

# Bind the public names ``_Quoter`` / ``_Unquoter``: use the implementations
# from the sibling ``_quoting`` module when it can be imported, otherwise fall
# back to the pure-Python classes defined in this file.
# NOTE(review): ``_quoting`` is presumably a compiled accelerator -- confirm.
try:
    from ._quoting import _Quoter, _Unquoter
except ImportError:  # pragma: no cover
    _Quoter = _PyQuoter
    _Unquoter = _PyUnquoter