slixmpp/sleekxmpp/util/misc_ops.py

import sys
import hashlib


def unicode(text):
    """
    Return ``text`` as a Unicode string.

    On Python 3, ``str`` values are returned untouched and anything else
    is decoded as UTF-8 via its ``decode`` method. On Python 2, byte
    strings are decoded as UTF-8 first and the result is passed through
    the builtin ``unicode`` constructor.

    :param text: The text (or UTF-8 encoded byte string) to convert.
    """
    if sys.version_info >= (3, 0):
        return text if isinstance(text, str) else text.decode('utf-8')

    # Python 2: ``str`` is the byte string type, so decode it first.
    if isinstance(text, str):
        text = text.decode('utf-8')
    # This function shadows the builtin, so reach it via __builtin__.
    import __builtin__
    return __builtin__.unicode(text)


def bytes(text):
    """
    Turn text into a byte string, encoding Unicode as UTF-8.

    Python 2.6+ and Python 3+ expose ``bytes`` constructors with
    incompatible signatures; this wrapper hides the difference.

    ``None`` becomes an empty byte string. On Python 3, existing bytes
    are returned unchanged, a list is treated as a sequence of integer
    byte values, and anything else is encoded as UTF-8.

    :param text: Unicode text to convert to bytes
    :rtype: bytes (Python3), str (Python2.6+)
    """
    if text is None:
        return b''

    if sys.version_info >= (3, 0):
        # This function shadows the builtin, so fetch the real type.
        import builtins
        native_bytes = builtins.bytes
        if isinstance(text, native_bytes):
            # Already bytes; hand it back untouched.
            return text
        if isinstance(text, list):
            # A list of integers maps directly onto byte values.
            return native_bytes(text)
        # Anything else is treated as text and encoded as UTF-8.
        return native_bytes(text, encoding='utf-8')

    # Python 2: the builtin ``bytes`` is an alias for ``str``.
    import __builtin__
    return __builtin__.bytes(text)


def quote(text):
    """
    Wrap a value in double quotes, backslash-escaping any backslashes
    and double quotes it contains.

    The value is first converted with ``bytes``, so the result is a
    byte string.

    :param text: A Unicode or byte string.
    """
    raw = bytes(text)
    # Backslashes must be escaped first so that the backslashes added
    # for the quotes are not themselves doubled.
    escaped = raw.replace(b'\\', b'\\\\')
    escaped = escaped.replace(b'"', b'\\"')
    return b'"' + escaped + b'"'


def num_to_bytes(num):
    """
    Convert an integer into a four byte sequence.

    The bytes are emitted most significant first (big-endian). Only the
    low 32 bits of ``num`` are used, so negative or oversized values
    wrap around instead of raising.

    :param integer num: An integer to convert to its byte representation.
    :rtype: bytes (Python3), str (Python2.6+)
    """
    # Pack the raw byte values directly. Building each byte through
    # ``bytes(chr(n))`` UTF-8 encodes the character on Python 3, which
    # turns every value above 0x7F into two bytes and corrupts the
    # output length.
    import struct
    return struct.pack('>I', num & 0xFFFFFFFF)


def bytes_to_num(bval):
    """
    Convert a four byte sequence to an integer.

    The first byte is treated as the most significant (big-endian).
    Only the first four bytes of ``bval`` are used.

    :param bytes bval: A four byte sequence to turn into an integer.
    :rtype: integer
    :raises IndexError: If fewer than four bytes are supplied.
    """
    # Indexing a bytearray yields integers on both Python 2 and
    # Python 3, so the shifts can be applied to the byte values
    # themselves. Shifting the raw element before calling ord() fails
    # on either version.
    octets = bytearray(bval[:4])
    return ((octets[0] << 24) | (octets[1] << 16)
            | (octets[2] << 8) | octets[3])


def XOR(x, y):
    """
    XOR two byte strings together, position by position.

    The inputs are expected to have equal length; they are paired with
    ``zip``, so any excess in the longer one is ignored.

    :param bytes x: A byte string
    :param bytes y: A byte string
    :rtype: bytes
    """
    pairs = zip(x, y)
    if sys.version_info < (3, 0):
        # Python 2: iterating a byte string yields one-character strings.
        return b''.join([chr(ord(left) ^ ord(right))
                         for left, right in pairs])
    # Python 3: iterating bytes yields integers directly.
    return bytes([left ^ right for left, right in pairs])


def hash(name):
    """
    Look up the hashlib constructor for a named algorithm.

    The name is matched case-insensitively, and a leading ``SHA-`` is
    collapsed to ``sha`` (so ``SHA-256`` resolves to ``hashlib.sha256``).

    :param name: The name of the hashing algorithm to use.
    :type name: string

    :rtype: function, or ``None`` if hashlib has no attribute of that name
    """
    algorithm = name.lower()
    if algorithm.startswith('sha-'):
        # Drop the hyphen: 'sha-1' -> 'sha1'
        algorithm = 'sha' + algorithm[4:]
    return getattr(hashlib, algorithm) if algorithm in dir(hashlib) else None


def hashes():
    """
    List the hashing algorithms that hashlib exposes.

    ``MD5`` and ``MD2`` come first when hashlib provides them, followed
    by one ``SHA-<suffix>`` entry for every hashlib attribute whose name
    starts with ``sha``.

    :rtype: list of strings
    """
    available = dir(hashlib)
    names = [label for attr, label in (('md5', 'MD5'), ('md2', 'MD2'))
             if attr in available]
    for attr in available:
        if attr.startswith('sha'):
            # e.g. 'sha256' -> 'SHA-256'
            names.append('SHA-' + attr[3:])
    return names


def setdefaultencoding(encoding):
    """
    Change the default string encoding used by the Unicode implementation.

    This delegates to ``sys.setdefaultencoding``. When that attribute is
    no longer present on ``sys`` (it is 'deleted' when the site module
    is executed), the function object is recovered by scanning the
    objects tracked by the garbage collector, and is re-attached to
    ``sys`` before being called.

    :param string encoding: An encoding name, compatible with sys.setdefaultencoding
    :raises RuntimeError: If no ``setdefaultencoding`` builtin can be found.
    """
    setter = getattr(sys, 'setdefaultencoding', None)
    if setter is not None:
        return setter(encoding)

    import gc
    import types
    for candidate in gc.get_objects():
        if not isinstance(candidate, types.BuiltinFunctionType):
            continue
        if candidate.__name__ == 'setdefaultencoding':
            setter = candidate
            break
    else:
        # The scan finished without finding the builtin.
        raise RuntimeError("Could not find setdefaultencoding")

    # Restore the attribute so later calls skip the scan.
    sys.setdefaultencoding = setter
    return setter(encoding)


def safedict(data):
    """
    Return a dictionary with keys suitable for the running interpreter.

    On Python 2.7 and later the input is returned as-is. On older
    interpreters a new dictionary is built in which every key has been
    encoded as UTF-8; the values are carried over unchanged.

    :param dict data: The dictionary whose keys may need encoding.
    :rtype: dict
    """
    if sys.version_info >= (2, 7):
        return data
    # dict() over a generator rather than a dict comprehension, since
    # this branch only runs on interpreters older than 2.7.
    return dict((key.encode('utf8'), data[key]) for key in data)
Actually commit file of byte and hash utilities. 2012-07-31 02:29:33 +00:00			`import sys`
			`import hashlib`


			`def unicode(text):`
			`if sys.version_info < (3, 0):`
Fix unicode conversion utility. 2012-08-10 19:41:29 +00:00			`if isinstance(text, str):`
			`text = text.decode('utf-8')`
Actually commit file of byte and hash utilities. 2012-07-31 02:29:33 +00:00			`import __builtin__`
			`return __builtin__.unicode(text)`
Fix unicode conversion in Python3 2012-12-18 18:33:14 +00:00			`elif not isinstance(text, str):`
			`return text.decode('utf-8')`
			`else:`
			`return text`
Actually commit file of byte and hash utilities. 2012-07-31 02:29:33 +00:00

			`def bytes(text):`
			`"""`
			`Convert Unicode text to UTF-8 encoded bytes.`

			`Since Python 2.6+ and Python 3+ have similar but incompatible`
			`signatures, this function unifies the two to keep code sane.`

			`:param text: Unicode text to convert to bytes`
			`:rtype: bytes (Python3), str (Python2.6+)`
			`"""`
Fix encoding issue in Python3. 2012-08-01 16:04:41 +00:00			`if text is None:`
			`return b''`

Actually commit file of byte and hash utilities. 2012-07-31 02:29:33 +00:00			`if sys.version_info < (3, 0):`
			`import __builtin__`
			`return __builtin__.bytes(text)`
			`else:`
			`import builtins`
			`if isinstance(text, builtins.bytes):`
			`# We already have bytes, so do nothing`
			`return text`
			`if isinstance(text, list):`
			`# Convert a list of integers to bytes`
			`return builtins.bytes(text)`
			`else:`
			`# Convert UTF-8 text to bytes`
			`return builtins.bytes(text, encoding='utf-8')`


			`def quote(text):`
			`"""`
			`Enclose in quotes and escape internal slashes and double quotes.`

			`:param text: A Unicode or byte string.`
			`"""`
			`text = bytes(text)`
			`return b'"' + text.replace(b'\\', b'\\\\').replace(b'"', b'\\"') + b'"'`


			`def num_to_bytes(num):`
			`"""`
			`Convert an integer into a four byte sequence.`

			`:param integer num: An integer to convert to its byte representation.`
			`"""`
			`bval = b''`
			`bval += bytes(chr(0xFF & (num >> 24)))`
			`bval += bytes(chr(0xFF & (num >> 16)))`
			`bval += bytes(chr(0xFF & (num >> 8)))`
			`bval += bytes(chr(0xFF & (num >> 0)))`
			`return bval`


			`def bytes_to_num(bval):`
			`"""`
			`Convert a four byte sequence to an integer.`

			`:param bytes bval: A four byte sequence to turn into an integer.`
			`"""`
			`num = 0`
			`num += ord(bval[0] << 24)`
			`num += ord(bval[1] << 16)`
			`num += ord(bval[2] << 8)`
			`num += ord(bval[3])`
			`return num`


			`def XOR(x, y):`
			`"""`
			`Return the results of an XOR operation on two equal length byte strings.`

			`:param bytes x: A byte string`
			`:param bytes y: A byte string`
			`:rtype: bytes`
			`"""`
			`result = b''`
			`for a, b in zip(x, y):`
			`if sys.version_info < (3, 0):`
			`result += chr((ord(a) ^ ord(b)))`
			`else:`
			`result += bytes([a ^ b])`
			`return result`


			`def hash(name):`
			`"""`
			`Return a hash function implementing the given algorithm.`

			`:param name: The name of the hashing algorithm to use.`
			`:type name: string`

			`:rtype: function`
			`"""`
			`name = name.lower()`
			`if name.startswith('sha-'):`
			`name = 'sha' + name[4:]`
			`if name in dir(hashlib):`
			`return getattr(hashlib, name)`
			`return None`


			`def hashes():`
			`"""`
			`Return a list of available hashing algorithms.`

			`:rtype: list of strings`
			`"""`
			`t = []`
			`if 'md5' in dir(hashlib):`
			`t = ['MD5']`
			`if 'md2' in dir(hashlib):`
			`t += ['MD2']`
			`hashes = ['SHA-' + h[3:] for h in dir(hashlib) if h.startswith('sha')]`
			`return t + hashes`
added setdefaultencoding method so reload(sys) not needed reload(sys) could cause problem in user code - ie, sys.stdout, excepthook, and displayhook would be reset, etc 2012-10-24 18:27:52 +00:00
Fix things again, this time for python3 2014-06-09 15:28:57 +00:00
added setdefaultencoding method so reload(sys) not needed reload(sys) could cause problem in user code - ie, sys.stdout, excepthook, and displayhook would be reset, etc 2012-10-24 18:27:52 +00:00			`def setdefaultencoding(encoding):`
			`"""`
			`Set the current default string encoding used by the Unicode implementation.`

			`Actually calls sys.setdefaultencoding under the hood - see the docs for that`
			`for more details. This method exists only as a way to call find/call it`
			`even after it has been 'deleted' when the site module is executed.`

			`:param string encoding: An encoding name, compatible with sys.setdefaultencoding`
			`"""`
			`func = getattr(sys, 'setdefaultencoding', None)`
			`if func is None:`
			`import gc`
			`import types`
			`for obj in gc.get_objects():`
			`if (isinstance(obj, types.BuiltinFunctionType)`
			`and obj.__name__ == 'setdefaultencoding'):`
			`func = obj`
			`break`
			`if func is None:`
			`raise RuntimeError("Could not find setdefaultencoding")`
			`sys.setdefaultencoding = func`
Fix unicode conversion in Python3 2012-12-18 18:33:14 +00:00			`return func(encoding)`
Fix things again, this time for python3 2014-06-09 15:28:57 +00:00

			`def safedict(data):`
			`if sys.version_info < (2, 7):`
			`safe = {}`
			`for key in data:`
			`safe[key.encode('utf8')] = data[key]`
			`return safe`
			`else:`
			`return data`