123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237 |
- # Copyright (C) 2009 Internet Systems Consortium.
- #
- # Permission to use, copy, modify, and distribute this software for any
- # purpose with or without fee is hereby granted, provided that the above
- # copyright notice and this permission notice appear in all copies.
- #
- # THE SOFTWARE IS PROVIDED "AS IS" AND INTERNET SYSTEMS CONSORTIUM
- # DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL
- # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL
- # INTERNET SYSTEMS CONSORTIUM BE LIABLE FOR ANY SPECIAL, DIRECT,
- # INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING
- # FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT,
- # NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION
- # WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
- import sys
- import struct
class DecodeError(Exception):
    """Raised by the decode functions when wire data cannot be decoded."""
- PROTOCOL_VERSION = 0x536b616e
- _ITEM_BLOB = 0x01
- _ITEM_HASH = 0x02
- _ITEM_LIST = 0x03
- _ITEM_NULL = 0x04
- _ITEM_BOOL = 0x05
- _ITEM_INT = 0x06
- _ITEM_REAL = 0x07
- _ITEM_UTF8 = 0x08
- _ITEM_MASK = 0x0f
- _ITEM_LENGTH_32 = 0x00
- _ITEM_LENGTH_16 = 0x10
- _ITEM_LENGTH_8 = 0x20
- _ITEM_LENGTH_MASK = 0x30
def to_wire(items):
    """Encode a dict into wire format.

    The result is PROTOCOL_VERSION packed as a 4-byte big-endian integer,
    followed by the encoding of ``items`` produced by _encode_hash().

    >>> to_wire({"a": "b"})[:4]
    b'Skan'
    >>> from_wire(to_wire({"a": "b"}))
    {'a': 'b'}
    """
    return struct.pack(">I", PROTOCOL_VERSION) + _encode_hash(items)
- def _encode_tag(tag):
- """Encode a single UTF-8 tag.
- ... wire_partial = Message._encode_tag('this')
- """
- binary = bytes(tag, 'utf-8')
- if len(binary) > 255:
- raise ArgumentError("tag is too long (max 255 encoded bytes)")
- return(struct.pack(">B", len(binary))) + binary
def _encode_length_and_type(data, datatype):
    """Prefix ``data`` with its type/length byte and length field.

    If ``data`` is None, only the single _ITEM_NULL type byte is returned
    and ``datatype`` is ignored. Otherwise the smallest length field that
    can hold ``len(data)`` is chosen (8, 16 or 32 bits, big-endian), the
    matching _ITEM_LENGTH_* flag is OR-ed into ``datatype``, and the result
    is header + data.
    """
    if data is None:
        return struct.pack(">B", _ITEM_NULL)

    length = len(data)
    if length < 0x100:
        header = struct.pack(">BB", datatype | _ITEM_LENGTH_8, length)
    elif length < 0x10000:
        header = struct.pack(">BH", datatype | _ITEM_LENGTH_16, length)
    else:
        header = struct.pack(">BI", datatype | _ITEM_LENGTH_32, length)
    return header + data
def _pack_utf8(item):
    """Encode a string as UTF-8 and prepend its type/length prefix."""
    encoded = bytes(item, 'utf-8')
    return _encode_length_and_type(encoded, _ITEM_UTF8)
def _pack_blob(item):
    """Prepend the blob type/length prefix to raw binary data."""
    packed = _encode_length_and_type(item, _ITEM_BLOB)
    return packed
def _pack_bool(item):
    """Encode a bool via _encode_bool() and prepend its type/length prefix."""
    encoded = _encode_bool(item)
    return _encode_length_and_type(encoded, _ITEM_BOOL)
def _pack_int(item):
    """Encode an integer as its decimal text and prepend the type/length prefix."""
    text = str(item)
    return _encode_length_and_type(text.encode('utf-8'), _ITEM_INT)
def _pack_real(item):
    """Encode a real (float) as its str() text and prepend the type/length prefix."""
    text = str(item)
    return _encode_length_and_type(text.encode('utf-8'), _ITEM_REAL)
def _pack_array(item):
    """Encode a list via _encode_array() and prepend its type/length prefix."""
    encoded = _encode_array(item)
    return _encode_length_and_type(encoded, _ITEM_LIST)
def _pack_hash(item):
    """Encode a dict via _encode_hash() and prepend its type/length prefix."""
    return _encode_length_and_type(_encode_hash(item), _ITEM_HASH)
def _pack_nil():
    """Return the encoding of a nil (NULL, None) item."""
    # With data=None the helper emits only the NULL type byte.
    return _encode_length_and_type(data=None, datatype=None)
def _encode_item(item):
    """Encode one value, choosing the wire type from its Python type.

    None -> nil, bool -> bool, int -> int, float -> real, dict -> hash,
    list -> list, bytes/bytearray -> blob. Anything else is converted with
    str() and encoded as UTF-8 text.
    """
    if item is None:
        return _pack_nil()

    # Exact type matching is kept from the original: bool must not be
    # treated as int, and subclasses of the listed types continue to fall
    # through to the str() branch as before.
    kind = type(item)
    if kind is bool:
        return _pack_bool(item)
    if kind is int:
        return _pack_int(item)
    if kind is float:
        return _pack_real(item)
    if kind is dict:
        return _pack_hash(item)
    if kind is list:
        return _pack_array(item)
    if kind in (bytes, bytearray):
        return _pack_blob(item)
    return _pack_utf8(str(item))
- def _encode_bool(item):
- """Encode a boolean value into a bytearray of one byte (0=false)"""
- if item:
- return b'1'
- else:
- return b'0'
def _encode_array(item):
    """Encode an array by concatenating the encoding of each element.

    Each element is encoded recursively with _encode_item(). An empty
    iterable yields empty bytes.
    """
    # join() builds the result in one pass instead of re-copying the
    # accumulated bytes on every +=.
    return b"".join(_encode_item(element) for element in item)
def _encode_hash(item):
    """Encode a hash as a sequence of (tag, item) pairs.

    For every key/value pair of ``item`` (in ``item.items()`` order) the key
    is encoded with _encode_tag() and the value recursively with
    _encode_item(). An empty dict yields empty bytes.
    """
    parts = []
    for key, value in item.items():
        parts.append(_encode_tag(key))
        parts.append(_encode_item(value))
    # Single join avoids re-copying the accumulated bytes on every +=.
    return b"".join(parts)
- #
- # decode methods
- #
def from_wire(data):
    """Decode a wire-format message into a dict.

    ``data`` must start with PROTOCOL_VERSION as a 4-byte big-endian
    integer; the remainder is decoded with _decode_hash().

    Raises DecodeError if ``data`` is shorter than the version field or the
    version does not match PROTOCOL_VERSION.
    """
    # Only the 4-byte version is mandatory: to_wire({}) produces exactly
    # 4 bytes, and an empty remainder decodes to an empty dict.
    if len(data) < 4:
        raise DecodeError("Data is too short to decode")
    wire_version, data = data[0:4], data[4:]
    wire_version = struct.unpack(">I", wire_version)[0]
    if wire_version != PROTOCOL_VERSION:
        raise DecodeError("Incorrect protocol version")
    return _decode_hash(data)
- def _decode_tag(data):
- if len(data) < 1:
- raise DecodeError("Data underrun while decoding")
- length = data[0]
- if len(data) - 1 < length:
- raise DecodeError("Data underrun while decoding")
- return [data[1:length + 1].decode(), data[length + 1:]]
def _decode_item(data):
    """Decode one item from the front of ``data``.

    The first byte carries the item type (masked with _ITEM_MASK) and the
    width of the length field (masked with _ITEM_LENGTH_MASK). A NULL item
    consists of that byte alone; every other type is followed by a length
    field and that many payload bytes.

    Returns a tuple ``(value, remaining_data)``.

    Raises DecodeError on data underrun, on an unrecognised length format,
    or on an unknown item type.
    """
    if len(data) < 1:
        raise DecodeError("Data underrun while decoding")
    type_and_length_format = data[0]
    item_type = type_and_length_format & _ITEM_MASK
    length_format = type_and_length_format & _ITEM_LENGTH_MASK

    # NULL has no length field and no payload.
    if item_type == _ITEM_NULL:
        return (None, data[1:])

    if length_format == _ITEM_LENGTH_8:
        if len(data) - 1 < 1:
            raise DecodeError("Data underrun while decoding")
        length = data[1]
        data = data[2:]
    elif length_format == _ITEM_LENGTH_16:
        if len(data) - 1 < 2:
            raise DecodeError("Data underrun while decoding")
        length = struct.unpack(">H", data[1:3])[0]
        data = data[3:]
    elif length_format == _ITEM_LENGTH_32:
        if len(data) - 1 < 4:
            raise DecodeError("Data underrun while decoding")
        length = struct.unpack(">I", data[1:5])[0]
        data = data[5:]
    else:
        # Both length bits set matches none of the defined formats; without
        # this branch ``length`` would be unbound and malformed input would
        # surface as UnboundLocalError instead of DecodeError.
        raise DecodeError("Unknown length format in decode: %02x"
                          % length_format)

    if len(data) < length:
        raise DecodeError("Data underrun while decoding")
    item = data[0:length]
    data = data[length:]

    if item_type == _ITEM_BLOB:
        value = item
    elif item_type == _ITEM_BOOL:
        value = _decode_bool(item)
    elif item_type == _ITEM_INT:
        value = _decode_int(item)
    elif item_type == _ITEM_REAL:
        value = _decode_real(item)
    elif item_type == _ITEM_UTF8:
        value = str(item, 'utf-8')
    elif item_type == _ITEM_HASH:
        value = _decode_hash(item)
    elif item_type == _ITEM_LIST:
        value = _decode_array(item)
    else:
        raise DecodeError("Unknown item type in decode: %02x" % item_type)

    return (value, data)
- def _decode_bool(data):
- return data == b'1'
- def _decode_int(data):
- return int(str(data, 'utf-8'))
- def _decode_real(data):
- return float(str(data, 'utf-8'))
- def _decode_hash(data):
- ret = {}
- while len(data) > 0:
- tag, data = _decode_tag(data)
- value, data = _decode_item(data)
- ret[tag] = value
- return ret
- def _decode_array(data):
- ret = []
- while len(data) > 0:
- value, data = _decode_item(data)
- ret.append(value)
- return ret
if __name__ == "__main__":
    # When executed as a script, run the doctests embedded in this module.
    from doctest import testmod
    testmod()
|