deb-python-cassandra-driver/cassandra/marshal.pyx

# -- cython: profile=True
#
# Copyright 2013-2015 DataStax, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import six
import sys
import struct
import math

from libc.stdint cimport (int8_t, int16_t, int32_t, int64_t,
                          uint8_t, uint16_t, uint32_t, uint64_t)

cdef bint is_little_endian
from cassandra.util import is_little_endian

# cdef extern from "marshal.h":
#     cdef str c_string_to_python(char *p, Py_ssize_t len)

def _make_packer(format_string):
    packer = struct.Struct(format_string)
    pack = packer.pack
    unpack = lambda s: packer.unpack(s)[0]
    return pack, unpack


cdef inline bytes pack(char *buf, Py_ssize_t size):
    """
    Return the first `size` bytes of `buf` as Python bytes, most significant
    byte first.

    Note that `buf` itself is reordered in place (by `swap_order`) before it
    is copied into the returned bytes object.
    """
    cdef bytes packed
    swap_order(buf, size)
    # Slicing a char * with an explicit length copies exactly `size` bytes.
    packed = buf[:size]
    return packed


cdef inline void swap_order(char *buf, Py_ssize_t size):
    """
    Swap the byteorder of `buf` in-place on little-endian platforms
    (reverse the first `size` bytes).  When `is_little_endian` is false the
    buffer is left untouched.

    There are functions ntohl etc, but these may be POSIX-dependent.
    """
    cdef Py_ssize_t i, end
    cdef char c

    if is_little_endian:
        # Exchange mirrored bytes from both ends; the middle byte of an
        # odd-sized buffer stays where it is.
        for i in range(size // 2):
            end = size - i - 1
            c = buf[i]
            buf[i] = buf[end]
            buf[end] = c

### Packing and unpacking of fixed-width integers and floating point numbers

cpdef inline bytes int64_pack(int64_t x):
    """
    Encode the signed 64-bit integer `x` as 8 bytes, most significant byte
    first.
    """
    # `x` is a by-value copy, so reordering its bytes in place is harmless.
    cdef char *raw = <char *> &x
    return pack(raw, 8)

cpdef inline int64_t int64_unpack(const char *buf):
    """
    Decode the first 8 bytes of `buf` as a signed 64-bit integer stored most
    significant byte first.

    The 'const' makes sure the buffer is not mutated in-place: the bytes are
    copied into a local before their order is swapped.  They are copied one
    at a time instead of dereferencing `buf` through an `int64_t *` cast, so
    `buf` does not need to be aligned for an int64_t.

    The length of `buf` cannot be checked here; the caller must supply at
    least 8 readable bytes.
    """
    cdef int64_t x = 0
    cdef char *out = <char *> &x
    cdef Py_ssize_t i

    for i in range(8):
        out[i] = buf[i]
    swap_order(out, 8)
    return x

cpdef inline bytes int32_pack(int32_t x):
    """
    Encode the signed 32-bit integer `x` as 4 bytes, most significant byte
    first.
    """
    # `x` is a by-value copy, so reordering its bytes in place is harmless.
    cdef char *raw = <char *> &x
    return pack(raw, 4)

cpdef inline int32_t int32_unpack(const char *buf):
    """
    Decode the first 4 bytes of `buf` as a signed 32-bit integer stored most
    significant byte first.

    `buf` is never written to: the bytes are copied into a local before
    their order is swapped.  They are copied one at a time instead of
    dereferencing `buf` through an `int32_t *` cast, so `buf` does not need
    to be aligned for an int32_t.

    The length of `buf` cannot be checked here; the caller must supply at
    least 4 readable bytes.
    """
    cdef int32_t x = 0
    cdef char *out = <char *> &x
    cdef Py_ssize_t i

    for i in range(4):
        out[i] = buf[i]
    swap_order(out, 4)
    return x

cpdef inline bytes int16_pack(int16_t x):
    """
    Encode the signed 16-bit integer `x` as 2 bytes, most significant byte
    first.
    """
    # `x` is a by-value copy, so reordering its bytes in place is harmless.
    cdef char *raw = <char *> &x
    return pack(raw, 2)

cpdef inline int16_t int16_unpack(const char *buf):
    """
    Decode the first 2 bytes of `buf` as a signed 16-bit integer stored most
    significant byte first.

    `buf` is never written to: the bytes are copied into a local before
    their order is swapped.  They are copied one at a time instead of
    dereferencing `buf` through an `int16_t *` cast, so `buf` does not need
    to be aligned for an int16_t.

    The length of `buf` cannot be checked here; the caller must supply at
    least 2 readable bytes.
    """
    cdef int16_t x = 0
    cdef char *out = <char *> &x
    cdef Py_ssize_t i

    for i in range(2):
        out[i] = buf[i]
    swap_order(out, 2)
    return x

cpdef inline bytes int8_pack(int8_t x):
    """
    Encode the signed 8-bit integer `x` as a single byte.

    A single byte has no byte order, so no swapping is involved.
    """
    cdef char *raw = <char *> &x
    return raw[:1]

cpdef inline int8_t int8_unpack(const char *buf):
    """
    Decode the first byte of `buf` as a signed 8-bit integer.

    The caller must supply at least 1 readable byte.
    """
    # Reinterpret the byte as int8_t rather than relying on the signedness
    # of plain `char`.
    cdef int8_t *src = <int8_t *> buf
    return src[0]

cpdef inline bytes uint64_pack(uint64_t x):
    """
    Encode the unsigned 64-bit integer `x` as 8 bytes, most significant byte
    first.
    """
    # `x` is a by-value copy, so reordering its bytes in place is harmless.
    cdef char *raw = <char *> &x
    return pack(raw, 8)

cpdef inline uint64_t uint64_unpack(const char *buf):
    """
    Decode the first 8 bytes of `buf` as an unsigned 64-bit integer stored
    most significant byte first.

    `buf` is never written to: the bytes are copied into a local before
    their order is swapped.  They are copied one at a time instead of
    dereferencing `buf` through a `uint64_t *` cast, so `buf` does not need
    to be aligned for a uint64_t.

    The length of `buf` cannot be checked here; the caller must supply at
    least 8 readable bytes.
    """
    cdef uint64_t x = 0
    cdef char *out = <char *> &x
    cdef Py_ssize_t i

    for i in range(8):
        out[i] = buf[i]
    swap_order(out, 8)
    return x

cpdef inline bytes uint32_pack(uint32_t x):
    """
    Encode the unsigned 32-bit integer `x` as 4 bytes, most significant byte
    first.
    """
    # `x` is a by-value copy, so reordering its bytes in place is harmless.
    cdef char *raw = <char *> &x
    return pack(raw, 4)

cpdef inline uint32_t uint32_unpack(const char *buf):
    """
    Decode the first 4 bytes of `buf` as an unsigned 32-bit integer stored
    most significant byte first.

    `buf` is never written to: the bytes are copied into a local before
    their order is swapped.  They are copied one at a time instead of
    dereferencing `buf` through a `uint32_t *` cast, so `buf` does not need
    to be aligned for a uint32_t.

    The length of `buf` cannot be checked here; the caller must supply at
    least 4 readable bytes.
    """
    cdef uint32_t x = 0
    cdef char *out = <char *> &x
    cdef Py_ssize_t i

    for i in range(4):
        out[i] = buf[i]
    swap_order(out, 4)
    return x

cpdef inline bytes uint16_pack(uint16_t x):
    """
    Encode the unsigned 16-bit integer `x` as 2 bytes, most significant byte
    first.
    """
    # `x` is a by-value copy, so reordering its bytes in place is harmless.
    cdef char *raw = <char *> &x
    return pack(raw, 2)

cpdef inline uint16_t uint16_unpack(const char *buf):
    """
    Decode the first 2 bytes of `buf` as an unsigned 16-bit integer stored
    most significant byte first.

    `buf` is never written to: the bytes are copied into a local before
    their order is swapped.  They are copied one at a time instead of
    dereferencing `buf` through a `uint16_t *` cast, so `buf` does not need
    to be aligned for a uint16_t.

    The length of `buf` cannot be checked here; the caller must supply at
    least 2 readable bytes.
    """
    cdef uint16_t x = 0
    cdef char *out = <char *> &x
    cdef Py_ssize_t i

    for i in range(2):
        out[i] = buf[i]
    swap_order(out, 2)
    return x

cpdef inline bytes uint8_pack(uint8_t x):
    """
    Encode the unsigned 8-bit integer `x` as a single byte.
    """
    # Goes through `pack` like the wider types; with a size of 1 there is
    # nothing for it to reorder.
    cdef char *raw = <char *> &x
    return pack(raw, 1)

cpdef inline uint8_t uint8_unpack(const char *buf):
    """
    Decode the first byte of `buf` as an unsigned 8-bit integer.

    The caller must supply at least 1 readable byte.
    """
    # Reinterpret the byte as uint8_t rather than relying on the signedness
    # of plain `char`.
    cdef uint8_t *src = <uint8_t *> buf
    return src[0]

cpdef inline bytes double_pack(double x):
    """
    Encode the 8 bytes of the C double `x`, most significant byte first.
    """
    # `x` is a by-value copy, so reordering its bytes in place is harmless.
    cdef char *raw = <char *> &x
    return pack(raw, 8)

cpdef inline double double_unpack(const char *buf):
    """
    Decode the first 8 bytes of `buf` as a C double stored most significant
    byte first.

    `buf` is never written to: the bytes are copied into a local before
    their order is swapped.  They are copied one at a time instead of
    dereferencing `buf` through a `double *` cast, so `buf` does not need to
    be aligned for a double.

    The length of `buf` cannot be checked here; the caller must supply at
    least 8 readable bytes.
    """
    cdef double x = 0
    cdef char *out = <char *> &x
    cdef Py_ssize_t i

    for i in range(8):
        out[i] = buf[i]
    swap_order(out, 8)
    return x

cpdef inline bytes float_pack(float x):
    """
    Encode the 4 bytes of the C float `x`, most significant byte first.
    """
    # `x` is a by-value copy, so reordering its bytes in place is harmless.
    cdef char *raw = <char *> &x
    return pack(raw, 4)

cpdef inline float float_unpack(const char *buf):
    """
    Decode the first 4 bytes of `buf` as a C float stored most significant
    byte first.

    `buf` is never written to: the bytes are copied into a local before
    their order is swapped.  They are copied one at a time instead of
    dereferencing `buf` through a `float *` cast, so `buf` does not need to
    be aligned for a float.

    The length of `buf` cannot be checked here; the caller must supply at
    least 4 readable bytes.
    """
    cdef float x = 0
    cdef char *out = <char *> &x
    cdef Py_ssize_t i

    for i in range(4):
        out[i] = buf[i]
    swap_order(out, 4)
    return x

# int64_pack, int64_unpack = _make_packer('>q')
# int32_pack, int32_unpack = _make_packer('>i')
# int16_pack, int16_unpack = _make_packer('>h')
# int8_pack, int8_unpack = _make_packer('>b')
# uint64_pack, uint64_unpack = _make_packer('>Q')
# uint32_pack, uint32_unpack = _make_packer('>I')
# uint16_pack, uint16_unpack = _make_packer('>H')
# uint8_pack, uint8_unpack = _make_packer('>B')
# float_pack, float_unpack = _make_packer('>f')
# double_pack, double_unpack = _make_packer('>d')

# Special case for the cassandra header: four one-byte fields in big-endian
# layout, the third of which is signed.
header_struct = struct.Struct('>BBbB')
header_pack, header_unpack = header_struct.pack, header_struct.unpack

# In protocol version 3 and higher the stream ID is two bytes, so the third
# field widens to a signed 16-bit integer.
v3_header_struct = struct.Struct('>BBhB')
v3_header_pack, v3_header_unpack = (v3_header_struct.pack,
                                    v3_header_struct.unpack)


if six.PY3:
    def varint_unpack(term):
        """
        Decode `term`, a big-endian two's-complement byte string, into a
        Python integer.

        Python 3 variant: iterating over and indexing `term` yields integers.
        """
        # Parse all the bytes as one unsigned hexadecimal number first.
        val = int(''.join("%02x" % i for i in term), 16)
        if (term[0] & 128) != 0:
            # The sign bit is set, so subtract 2 ** (8 * len(term)).
            #
            # There is a bug in Cython (0.20 - 0.22), where if we do
            # '1 << (len(term) * 8)' Cython generates '1' directly into the
            # C code, causing integer overflows. Treat it as an object for now
            val -= (<object> 1L) << (len(term) * 8)
        return val
else:
    def varint_unpack(term):  # noqa
        """
        Decode `term`, a big-endian two's-complement byte string, into a
        Python integer.

        Python 2 variant: `term` is a str, so it is hex-encoded directly and
        its first character is converted with ord().
        """
        val = int(term.encode('hex'), 16)
        if (ord(term[0]) & 128) != 0:
            # Same overflow hazard as in the Python 3 variant: force the
            # shift to operate on a Python object instead of a C integer.
            val = val - ((<object> 1L) << (len(term) * 8))
        return val


def bitlength(n):
    """
    Return the number of bits needed to represent the integer `n`.

    Zero and negative values yield 0.  The count is obtained by shifting
    rather than with a floating point logarithm.
    """
    count = 0
    remaining = n
    while remaining > 0:
        remaining = remaining >> 1
        count = count + 1
    return count


def varint_pack(big):
    """
    Encode the integer `big` as a big-endian two's-complement byte string.

    Zero encodes as a single zero byte.  A positive value whose leading byte
    has its high bit set is prefixed with a zero byte so that it is not read
    back as negative.
    """
    if big == 0:
        return b'\x00'

    negative = big < 0
    if negative:
        # Map the value onto its unsigned two's-complement equivalent, using
        # just enough whole bytes to hold it together with its sign bit.
        nbytes = bitlength(abs(big) - 1) // 8 + 1
        big = (1 << nbytes * 8) + big

    # Collect the bytes least significant first, then flip them at the end.
    collected = bytearray()
    while big > 0:
        collected.append(big & 0xff)
        big >>= 8

    if not negative and collected[-1] & 0x80:
        collected.append(0)
    collected.reverse()
    return six.binary_type(collected)