Cythonize marshalling code

This commit is contained in:
Mark Florisson
2015-07-23 15:45:28 +01:00
parent 8afd853ae9
commit f0b360a9c7
2 changed files with 230 additions and 0 deletions

29
cassandra/marshal.pxd Normal file
View File

@@ -0,0 +1,29 @@
from libc.stdint cimport (int8_t, int16_t, int32_t, int64_t,
uint8_t, uint16_t, uint32_t, uint64_t)
# Declarations of the pack/unpack functions implemented in marshal.pyx.
# Each *_pack takes a C value and returns Python bytes; each *_unpack takes
# a read-only char buffer and returns the corresponding C value.
# Signed integers
cpdef bytes int64_pack(int64_t x)
cpdef bytes int32_pack(int32_t x)
cpdef bytes int16_pack(int16_t x)
cpdef bytes int8_pack(int8_t x)
cpdef int64_t int64_unpack(const char *buf)
cpdef int32_t int32_unpack(const char *buf)
cpdef int16_t int16_unpack(const char *buf)
cpdef int8_t int8_unpack(const char *buf)
# Unsigned integers
cpdef bytes uint64_pack(uint64_t x)
cpdef bytes uint32_pack(uint32_t x)
cpdef bytes uint16_pack(uint16_t x)
cpdef bytes uint8_pack(uint8_t x)
cpdef uint64_t uint64_unpack(const char *buf)
cpdef uint32_t uint32_unpack(const char *buf)
cpdef uint16_t uint16_unpack(const char *buf)
cpdef uint8_t uint8_unpack(const char *buf)
# Floating point
cpdef bytes double_pack(double x)
cpdef bytes float_pack(float x)
cpdef double double_unpack(const char *buf)
cpdef float float_unpack(const char *buf)

201
cassandra/marshal.pyx Normal file
View File

@@ -0,0 +1,201 @@
# cython: profile=True
# Copyright 2013-2015 DataStax, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import math
import struct
import sys

import six

from libc.stdint cimport (int8_t, int16_t, int32_t, int64_t,
                          uint8_t, uint16_t, uint32_t, uint64_t)
from libc.string cimport memcpy
# Sanity check on the interpreter-reported byte order, then record whether
# this host is little-endian; pack() consults this flag to decide whether
# bytes must be reversed.
assert sys.byteorder in ('little', 'big')
is_little_endian = (sys.byteorder == 'little')
# cdef extern from "marshal.h":
# cdef str c_string_to_python(char *p, Py_ssize_t len)
def _make_packer(format_string):
    """
    Build a (pack, unpack) pair for a single-value struct format.

    `pack` is the bound ``Struct.pack`` for `format_string`; `unpack`
    returns only the first element of the tuple ``Struct.unpack`` yields.
    """
    compiled = struct.Struct(format_string)

    def unpack(s):
        return compiled.unpack(s)[0]

    return compiled.pack, unpack
cdef inline bytes pack(char *buf, Py_ssize_t size):
    """
    Return the first `size` bytes of `buf` as Python bytes.

    On a little-endian host the bytes are reversed first. Note that the
    reversal happens in place, so `buf` itself is modified.
    """
    cdef bytes packed
    if is_little_endian:
        swap_order(buf, size)
    # Slicing a char * with an explicit length copies exactly `size` bytes.
    packed = buf[:size]
    return packed
cdef inline swap_order(char *buf, Py_ssize_t size):
    """
    Reverse the first `size` bytes of `buf` in place.

    Hand-rolled rather than using ntohl() and friends, because those may
    be POSIX-dependent.
    """
    # Declare the loop index as a C integer so the loop below is a plain
    # C for-loop instead of iterating over Python objects.
    cdef Py_ssize_t i, end
    cdef char c
    # `//` keeps the bound an integer whatever division semantics the
    # module is compiled with; `/` would yield a float under true division.
    for i in range(size // 2):
        end = size - i - 1
        c = buf[i]
        buf[i] = buf[end]
        buf[end] = c
### Packing and unpacking of signed integers
cpdef inline bytes int64_pack(int64_t x):
    """Serialize the signed 64-bit integer `x` to 8 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes in place.
    cdef char *raw = <char *> &x
    return pack(raw, sizeof(int64_t))
cpdef inline int64_t int64_unpack(const char *buf):
    """
    Decode the first 8 bytes of `buf` as a big-endian signed 64-bit integer.

    `buf` is const and is never mutated: the bytes are copied into a local
    before any reordering. `buf` must point to at least 8 readable bytes;
    that is not checked here.
    """
    cdef int64_t x
    # Copy rather than dereference a casted pointer: `buf` carries no
    # alignment guarantee for int64_t.
    memcpy(&x, buf, sizeof(int64_t))
    # Only a little-endian host needs the reversal, mirroring pack().
    if is_little_endian:
        swap_order(<char *> &x, sizeof(int64_t))
    return x
cpdef inline bytes int32_pack(int32_t x):
    """Serialize the signed 32-bit integer `x` to 4 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes in place.
    cdef char *raw = <char *> &x
    return pack(raw, sizeof(int32_t))
cpdef inline int32_t int32_unpack(const char *buf):
    """
    Decode the first 4 bytes of `buf` as a big-endian signed 32-bit integer.

    `buf` is never mutated and must point to at least 4 readable bytes;
    that is not checked here.
    """
    cdef int32_t x
    # Copy rather than dereference a casted pointer: `buf` carries no
    # alignment guarantee for int32_t.
    memcpy(&x, buf, sizeof(int32_t))
    # Only a little-endian host needs the reversal, mirroring pack().
    if is_little_endian:
        swap_order(<char *> &x, sizeof(int32_t))
    return x
cpdef inline bytes int16_pack(int16_t x):
    """Serialize the signed 16-bit integer `x` to 2 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes in place.
    cdef char *raw = <char *> &x
    return pack(raw, sizeof(int16_t))
cpdef inline int16_t int16_unpack(const char *buf):
    """
    Decode the first 2 bytes of `buf` as a big-endian signed 16-bit integer.

    `buf` is never mutated and must point to at least 2 readable bytes;
    that is not checked here.
    """
    cdef int16_t x
    # Copy rather than dereference a casted pointer: `buf` carries no
    # alignment guarantee for int16_t.
    memcpy(&x, buf, sizeof(int16_t))
    # Only a little-endian host needs the reversal, mirroring pack().
    if is_little_endian:
        swap_order(<char *> &x, sizeof(int16_t))
    return x
cpdef inline bytes int8_pack(int8_t x):
    """Serialize the signed 8-bit integer `x` to a single byte."""
    # A single byte has no byte order, so no swapping is involved.
    cdef char *raw = <char *> &x
    return raw[:1]
cpdef inline int8_t int8_unpack(const char *buf):
    """Read the first byte of `buf` as a signed 8-bit integer."""
    cdef int8_t *view = <int8_t *> buf
    return view[0]
cpdef inline bytes uint64_pack(uint64_t x):
    """Serialize the unsigned 64-bit integer `x` to 8 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes in place.
    cdef char *raw = <char *> &x
    return pack(raw, sizeof(uint64_t))
cpdef inline uint64_t uint64_unpack(const char *buf):
    """
    Decode the first 8 bytes of `buf` as a big-endian unsigned 64-bit integer.

    `buf` is never mutated and must point to at least 8 readable bytes;
    that is not checked here.
    """
    cdef uint64_t x
    # Copy rather than dereference a casted pointer: `buf` carries no
    # alignment guarantee for uint64_t.
    memcpy(&x, buf, sizeof(uint64_t))
    # Only a little-endian host needs the reversal, mirroring pack().
    if is_little_endian:
        swap_order(<char *> &x, sizeof(uint64_t))
    return x
cpdef inline bytes uint32_pack(uint32_t x):
    """Serialize the unsigned 32-bit integer `x` to 4 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes in place.
    cdef char *raw = <char *> &x
    return pack(raw, sizeof(uint32_t))
cpdef inline uint32_t uint32_unpack(const char *buf):
    """
    Decode the first 4 bytes of `buf` as a big-endian unsigned 32-bit integer.

    `buf` is never mutated and must point to at least 4 readable bytes;
    that is not checked here.
    """
    cdef uint32_t x
    # Copy rather than dereference a casted pointer: `buf` carries no
    # alignment guarantee for uint32_t.
    memcpy(&x, buf, sizeof(uint32_t))
    # Only a little-endian host needs the reversal, mirroring pack().
    if is_little_endian:
        swap_order(<char *> &x, sizeof(uint32_t))
    return x
cpdef inline bytes uint16_pack(uint16_t x):
    """Serialize the unsigned 16-bit integer `x` to 2 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes in place.
    cdef char *raw = <char *> &x
    return pack(raw, sizeof(uint16_t))
cpdef inline uint16_t uint16_unpack(const char *buf):
    """
    Decode the first 2 bytes of `buf` as a big-endian unsigned 16-bit integer.

    `buf` is never mutated and must point to at least 2 readable bytes;
    that is not checked here.
    """
    cdef uint16_t x
    # Copy rather than dereference a casted pointer: `buf` carries no
    # alignment guarantee for uint16_t.
    memcpy(&x, buf, sizeof(uint16_t))
    # Only a little-endian host needs the reversal, mirroring pack().
    if is_little_endian:
        swap_order(<char *> &x, sizeof(uint16_t))
    return x
cpdef inline bytes uint8_pack(uint8_t x):
    """Serialize the unsigned 8-bit integer `x` to a single byte via pack()."""
    cdef char *raw = <char *> &x
    return pack(raw, 1)
cpdef inline uint8_t uint8_unpack(const char *buf):
    """Read the first byte of `buf` as an unsigned 8-bit integer."""
    cdef uint8_t *view = <uint8_t *> buf
    return view[0]
cpdef inline bytes double_pack(double x):
    """Serialize the C double `x` to 8 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes in place.
    cdef char *raw = <char *> &x
    return pack(raw, 8)
cpdef inline double double_unpack(const char *buf):
    """
    Decode the first 8 bytes of `buf` as a big-endian C double.

    `buf` is never mutated and must point to at least 8 readable bytes;
    that is not checked here.
    """
    cdef double x
    # Copy rather than dereference a casted pointer: `buf` carries no
    # alignment guarantee for double.
    memcpy(&x, buf, 8)
    # Only a little-endian host needs the reversal, mirroring pack().
    if is_little_endian:
        swap_order(<char *> &x, 8)
    return x
cpdef inline bytes float_pack(float x):
    """Serialize the C float `x` to 4 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes in place.
    cdef char *raw = <char *> &x
    return pack(raw, 4)
cpdef inline float float_unpack(const char *buf):
    """
    Decode the first 4 bytes of `buf` as a big-endian C float.

    `buf` is never mutated and must point to at least 4 readable bytes;
    that is not checked here.
    """
    cdef float x
    # Copy rather than dereference a casted pointer: `buf` carries no
    # alignment guarantee for float.
    memcpy(&x, buf, 4)
    # Only a little-endian host needs the reversal, mirroring pack().
    if is_little_endian:
        swap_order(<char *> &x, 4)
    return x
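# struct-based definitions of the same names (big-endian formats), kept
# commented out for reference:
# int64_pack, int64_unpack = _make_packer('>q')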
# int32_pack, int32_unpack = _make_packer('>i')
# int16_pack, int16_unpack = _make_packer('>h')
# int8_pack, int8_unpack = _make_packer('>b')
# uint64_pack, uint64_unpack = _make_packer('>Q')
# uint32_pack, uint32_unpack = _make_packer('>I')
# uint16_pack, uint16_unpack = _make_packer('>H')
# uint8_pack, uint8_unpack = _make_packer('>B')
# float_pack, float_unpack = _make_packer('>f')
# double_pack, double_unpack = _make_packer('>d')
# Special case for the Cassandra header: four one-byte fields in big-endian
# layout (unsigned, unsigned, signed, unsigned).
header_struct = struct.Struct('>BBbB')
header_pack, header_unpack = header_struct.pack, header_struct.unpack
# In protocol version 3 and higher the stream ID is two bytes, so the third
# field widens from a signed byte to a signed 16-bit integer.
v3_header_struct = struct.Struct('>BBhB')
v3_header_pack, v3_header_unpack = v3_header_struct.pack, v3_header_struct.unpack
if six.PY3:
    def varint_unpack(term):
        """
        Decode `term`, a big-endian two's-complement byte string, to an int.

        `term` must be non-empty; an empty value makes int('', 16) raise
        ValueError.
        """
        val = int(''.join("%02x" % i for i in term), 16)
        if (term[0] & 128) != 0:
            # There is a bug in Cython (0.20 - 0.22), where if we do
            # '1 << (len(term) * 8)' Cython generates '1' directly into the
            # C code, causing integer overflows. Treat it as an object for now
            val -= (<object> 1L) << (len(term) * 8)
        return val
else:
    def varint_unpack(term):  # noqa
        """
        Decode `term`, a big-endian two's-complement byte string, to an int.

        `term` must be non-empty; an empty value makes int('', 16) raise
        ValueError.
        """
        val = int(term.encode('hex'), 16)
        if (ord(term[0]) & 128) != 0:
            # Same Cython (0.20 - 0.22) issue as in the Python 3 branch:
            # a bare '1 << (len(term) * 8)' is emitted as C integer
            # arithmetic and overflows, so force the shift onto an object.
            val -= (<object> 1L) << (len(term) * 8)
        return val
def bitlength(n):
    """
    Count how many right shifts it takes to bring `n` down to zero.

    For a positive integer this is the number of bits in its binary
    representation; zero and negative values give 0.
    """
    # return int(math.log2(n)) + 1
    count = 0
    while n > 0:
        count += 1
        n >>= 1
    return count
def varint_pack(big):
    """
    Encode the integer `big` as a big-endian two's-complement byte string.

    Zero encodes as a single zero byte. A positive value whose leading byte
    has its top bit set gets an extra zero byte in front so it is not read
    back as negative.
    """
    if big == 0:
        return b'\x00'
    is_negative = big < 0
    if is_negative:
        # Smallest byte count whose two's-complement range holds `big`,
        # then shift `big` into that range's unsigned representation.
        nbytes = bitlength(abs(big) - 1) // 8 + 1
        big = (1 << nbytes * 8) + big
    # Collect bytes least-significant first.
    octets = bytearray()
    while big > 0:
        octets.append(big & 0xff)
        big >>= 8
    if not is_negative and octets[-1] & 0x80:
        octets.append(0)
    return six.binary_type(octets[::-1])