Cythonize marshalling code
This commit is contained in:
29
cassandra/marshal.pxd
Normal file
29
cassandra/marshal.pxd
Normal file
@@ -0,0 +1,29 @@
|
||||
from libc.stdint cimport (int8_t, int16_t, int32_t, int64_t,
|
||||
uint8_t, uint16_t, uint32_t, uint64_t)
|
||||
|
||||
# Declarations for the fixed-width (un)marshalling helpers implemented in
# marshal.pyx.  Every *_pack function returns the value as `bytes`; every
# *_unpack function reads from the start of a C character buffer.

# Signed integers -> bytes
cpdef bytes int64_pack(int64_t x)
cpdef bytes int32_pack(int32_t x)
cpdef bytes int16_pack(int16_t x)
cpdef bytes int8_pack(int8_t x)

# bytes -> signed integers
cpdef int64_t int64_unpack(const char *buf)
cpdef int32_t int32_unpack(const char *buf)
cpdef int16_t int16_unpack(const char *buf)
cpdef int8_t int8_unpack(const char *buf)

# Unsigned integers -> bytes
cpdef bytes uint64_pack(uint64_t x)
cpdef bytes uint32_pack(uint32_t x)
cpdef bytes uint16_pack(uint16_t x)
cpdef bytes uint8_pack(uint8_t x)

# bytes -> unsigned integers
cpdef uint64_t uint64_unpack(const char *buf)
cpdef uint32_t uint32_unpack(const char *buf)
cpdef uint16_t uint16_unpack(const char *buf)
cpdef uint8_t uint8_unpack(const char *buf)

# Floating point -> bytes
cpdef bytes double_pack(double x)
cpdef bytes float_pack(float x)

# bytes -> floating point
cpdef double double_unpack(const char *buf)
cpdef float float_unpack(const char *buf)
|
||||
|
||||
201
cassandra/marshal.pyx
Normal file
201
cassandra/marshal.pyx
Normal file
@@ -0,0 +1,201 @@
|
||||
# cython: profile=True
|
||||
# Copyright 2013-2015 DataStax, Inc.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
import six
|
||||
import sys
|
||||
import struct
|
||||
import math
|
||||
|
||||
from libc.stdint cimport (int8_t, int16_t, int32_t, int64_t,
|
||||
uint8_t, uint16_t, uint32_t, uint64_t)
|
||||
|
||||
# The byte-swapping helpers in this module only distinguish these two host
# byte orders, so fail at import time on anything else.
assert sys.byteorder in ('little', 'big')
# True when the host is little-endian; consulted by pack() to decide whether
# the in-memory representation has to be reversed.
is_little_endian = sys.byteorder == 'little'
|
||||
|
||||
# cdef extern from "marshal.h":
|
||||
# cdef str c_string_to_python(char *p, Py_ssize_t len)
|
||||
|
||||
def _make_packer(format_string):
    """
    Build a (pack, unpack) pair of callables for a `struct` format string.

    `pack` is the bound `Struct.pack` method; `unpack` returns only the first
    element of the tuple produced by `Struct.unpack`.
    """
    compiled = struct.Struct(format_string)

    def unpack(s):
        return compiled.unpack(s)[0]

    return compiled.pack, unpack
|
||||
|
||||
|
||||
cdef inline bytes pack(char *buf, Py_ssize_t size):
    """
    Return the first `size` bytes of `buf` as Python bytes.

    On little-endian hosts the bytes of `buf` are reversed in place first,
    so the caller's buffer is modified.
    """
    if not is_little_endian:
        return buf[:size]
    swap_order(buf, size)
    return buf[:size]
|
||||
|
||||
|
||||
cdef inline void swap_order(char *buf, Py_ssize_t size):
    """
    Swap the byteorder of `buf` in-place (reverse all the bytes).

    There are functions ntohl etc, but these may be POSIX-dependent.

    Buffers of `size` 0 or 1 are left untouched.
    """
    # Both cursors are typed C integers so the loop compiles to plain C
    # instead of going through Python objects, and no division is needed.
    cdef Py_ssize_t start = 0
    cdef Py_ssize_t end = size - 1
    cdef char c
    while start < end:
        c = buf[start]
        buf[start] = buf[end]
        buf[end] = c
        start += 1
        end -= 1
|
||||
|
||||
### Packing and unpacking of signed integers
|
||||
|
||||
cpdef inline bytes int64_pack(int64_t x):
    """Serialize a signed 64-bit integer into 8 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes freely.
    cdef char *raw = <char *> &x
    return pack(raw, 8)
|
||||
|
||||
cpdef inline int64_t int64_unpack(const char *buf):
    """
    Decode the first 8 bytes of `buf` as a signed 64-bit integer.

    No length check is performed: `buf` must hold at least 8 readable bytes.
    """
    # The 'const' makes sure the buffer is not mutated in-place: the value is
    # copied into a local and only that copy is reordered.
    cdef int64_t x = (<int64_t *> buf)[0]
    # Reverse only on little-endian hosts, mirroring pack(); an unconditional
    # swap would corrupt the value on big-endian machines.
    if is_little_endian:
        swap_order(<char *> &x, 8)
    return x
|
||||
|
||||
cpdef inline bytes int32_pack(int32_t x):
    """Serialize a signed 32-bit integer into 4 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes freely.
    cdef char *raw = <char *> &x
    return pack(raw, 4)
|
||||
|
||||
cpdef inline int32_t int32_unpack(const char *buf):
    """
    Decode the first 4 bytes of `buf` as a signed 32-bit integer.

    No length check is performed: `buf` must hold at least 4 readable bytes.
    """
    # Work on a local copy so the caller's buffer is never modified.
    cdef int32_t x = (<int32_t *> buf)[0]
    # Reverse only on little-endian hosts, mirroring pack(); an unconditional
    # swap would corrupt the value on big-endian machines.
    if is_little_endian:
        swap_order(<char *> &x, 4)
    return x
|
||||
|
||||
cpdef inline bytes int16_pack(int16_t x):
    """Serialize a signed 16-bit integer into 2 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes freely.
    cdef char *raw = <char *> &x
    return pack(raw, 2)
|
||||
|
||||
cpdef inline int16_t int16_unpack(const char *buf):
    """
    Decode the first 2 bytes of `buf` as a signed 16-bit integer.

    No length check is performed: `buf` must hold at least 2 readable bytes.
    """
    # Work on a local copy so the caller's buffer is never modified.
    cdef int16_t x = (<int16_t *> buf)[0]
    # Reverse only on little-endian hosts, mirroring pack(); an unconditional
    # swap would corrupt the value on big-endian machines.
    if is_little_endian:
        swap_order(<char *> &x, 2)
    return x
|
||||
|
||||
cpdef inline bytes int8_pack(int8_t x):
    """Serialize a signed 8-bit integer into a single byte."""
    # A single byte has no byte order, so no swapping is involved.
    cdef char *raw = <char *> &x
    return raw[:1]
|
||||
|
||||
cpdef inline int8_t int8_unpack(const char *buf):
    """Read the first byte of `buf` as a signed 8-bit integer."""
    cdef const int8_t *view = <const int8_t *> buf
    return view[0]
|
||||
|
||||
cpdef inline bytes uint64_pack(uint64_t x):
    """Serialize an unsigned 64-bit integer into 8 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes freely.
    cdef char *raw = <char *> &x
    return pack(raw, 8)
|
||||
|
||||
cpdef inline uint64_t uint64_unpack(const char *buf):
    """
    Decode the first 8 bytes of `buf` as an unsigned 64-bit integer.

    No length check is performed: `buf` must hold at least 8 readable bytes.
    """
    # Work on a local copy so the caller's buffer is never modified.
    cdef uint64_t x = (<uint64_t *> buf)[0]
    # Reverse only on little-endian hosts, mirroring pack(); an unconditional
    # swap would corrupt the value on big-endian machines.
    if is_little_endian:
        swap_order(<char *> &x, 8)
    return x
|
||||
|
||||
cpdef inline bytes uint32_pack(uint32_t x):
    """Serialize an unsigned 32-bit integer into 4 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes freely.
    cdef char *raw = <char *> &x
    return pack(raw, 4)
|
||||
|
||||
cpdef inline uint32_t uint32_unpack(const char *buf):
    """
    Decode the first 4 bytes of `buf` as an unsigned 32-bit integer.

    No length check is performed: `buf` must hold at least 4 readable bytes.
    """
    # Work on a local copy so the caller's buffer is never modified.
    cdef uint32_t x = (<uint32_t *> buf)[0]
    # Reverse only on little-endian hosts, mirroring pack(); an unconditional
    # swap would corrupt the value on big-endian machines.
    if is_little_endian:
        swap_order(<char *> &x, 4)
    return x
|
||||
|
||||
cpdef inline bytes uint16_pack(uint16_t x):
    """Serialize an unsigned 16-bit integer into 2 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes freely.
    cdef char *raw = <char *> &x
    return pack(raw, 2)
|
||||
|
||||
cpdef inline uint16_t uint16_unpack(const char *buf):
    """
    Decode the first 2 bytes of `buf` as an unsigned 16-bit integer.

    No length check is performed: `buf` must hold at least 2 readable bytes.
    """
    # Work on a local copy so the caller's buffer is never modified.
    cdef uint16_t x = (<uint16_t *> buf)[0]
    # Reverse only on little-endian hosts, mirroring pack(); an unconditional
    # swap would corrupt the value on big-endian machines.
    if is_little_endian:
        swap_order(<char *> &x, 2)
    return x
|
||||
|
||||
cpdef inline bytes uint8_pack(uint8_t x):
    """Serialize an unsigned 8-bit integer into a single byte via pack()."""
    cdef char *raw = <char *> &x
    return pack(raw, 1)
|
||||
|
||||
cpdef inline uint8_t uint8_unpack(const char *buf):
    """Read the first byte of `buf` as an unsigned 8-bit integer."""
    cdef const uint8_t *view = <const uint8_t *> buf
    return view[0]
|
||||
|
||||
cpdef inline bytes double_pack(double x):
    """Serialize a C double into 8 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes freely.
    cdef char *raw = <char *> &x
    return pack(raw, 8)
|
||||
|
||||
cpdef inline double double_unpack(const char *buf):
    """
    Decode the first 8 bytes of `buf` as a C double.

    No length check is performed: `buf` must hold at least 8 readable bytes.
    """
    # Work on a local copy so the caller's buffer is never modified.
    cdef double x = (<double *> buf)[0]
    # Reverse only on little-endian hosts, mirroring pack(); an unconditional
    # swap would corrupt the value on big-endian machines.
    if is_little_endian:
        swap_order(<char *> &x, 8)
    return x
|
||||
|
||||
cpdef inline bytes float_pack(float x):
    """Serialize a C float into 4 bytes via pack()."""
    # `x` is a by-value copy, so pack() may reorder its bytes freely.
    cdef char *raw = <char *> &x
    return pack(raw, 4)
|
||||
|
||||
cpdef inline float float_unpack(const char *buf):
    """
    Decode the first 4 bytes of `buf` as a C float.

    No length check is performed: `buf` must hold at least 4 readable bytes.
    """
    # Work on a local copy so the caller's buffer is never modified.
    cdef float x = (<float *> buf)[0]
    # Reverse only on little-endian hosts, mirroring pack(); an unconditional
    # swap would corrupt the value on big-endian machines.
    if is_little_endian:
        swap_order(<char *> &x, 4)
    return x
|
||||
|
||||
# int64_pack, int64_unpack = _make_packer('>q')
|
||||
# int32_pack, int32_unpack = _make_packer('>i')
|
||||
# int16_pack, int16_unpack = _make_packer('>h')
|
||||
# int8_pack, int8_unpack = _make_packer('>b')
|
||||
# uint64_pack, uint64_unpack = _make_packer('>Q')
|
||||
# uint32_pack, uint32_unpack = _make_packer('>I')
|
||||
# uint16_pack, uint16_unpack = _make_packer('>H')
|
||||
# uint8_pack, uint8_unpack = _make_packer('>B')
|
||||
# float_pack, float_unpack = _make_packer('>f')
|
||||
# double_pack, double_unpack = _make_packer('>d')
|
||||
|
||||
# Special case for cassandra header
# Format '>BBbB': big-endian; two unsigned bytes, one signed byte and one
# unsigned byte (5 values packed into 4 bytes is not the case here: 4 values,
# 4 bytes).
header_struct = struct.Struct('>BBbB')
header_pack = header_struct.pack
header_unpack = header_struct.unpack

# in protocol version 3 and higher, the stream ID is two bytes
# (the third field is 'h', a signed 16-bit integer, instead of 'b')
v3_header_struct = struct.Struct('>BBhB')
v3_header_pack = v3_header_struct.pack
v3_header_unpack = v3_header_struct.unpack
|
||||
|
||||
|
||||
if six.PY3:
    def varint_unpack(term):
        """
        Decode a big-endian two's-complement byte sequence into an integer.

        Iterating `term` must yield integers (as Python 3 bytes does).
        """
        hex_digits = ''.join("%02x" % octet for octet in term)
        val = int(hex_digits, 16)
        if term[0] & 128:
            # There is a bug in Cython (0.20 - 0.22), where if we do
            # '1 << (len(term) * 8)' Cython generates '1' directly into the
            # C code, causing integer overflows. Treat it as an object for now
            val -= (<object> 1L) << (len(term) * 8)
        return val
else:
    def varint_unpack(term):  # noqa
        """
        Decode a big-endian two's-complement byte string into an integer.

        `term` is a Python 2 str; its hex encoding is parsed as the magnitude.
        """
        val = int(term.encode('hex'), 16)
        # A set top bit in the first byte marks a negative value.
        if ord(term[0]) & 128:
            val = val - (1 << (len(term) * 8))
        return val
|
||||
|
||||
|
||||
def bitlength(n):
    """
    Count how many right shifts by one bit it takes to bring `n` down to zero.

    Returns 0 when `n` is zero or negative.
    """
    bits = 0
    value = n
    while value > 0:
        bits += 1
        value >>= 1
    return bits
|
||||
|
||||
|
||||
def varint_pack(big):
    """
    Encode an integer as a big-endian two's-complement byte string.

    Zero is encoded as a single zero byte. A non-negative value whose top bit
    would be set gets an extra leading zero byte so it is not read as negative.
    """
    if big == 0:
        return b'\x00'

    negative = big < 0
    if negative:
        # Pick the smallest byte width that can hold the value, then map it
        # to its unsigned two's-complement equivalent.
        nbytes = bitlength(abs(big) - 1) // 8 + 1
        big = (1 << nbytes * 8) + big

    # Collect bytes least-significant first; reversed before returning.
    octets = bytearray()
    while big > 0:
        octets.append(big & 0xff)
        big >>= 8

    if not negative and octets[-1] & 0x80:
        octets.append(0)

    octets.reverse()
    return six.binary_type(octets)
|
||||
Reference in New Issue
Block a user