Major fixes and new features
All checks were successful
continuous-integration/drone/push Build is passing
All checks were successful
continuous-integration/drone/push Build is passing
This commit is contained in:
102
venv/lib/python3.12/site-packages/kafka/partitioner/default.py
Normal file
102
venv/lib/python3.12/site-packages/kafka/partitioner/default.py
Normal file
@@ -0,0 +1,102 @@
|
||||
from __future__ import absolute_import
|
||||
|
||||
import random
|
||||
|
||||
from kafka.vendor import six
|
||||
|
||||
|
||||
class DefaultPartitioner(object):
|
||||
"""Default partitioner.
|
||||
|
||||
Hashes key to partition using murmur2 hashing (from java client)
|
||||
If key is None, selects partition randomly from available,
|
||||
or from all partitions if none are currently available
|
||||
"""
|
||||
@classmethod
|
||||
def __call__(cls, key, all_partitions, available):
|
||||
"""
|
||||
Get the partition corresponding to key
|
||||
:param key: partitioning key
|
||||
:param all_partitions: list of all partitions sorted by partition ID
|
||||
:param available: list of available partitions in no particular order
|
||||
:return: one of the values from all_partitions or available
|
||||
"""
|
||||
if key is None:
|
||||
if available:
|
||||
return random.choice(available)
|
||||
return random.choice(all_partitions)
|
||||
|
||||
idx = murmur2(key)
|
||||
idx &= 0x7fffffff
|
||||
idx %= len(all_partitions)
|
||||
return all_partitions[idx]
|
||||
|
||||
|
||||
# https://github.com/apache/kafka/blob/0.8.2/clients/src/main/java/org/apache/kafka/common/utils/Utils.java#L244
|
||||
def murmur2(data):
|
||||
"""Pure-python Murmur2 implementation.
|
||||
|
||||
Based on java client, see org.apache.kafka.common.utils.Utils.murmur2
|
||||
|
||||
Args:
|
||||
data (bytes): opaque bytes
|
||||
|
||||
Returns: MurmurHash2 of data
|
||||
"""
|
||||
# Python2 bytes is really a str, causing the bitwise operations below to fail
|
||||
# so convert to bytearray.
|
||||
if six.PY2:
|
||||
data = bytearray(bytes(data))
|
||||
|
||||
length = len(data)
|
||||
seed = 0x9747b28c
|
||||
# 'm' and 'r' are mixing constants generated offline.
|
||||
# They're not really 'magic', they just happen to work well.
|
||||
m = 0x5bd1e995
|
||||
r = 24
|
||||
|
||||
# Initialize the hash to a random value
|
||||
h = seed ^ length
|
||||
length4 = length // 4
|
||||
|
||||
for i in range(length4):
|
||||
i4 = i * 4
|
||||
k = ((data[i4 + 0] & 0xff) +
|
||||
((data[i4 + 1] & 0xff) << 8) +
|
||||
((data[i4 + 2] & 0xff) << 16) +
|
||||
((data[i4 + 3] & 0xff) << 24))
|
||||
k &= 0xffffffff
|
||||
k *= m
|
||||
k &= 0xffffffff
|
||||
k ^= (k % 0x100000000) >> r # k ^= k >>> r
|
||||
k &= 0xffffffff
|
||||
k *= m
|
||||
k &= 0xffffffff
|
||||
|
||||
h *= m
|
||||
h &= 0xffffffff
|
||||
h ^= k
|
||||
h &= 0xffffffff
|
||||
|
||||
# Handle the last few bytes of the input array
|
||||
extra_bytes = length % 4
|
||||
if extra_bytes >= 3:
|
||||
h ^= (data[(length & ~3) + 2] & 0xff) << 16
|
||||
h &= 0xffffffff
|
||||
if extra_bytes >= 2:
|
||||
h ^= (data[(length & ~3) + 1] & 0xff) << 8
|
||||
h &= 0xffffffff
|
||||
if extra_bytes >= 1:
|
||||
h ^= (data[length & ~3] & 0xff)
|
||||
h &= 0xffffffff
|
||||
h *= m
|
||||
h &= 0xffffffff
|
||||
|
||||
h ^= (h % 0x100000000) >> 13 # h >>> 13;
|
||||
h &= 0xffffffff
|
||||
h *= m
|
||||
h &= 0xffffffff
|
||||
h ^= (h % 0x100000000) >> 15 # h >>> 15;
|
||||
h &= 0xffffffff
|
||||
|
||||
return h
|
||||
Reference in New Issue
Block a user