1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165
|
# -*- coding: utf-8 -*-
from __future__ import unicode_literals
import pytest
from kafka.record import MemoryRecords, MemoryRecordsBuilder
from kafka.errors import CorruptRecordException
# Real record batches captured from a live broker (the original note says
# "Kafka 11" -- presumably 0.11; TODO confirm).
#
# Every batch is its own list element.  Inside one element the adjacent byte
# literals are glued together by Python's implicit literal concatenation, so
# the trailing comma after each batch is what separates it from the next one.
record_batch_data_v2 = [
    # First batch: one record, value == "123"
    b'\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00;\x00\x00\x00\x01\x02\x03'
    b'\x18\xa2p\x00\x00\x00\x00\x00\x00\x00\x00\x01]\xff{\x06<\x00\x00\x01]'
    b'\xff{\x06<\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\x00'
    b'\x00\x00\x00\x01\x12\x00\x00\x00\x01\x06123\x00',
    # Second batch: two records, value == "" and value == ""
    b'\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00@\x00\x00\x00\x02\x02\xc8'
    b'\\\xbd#\x00\x00\x00\x00\x00\x01\x00\x00\x01]\xff|\xddl\x00\x00\x01]\xff'
    b'|\xde\x14\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\x00'
    b'\x00\x00\x02\x0c\x00\x00\x00\x01\x00\x00\x0e\x00\xd0\x02\x02\x01\x00'
    b'\x00',
    # Third batch: one record, value == "123"
    b'\x00\x00\x00\x00\x00\x00\x00\x03\x00\x00\x00;\x00\x00\x00\x02\x02.\x0b'
    b'\x85\xb7\x00\x00\x00\x00\x00\x00\x00\x00\x01]\xff|\xe7\x9d\x00\x00\x01]'
    b'\xff|\xe7\x9d\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff'
    b'\x00\x00\x00\x01\x12\x00\x00\x00\x01\x06123\x00',
    # Fourth batch: one record, value == "hdr" with header hkey=hval
    b'\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00E\x00\x00\x00\x00\x02\\'
    b'\xd8\xefR\x00\x00\x00\x00\x00\x00\x00\x00\x01e\x85\xb6\xf3\xc1\x00\x00'
    b'\x01e\x85\xb6\xf3\xc1\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff\xff'
    b'\xff\xff\x00\x00\x00\x01&\x00\x00\x00\x01\x06hdr\x02\x08hkey\x08hval',
]
# Serialized messages consumed by test_memory_records_v1, which joins all
# elements into a single buffer.  One list element per message; the adjacent
# byte literals inside an element are concatenated by Python.
# NOTE(review): presumably the v1 message format (magic byte 1), as the name
# suggests -- confirm against the Kafka message format documentation.
record_batch_data_v1 = [
# First message: value == "123"
b'\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x19G\x86(\xc2\x01\x00\x00'
b'\x00\x01^\x18g\xab\xae\xff\xff\xff\xff\x00\x00\x00\x03123',
# Second message: value == ""
b'\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x16\xef\x98\xc9 \x01\x00'
b'\x00\x00\x01^\x18g\xaf\xc0\xff\xff\xff\xff\x00\x00\x00\x00',
# Third message: value == ""
b'\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x16_\xaf\xfb^\x01\x00\x00'
b'\x00\x01^\x18g\xb0r\xff\xff\xff\xff\x00\x00\x00\x00',
# Fourth message: value == "123"
b'\x00\x00\x00\x00\x00\x00\x00\x03\x00\x00\x00\x19\xa8\x12W \x01\x00\x00'
b'\x00\x01^\x18g\xb8\x03\xff\xff\xff\xff\x00\x00\x00\x03123'
]
# Real data captured from a live broker (the original note says "Kafka 10" --
# presumably 0.10; TODO confirm).
# Serialized messages consumed by test_memory_records_v0, which joins all
# elements into a single buffer.  One list element per message; the adjacent
# byte literals inside an element are concatenated by Python.
record_batch_data_v0 = [
# First message: value == "123"
b'\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x11\xfe\xb0\x1d\xbf\x00'
b'\x00\xff\xff\xff\xff\x00\x00\x00\x03123',
# Second message: value == ""
b'\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x0eyWH\xe0\x00\x00\xff'
b'\xff\xff\xff\x00\x00\x00\x00',
# Third message: value == ""
b'\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x0eyWH\xe0\x00\x00\xff'
b'\xff\xff\xff\x00\x00\x00\x00',
# Fourth message: value == "123"
b'\x00\x00\x00\x00\x00\x00\x00\x03\x00\x00\x00\x11\xfe\xb0\x1d\xbf\x00'
b'\x00\xff\xff\xff\xff\x00\x00\x00\x03123'
]
def test_memory_records_v2():
    """Walk the v2 fixture batch by batch and check what each one yields.

    The joined fixture is padded with four zero bytes.  The size assertions
    show that the padding counts towards ``size_in_bytes()`` but not towards
    ``valid_bytes()``.
    """
    padding = b"\x00" * 4
    raw = b"".join(record_batch_data_v2) + padding
    records = MemoryRecords(raw)

    assert records.size_in_bytes() == 303
    assert records.valid_bytes() == 299

    # First batch: a single record with value b"123", no key and no headers.
    assert records.has_next() is True
    first_records = list(records.next_batch())
    assert len(first_records) == 1
    first = first_records[0]
    assert first.value == b"123"
    assert first.key is None
    assert first.timestamp == 1503229838908
    assert first.timestamp_type == 0
    assert first.checksum is None
    assert first.headers == []

    # Second and third batches are only required to be present.
    for _ in range(2):
        assert records.next_batch() is not None

    # Fourth batch: a single record that carries one header.
    last_records = list(records.next_batch())
    assert len(last_records) == 1
    last = last_records[0]
    assert last.value == b"hdr"
    assert last.headers == [('hkey', b'hval')]

    # Once exhausted, next_batch() keeps returning None.
    assert records.has_next() is False
    for _ in range(2):
        assert records.next_batch() is None
def test_memory_records_v1():
    """Walk the v1 fixture message by message and check the first one closely.

    The joined fixture is padded with four zero bytes.  The size assertions
    show that the padding counts towards ``size_in_bytes()`` but not towards
    ``valid_bytes()``.
    """
    padding = b"\x00" * 4
    raw = b"".join(record_batch_data_v1) + padding
    records = MemoryRecords(raw)

    assert records.size_in_bytes() == 146
    assert records.valid_bytes() == 142

    # First message: value b"123", no key, with a timestamp and a checksum.
    assert records.has_next() is True
    first_records = list(records.next_batch())
    assert len(first_records) == 1
    first = first_records[0]
    expected_checksum = 1199974594 & 0xffffffff
    assert first.value == b"123"
    assert first.key is None
    assert first.timestamp == 1503648000942
    assert first.timestamp_type == 0
    assert first.checksum == expected_checksum

    # The remaining three messages are only required to be present.
    for _ in range(3):
        assert records.next_batch() is not None

    # Once exhausted, next_batch() keeps returning None.
    assert records.has_next() is False
    for _ in range(2):
        assert records.next_batch() is None
def test_memory_records_v0():
    """Walk the v0 fixture message by message and check the first one closely.

    Sizes are checked on a copy padded with four zero bytes; iteration is then
    done on a second ``MemoryRecords`` built from the unpadded data.
    """
    raw = b"".join(record_batch_data_v0)

    # Padded copy: the padding counts towards size_in_bytes() only.
    padded = MemoryRecords(raw + b"\x00" * 4)
    assert padded.size_in_bytes() == 114
    assert padded.valid_bytes() == 110

    records = MemoryRecords(raw)

    # First message: value b"123", no key and no timestamp information.
    assert records.has_next() is True
    first_records = list(records.next_batch())
    assert len(first_records) == 1
    first = first_records[0]
    # The masked literal is the unsigned 32-bit form of the negative value.
    expected_checksum = -22012481 & 0xffffffff
    assert first.value == b"123"
    assert first.key is None
    assert first.timestamp is None
    assert first.timestamp_type is None
    assert first.checksum == expected_checksum

    # The remaining three messages are only required to be present.
    for _ in range(3):
        assert records.next_batch() is not None

    # Once exhausted, next_batch() keeps returning None.
    assert records.has_next() is False
    for _ in range(2):
        assert records.next_batch() is None
@pytest.mark.parametrize("compression_type", [0, 1, 2, 3])
@pytest.mark.parametrize("magic", [0, 1, 2])
def test_memory_records_builder_full(magic, compression_type):
    """Check that a full builder refuses further appends.

    Runs for every combination of the parametrized ``magic`` and
    ``compression_type`` values.
    """
    batch_size = 1024 * 10
    builder = MemoryRecordsBuilder(
        magic=magic,
        compression_type=compression_type,
        batch_size=batch_size,
    )

    # The first message should always be appended, even one whose value
    # alone is as large as the configured batch size.
    accepted = builder.append(
        key=None, timestamp=None, value=b"M" * batch_size)
    assert accepted is not None
    assert builder.is_full()

    # A further append returns None and does not advance the offset.
    rejected = builder.append(key=None, timestamp=None, value=b"M")
    assert rejected is None
    assert builder.next_offset() == 1
|