1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687
|
# encoding: ascii-8bit
require 'stringio'
require 'tempfile'
require 'zlib'
require 'spec/spec_helper'
describe MessagePack::Unpacker do
let :unpacker do
MessagePack::Unpacker.new
end
let :packer do
MessagePack::Packer.new
end
it 'gets options to specify how to unpack values' do
u1 = MessagePack::Unpacker.new
u1.symbolize_keys?.should == false
u1.allow_unknown_ext?.should == false
u2 = MessagePack::Unpacker.new(symbolize_keys: true, allow_unknown_ext: true)
u2.symbolize_keys?.should == true
u2.allow_unknown_ext?.should == true
end
it 'gets IO or object which has #read to read data from it' do
sample_data = {"message" => "morning!", "num" => 1}
sample_packed = MessagePack.pack(sample_data).force_encoding('ASCII-8BIT')
Tempfile.open("for_io") do |file|
file.sync = true
file.write sample_packed
file.rewind
u1 = MessagePack::Unpacker.new(file)
u1.each do |obj|
expect(obj).to eql(sample_data)
end
file.unlink
end
sio = StringIO.new(sample_packed)
u2 = MessagePack::Unpacker.new(sio)
u2.each do |obj|
expect(obj).to eql(sample_data)
end
dio = StringIO.new
Zlib::GzipWriter.wrap(dio){|gz| gz.write sample_packed }
reader = Zlib::GzipReader.new(StringIO.new(dio.string))
u3 = MessagePack::Unpacker.new(reader)
u3.each do |obj|
expect(obj).to eql(sample_data)
end
class DummyIO
def initialize
@buf = "".force_encoding('ASCII-8BIT')
@pos = 0
end
def write(val)
@buf << val.to_s
end
def read(length=nil,outbuf="")
if @pos == @buf.size
nil
elsif length.nil?
val = @buf[@pos..(@buf.size)]
@pos = @buf.size
outbuf << val
outbuf
else
val = @buf[@pos..(@pos + length)]
@pos += val.size
@pos = @buf.size if @pos > @buf.size
outbuf << val
outbuf
end
end
def flush
# nop
end
end
dio = DummyIO.new
dio.write sample_packed
u4 = MessagePack::Unpacker.new(dio)
u4.each do |obj|
expect(obj).to eql(sample_data)
end
end
it 'read_array_header succeeds' do
unpacker.feed("\x91")
unpacker.read_array_header.should == 1
end
it 'read_array_header fails' do
unpacker.feed("\x81")
lambda {
unpacker.read_array_header
}.should raise_error(MessagePack::TypeError) # TypeError is included in UnexpectedTypeError
lambda {
unpacker.read_array_header
}.should raise_error(MessagePack::UnexpectedTypeError)
end
it 'read_map_header converts an map to key-value sequence' do
packer.write_array_header(2)
packer.write("e")
packer.write(1)
unpacker = MessagePack::Unpacker.new
unpacker.feed(packer.to_s)
unpacker.read_array_header.should == 2
unpacker.read.should == "e"
unpacker.read.should == 1
end
it 'read_map_header succeeds' do
unpacker.feed("\x81")
unpacker.read_map_header.should == 1
end
it 'read_map_header converts an map to key-value sequence' do
packer.write_map_header(1)
packer.write("k")
packer.write("v")
unpacker = MessagePack::Unpacker.new
unpacker.feed(packer.to_s)
unpacker.read_map_header.should == 1
unpacker.read.should == "k"
unpacker.read.should == "v"
end
it 'read_map_header fails' do
unpacker.feed("\x91")
lambda {
unpacker.read_map_header
}.should raise_error(MessagePack::TypeError) # TypeError is included in UnexpectedTypeError
lambda {
unpacker.read_map_header
}.should raise_error(MessagePack::UnexpectedTypeError)
end
it 'read raises EOFError before feeding' do
lambda {
unpacker.read
}.should raise_error(EOFError)
end
let :sample_object do
[1024, {["a","b"]=>["c","d"]}, ["e","f"], "d", 70000, 4.12, 1.5, 1.5, 1.5]
end
it 'feed and each continue internal state' do
raw = sample_object.to_msgpack.to_s * 4
objects = []
raw.split(//).each do |b|
unpacker.feed(b)
unpacker.each {|c|
objects << c
}
end
objects.should == [sample_object] * 4
end
it 'feed_each continues internal state' do
raw = sample_object.to_msgpack.to_s * 4
objects = []
raw.split(//).each do |b|
unpacker.feed_each(b) {|c|
objects << c
}
end
objects.should == [sample_object] * 4
end
it 'feed_each enumerator' do
raw = sample_object.to_msgpack.to_s * 4
enum = unpacker.feed_each(raw)
enum.should be_instance_of(Enumerator)
enum.to_a.should == [sample_object] * 4
end
it 'reset clears internal buffer' do
# 1-element array
unpacker.feed("\x91")
unpacker.reset
unpacker.feed("\x01")
unpacker.each.map {|x| x }.should == [1]
end
it 'reset clears internal state' do
# 1-element array
unpacker.feed("\x91")
unpacker.each.map {|x| x }.should == []
unpacker.reset
unpacker.feed("\x01")
unpacker.each.map {|x| x }.should == [1]
end
it 'frozen short strings' do
raw = sample_object.to_msgpack.to_s.force_encoding('UTF-8')
lambda {
unpacker.feed_each(raw.freeze) { }
}.should_not raise_error
end
it 'frozen long strings' do
raw = (sample_object.to_msgpack.to_s * 10240).force_encoding('UTF-8')
lambda {
unpacker.feed_each(raw.freeze) { }
}.should_not raise_error
end
it 'read raises invalid byte error' do
unpacker.feed("\xc1")
lambda {
unpacker.read
}.should raise_error(MessagePack::MalformedFormatError)
end
it "gc mark" do
raw = sample_object.to_msgpack.to_s * 4
n = 0
raw.split(//).each do |b|
GC.start
unpacker.feed_each(b) {|o|
GC.start
o.should == sample_object
n += 1
}
GC.start
end
n.should == 4
end
it "buffer" do
orig = "a"*32*1024*4
raw = orig.to_msgpack.to_s
n = 655
times = raw.size / n
times += 1 unless raw.size % n == 0
off = 0
parsed = false
times.times do
parsed.should == false
seg = raw[off, n]
off += seg.length
unpacker.feed_each(seg) {|obj|
parsed.should == false
obj.should == orig
parsed = true
}
end
parsed.should == true
end
it 'MessagePack.unpack symbolize_keys' do
symbolized_hash = {:a => 'b', :c => 'd'}
MessagePack.load(MessagePack.pack(symbolized_hash), :symbolize_keys => true).should == symbolized_hash
MessagePack.unpack(MessagePack.pack(symbolized_hash), :symbolize_keys => true).should == symbolized_hash
end
it 'Unpacker#unpack symbolize_keys' do
unpacker = MessagePack::Unpacker.new(:symbolize_keys => true)
symbolized_hash = {:a => 'b', :c => 'd'}
unpacker.feed(MessagePack.pack(symbolized_hash)).read.should == symbolized_hash
end
it "msgpack str 8 type" do
MessagePack.unpack([0xd9, 0x00].pack('C*')).should == ""
MessagePack.unpack([0xd9, 0x00].pack('C*')).encoding.should == Encoding::UTF_8
MessagePack.unpack([0xd9, 0x01].pack('C*') + 'a').should == "a"
MessagePack.unpack([0xd9, 0x02].pack('C*') + 'aa').should == "aa"
end
it "msgpack str 16 type" do
MessagePack.unpack([0xda, 0x00, 0x00].pack('C*')).should == ""
MessagePack.unpack([0xda, 0x00, 0x00].pack('C*')).encoding.should == Encoding::UTF_8
MessagePack.unpack([0xda, 0x00, 0x01].pack('C*') + 'a').should == "a"
MessagePack.unpack([0xda, 0x00, 0x02].pack('C*') + 'aa').should == "aa"
end
it "msgpack str 32 type" do
MessagePack.unpack([0xdb, 0x00, 0x00, 0x00, 0x00].pack('C*')).should == ""
MessagePack.unpack([0xdb, 0x00, 0x00, 0x00, 0x00].pack('C*')).encoding.should == Encoding::UTF_8
MessagePack.unpack([0xdb, 0x00, 0x00, 0x00, 0x01].pack('C*') + 'a').should == "a"
MessagePack.unpack([0xdb, 0x00, 0x00, 0x00, 0x02].pack('C*') + 'aa').should == "aa"
end
it "msgpack bin 8 type" do
MessagePack.unpack([0xc4, 0x00].pack('C*')).should == ""
MessagePack.unpack([0xc4, 0x00].pack('C*')).encoding.should == Encoding::ASCII_8BIT
MessagePack.unpack([0xc4, 0x01].pack('C*') + 'a').should == "a"
MessagePack.unpack([0xc4, 0x02].pack('C*') + 'aa').should == "aa"
end
it "msgpack bin 16 type" do
MessagePack.unpack([0xc5, 0x00, 0x00].pack('C*')).should == ""
MessagePack.unpack([0xc5, 0x00, 0x00].pack('C*')).encoding.should == Encoding::ASCII_8BIT
MessagePack.unpack([0xc5, 0x00, 0x01].pack('C*') + 'a').should == "a"
MessagePack.unpack([0xc5, 0x00, 0x02].pack('C*') + 'aa').should == "aa"
end
it "msgpack bin 32 type" do
MessagePack.unpack([0xc6, 0x00, 0x00, 0x00, 0x00].pack('C*')).should == ""
MessagePack.unpack([0xc6, 0x0, 0x00, 0x00, 0x000].pack('C*')).encoding.should == Encoding::ASCII_8BIT
MessagePack.unpack([0xc6, 0x00, 0x00, 0x00, 0x01].pack('C*') + 'a').should == "a"
MessagePack.unpack([0xc6, 0x00, 0x00, 0x00, 0x02].pack('C*') + 'aa').should == "aa"
end
describe "ext formats" do
let(:unpacker) { MessagePack::Unpacker.new(allow_unknown_ext: true) }
[1, 2, 4, 8, 16].zip([0xd4, 0xd5, 0xd6, 0xd7, 0xd8]).each do |n,b|
it "msgpack fixext #{n} format" do
unpacker.feed([b, 1].pack('CC') + "a"*n).unpack.should == MessagePack::ExtensionValue.new(1, "a"*n)
unpacker.feed([b, -1].pack('CC') + "a"*n).unpack.should == MessagePack::ExtensionValue.new(-1, "a"*n)
end
end
it "msgpack ext 8 format" do
unpacker.feed([0xc7, 0, 1].pack('CCC')).unpack.should == MessagePack::ExtensionValue.new(1, "")
unpacker.feed([0xc7, 255, -1].pack('CCC') + "a"*255).unpack.should == MessagePack::ExtensionValue.new(-1, "a"*255)
end
it "msgpack ext 16 format" do
unpacker.feed([0xc8, 0, 1].pack('CnC')).unpack.should == MessagePack::ExtensionValue.new(1, "")
unpacker.feed([0xc8, 256, -1].pack('CnC') + "a"*256).unpack.should == MessagePack::ExtensionValue.new(-1, "a"*256)
end
it "msgpack ext 32 format" do
unpacker.feed([0xc9, 0, 1].pack('CNC')).unpack.should == MessagePack::ExtensionValue.new(1, "")
unpacker.feed([0xc9, 256, -1].pack('CNC') + "a"*256).unpack.should == MessagePack::ExtensionValue.new(-1, "a"*256)
unpacker.feed([0xc9, 65536, -1].pack('CNC') + "a"*65536).unpack.should == MessagePack::ExtensionValue.new(-1, "a"*65536)
end
end
class ValueOne
attr_reader :num
def initialize(num)
@num = num
end
def ==(obj)
self.num == obj.num
end
def num
@num
end
def to_msgpack_ext
@num.to_msgpack
end
def self.from_msgpack_ext(data)
self.new(MessagePack.unpack(data))
end
end
class ValueTwo
attr_reader :num_s
def initialize(num)
@num_s = num.to_s
end
def ==(obj)
self.num_s == obj.num_s
end
def num
@num_s.to_i
end
def to_msgpack_ext
@num_s.to_msgpack
end
def self.from_msgpack_ext(data)
self.new(MessagePack.unpack(data))
end
end
describe '#type_registered?' do
it 'receive Class or Integer, and return bool' do
expect(subject.type_registered?(0x00)).to be_falsy
expect(subject.type_registered?(0x01)).to be_falsy
expect(subject.type_registered?(::ValueOne)).to be_falsy
end
it 'returns true if specified type or class is already registered' do
subject.register_type(0x30, ::ValueOne, :from_msgpack_ext)
subject.register_type(0x31, ::ValueTwo, :from_msgpack_ext)
expect(subject.type_registered?(0x00)).to be_falsy
expect(subject.type_registered?(0x01)).to be_falsy
expect(subject.type_registered?(0x30)).to be_truthy
expect(subject.type_registered?(0x31)).to be_truthy
expect(subject.type_registered?(::ValueOne)).to be_truthy
expect(subject.type_registered?(::ValueTwo)).to be_truthy
end
it 'cannot detect unpack rule with block, not method' do
subject.register_type(0x40){|data| ValueOne.from_msgpack_ext(data) }
expect(subject.type_registered?(0x40)).to be_truthy
expect(subject.type_registered?(ValueOne)).to be_falsy
end
end
context 'with ext definitions' do
it 'get type and class mapping for packing' do
unpacker = MessagePack::Unpacker.new
unpacker.register_type(0x01){|data| ValueOne.from_msgpack_ext }
unpacker.register_type(0x02){|data| ValueTwo.from_msgpack_ext(data) }
unpacker = MessagePack::Unpacker.new
unpacker.register_type(0x01, ValueOne, :from_msgpack_ext)
unpacker.register_type(0x02, ValueTwo, :from_msgpack_ext)
end
it 'returns a Array of Hash which contains :type, :class and :unpacker' do
unpacker = MessagePack::Unpacker.new
unpacker.register_type(0x02, ValueTwo, :from_msgpack_ext)
unpacker.register_type(0x01, ValueOne, :from_msgpack_ext)
list = unpacker.registered_types
expect(list).to be_a(Array)
expect(list.size).to eq(2)
one = list[0]
expect(one.keys.sort).to eq([:type, :class, :unpacker].sort)
expect(one[:type]).to eq(0x01)
expect(one[:class]).to eq(ValueOne)
expect(one[:unpacker]).to eq(:from_msgpack_ext)
two = list[1]
expect(two.keys.sort).to eq([:type, :class, :unpacker].sort)
expect(two[:type]).to eq(0x02)
expect(two[:class]).to eq(ValueTwo)
expect(two[:unpacker]).to eq(:from_msgpack_ext)
end
it 'returns a Array of Hash, which contains nil for class if block unpacker specified' do
unpacker = MessagePack::Unpacker.new
unpacker.register_type(0x01){|data| ValueOne.from_msgpack_ext }
unpacker.register_type(0x02, &ValueTwo.method(:from_msgpack_ext))
list = unpacker.registered_types
expect(list).to be_a(Array)
expect(list.size).to eq(2)
one = list[0]
expect(one.keys.sort).to eq([:type, :class, :unpacker].sort)
expect(one[:type]).to eq(0x01)
expect(one[:class]).to be_nil
expect(one[:unpacker]).to be_instance_of(Proc)
two = list[1]
expect(two.keys.sort).to eq([:type, :class, :unpacker].sort)
expect(two[:type]).to eq(0x02)
expect(two[:class]).to be_nil
expect(two[:unpacker]).to be_instance_of(Proc)
end
end
def flatten(struct, results = [])
case struct
when Array
struct.each { |v| flatten(v, results) }
when Hash
struct.each { |k, v| flatten(v, flatten(k, results)) }
else
results << struct
end
results
end
subject do
described_class.new
end
let :buffer1 do
MessagePack.pack(:foo => 'bar')
end
let :buffer2 do
MessagePack.pack(:hello => {:world => [1, 2, 3]})
end
let :buffer3 do
MessagePack.pack(:x => 'y')
end
describe '#read' do
context 'with a buffer' do
it 'reads objects' do
objects = []
subject.feed(buffer1)
subject.feed(buffer2)
subject.feed(buffer3)
objects << subject.read
objects << subject.read
objects << subject.read
objects.should == [{'foo' => 'bar'}, {'hello' => {'world' => [1, 2, 3]}}, {'x' => 'y'}]
end
it 'reads map header' do
subject.feed({}.to_msgpack)
subject.read_map_header.should == 0
end
it 'reads array header' do
subject.feed([].to_msgpack)
subject.read_array_header.should == 0
end
end
end
describe '#each' do
context 'with a buffer' do
it 'yields each object in the buffer' do
objects = []
subject.feed(buffer1)
subject.feed(buffer2)
subject.feed(buffer3)
subject.each do |obj|
objects << obj
end
objects.should == [{'foo' => 'bar'}, {'hello' => {'world' => [1, 2, 3]}}, {'x' => 'y'}]
end
it 'returns an enumerator when no block is given' do
subject.feed(buffer1)
subject.feed(buffer2)
subject.feed(buffer3)
enum = subject.each
enum.map { |obj| obj.keys.first }.should == %w[foo hello x]
end
end
context 'with a stream passed to the constructor' do
it 'yields each object in the stream' do
objects = []
unpacker = described_class.new(StringIO.new(buffer1 + buffer2 + buffer3))
unpacker.each do |obj|
objects << obj
end
objects.should == [{'foo' => 'bar'}, {'hello' => {'world' => [1, 2, 3]}}, {'x' => 'y'}]
end
end
end
describe '#feed_each' do
it 'feeds the buffer then runs #each' do
objects = []
subject.feed_each(buffer1 + buffer2 + buffer3) do |obj|
objects << obj
end
objects.should == [{'foo' => 'bar'}, {'hello' => {'world' => [1, 2, 3]}}, {'x' => 'y'}]
end
it 'handles chunked data' do
objects = []
buffer = buffer1 + buffer2 + buffer3
buffer.chars.each do |ch|
subject.feed_each(ch) do |obj|
objects << obj
end
end
objects.should == [{'foo' => 'bar'}, {'hello' => {'world' => [1, 2, 3]}}, {'x' => 'y'}]
end
end
context 'regressions' do
it 'handles massive arrays (issue #2)' do
array = ['foo'] * 10_000
MessagePack.unpack(MessagePack.pack(array)).size.should == 10_000
end
end
context 'extensions' do
context 'symbolized keys' do
let :buffer do
MessagePack.pack({'hello' => 'world', 'nested' => ['object', {'structure' => true}]})
end
let :unpacker do
described_class.new(:symbolize_keys => true)
end
it 'can symbolize keys when using #each' do
objs = []
unpacker.feed(buffer)
unpacker.each do |obj|
objs << obj
end
objs.should == [{:hello => 'world', :nested => ['object', {:structure => true}]}]
end
it 'can symbolize keys when using #feed_each' do
objs = []
unpacker.feed_each(buffer) do |obj|
objs << obj
end
objs.should == [{:hello => 'world', :nested => ['object', {:structure => true}]}]
end
end
context 'binary encoding', :encodings do
let :buffer do
MessagePack.pack({'hello' => 'world', 'nested' => ['object', {'structure' => true}]})
end
let :unpacker do
described_class.new()
end
it 'decodes binary as ascii-8bit when using #feed' do
objs = []
unpacker.feed(buffer)
unpacker.each do |obj|
objs << obj
end
strings = flatten(objs).grep(String)
strings.should == %w[hello world nested object structure]
strings.map(&:encoding).uniq.should == [Encoding::ASCII_8BIT]
end
it 'decodes binary as ascii-8bit when using #feed_each' do
objs = []
unpacker.feed_each(buffer) do |obj|
objs << obj
end
strings = flatten(objs).grep(String)
strings.should == %w[hello world nested object structure]
strings.map(&:encoding).uniq.should == [Encoding::ASCII_8BIT]
end
end
context 'string encoding', :encodings do
let :buffer do
MessagePack.pack({'hello'.force_encoding(Encoding::UTF_8) => 'world'.force_encoding(Encoding::UTF_8), 'nested'.force_encoding(Encoding::UTF_8) => ['object'.force_encoding(Encoding::UTF_8), {'structure'.force_encoding(Encoding::UTF_8) => true}]})
end
let :unpacker do
described_class.new()
end
it 'decodes string as utf-8 when using #feed' do
objs = []
unpacker.feed(buffer)
unpacker.each do |obj|
objs << obj
end
strings = flatten(objs).grep(String)
strings.should == %w[hello world nested object structure]
strings.map(&:encoding).uniq.should == [Encoding::UTF_8]
end
it 'decodes binary as ascii-8bit when using #feed_each' do
objs = []
unpacker.feed_each(buffer) do |obj|
objs << obj
end
strings = flatten(objs).grep(String)
strings.should == %w[hello world nested object structure]
strings.map(&:encoding).uniq.should == [Encoding::UTF_8]
end
end
end
end
|