File: length.rb

package info (click to toggle)
jruby 9.4.8.0+ds-3
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 89,244 kB
  • sloc: ruby: 548,574; java: 276,189; yacc: 25,873; ansic: 6,178; xml: 6,111; sh: 1,855; sed: 94; makefile: 78; jsp: 48; tcl: 40; exp: 12
file content (55 lines) | stat: -rw-r--r-- 1,772 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
# encoding: utf-8

# Shared examples for a String method that reports how many characters the
# receiver holds. The method under test is dispatched through @method, which
# is not assigned in this block and must be supplied by the including spec.
describe :string_length, shared: true do
  it "returns the length of self" do
    # Each pair is [receiver, expected character count]; "\x00" checks that a
    # NUL byte is counted like any other character.
    [
      ["", 0],
      ["\x00", 1],
      ["one", 3],
      ["two", 3],
      ["three", 5],
      ["four", 4]
    ].each do |subject, expected|
      subject.send(@method).should == expected
    end
  end

  it "returns the length of a string in different encodings" do
    # Four characters repeated 100 times: the count must stay at 400 no matter
    # which encoding the text is transcoded to.
    repeated = 'こにちわ' * 100
    repeated.send(@method).should == 400

    [Encoding::UTF_32BE, Encoding::SHIFT_JIS].each do |target_encoding|
      repeated.encode(target_encoding).send(@method).should == 400
    end
  end

  it "returns the length of the new self after encoding is changed" do
    text = +'こにちわ'
    # Result intentionally discarded: the method is invoked once while the
    # string is still tagged with its original encoding
    # (presumably to expose a stale, previously computed length -- confirm).
    text.send(@method)

    # Reinterpreted as raw bytes, the four 3-byte characters count as 12.
    retagged = text.force_encoding('BINARY')
    retagged.send(@method).should == 12
  end

  it "returns the correct length after force_encoding(BINARY)" do
    multibyte = "あ"
    single_byte = "a"
    joined = multibyte + single_byte

    # Sanity checks on the fixture before exercising the method under test.
    joined.encoding.should == Encoding::UTF_8
    joined.bytesize.should == 4

    joined.send(@method).should == 2

    # Same bytes, now viewed as binary: every byte is its own character.
    joined.force_encoding(Encoding::ASCII_8BIT)
    joined.send(@method).should == 4
  end

  it "adds 1 for every invalid byte in UTF-8" do
    # "\xF4\x90\x80\x80" is four bytes that the expectations below count
    # individually, alone or surrounded by valid characters.
    [
      ["\xF4\x90\x80\x80", 4],
      ["a\xF4\x90\x80\x80b", 6],
      ["é\xF4\x90\x80\x80è", 6]
    ].each do |subject, expected|
      subject.send(@method).should == expected
    end
  end

  it "adds 1 (and not 2) for a incomplete surrogate in UTF-16" do
    # Each pair is [raw bytes, encoding name to tag them with]; the literal is
    # duplicated before force_encoding so the literal itself is never mutated.
    [
      ["\x00\xd8", "UTF-16LE"],
      ["\xd8\x00", "UTF-16BE"]
    ].each do |raw_bytes, encoding_name|
      raw_bytes.dup.force_encoding(encoding_name).send(@method).should == 1
    end
  end

  it "adds 1 for a broken sequence in UTF-32" do
    # Same layout as the UTF-16 example: [raw bytes, encoding name].
    [
      ["\x04\x03\x02\x01", "UTF-32LE"],
      ["\x01\x02\x03\x04", "UTF-32BE"]
    ].each do |raw_bytes, encoding_name|
      raw_bytes.dup.force_encoding(encoding_name).send(@method).should == 1
    end
  end
end