File: codepoints.rb

package info (click to toggle)
jruby 1.7.26-1%2Bdeb9u1
  • links: PTS, VCS
  • area: main
  • in suites: stretch
  • size: 84,572 kB
  • sloc: ruby: 669,910; java: 253,056; xml: 35,152; ansic: 9,187; yacc: 7,267; cpp: 5,244; sh: 1,036; makefile: 345; jsp: 48; tcl: 40
file content (56 lines) | stat: -rw-r--r-- 1,780 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56

describe :string_codepoints, :shared => true do
  it "raises an ArgumentError when self has an invalid encoding and a method is called on the returned Enumerator" do
    s = "\xDF".force_encoding(Encoding::UTF_8)
    s.valid_encoding?.should be_false
    lambda { s.send(@method).to_a }.should raise_error(ArgumentError)
  end

  it "yields each codepoint to the block if one is given" do
    codepoints = []
    "abcd".send(@method) do |codepoint|
      codepoints << codepoint
    end
    codepoints.should == [97, 98, 99, 100]
  end

  it "raises an ArgumentError if self's encoding is invalid and a block is given" do
    s = "\xDF".force_encoding(Encoding::UTF_8)
    s.valid_encoding?.should be_false
    lambda { s.send(@method) { } }.should raise_error(ArgumentError)
  end

  it "returns codepoints as Fixnums" do
    "glark\u{20}".send(@method).to_a.each do |codepoint|
      codepoint.should be_an_instance_of(Fixnum)
    end
  end

  it "returns one codepoint for each character" do
    s = "\u{9876}\u{28}\u{1987}"
    s.send(@method).to_a.size.should == s.chars.to_a.size
  end

  it "works for multibyte characters" do
    s = "\u{9819}"
    s.bytesize.should == 3
    s.send(@method).to_a.should == [38937]
  end

  it "returns the codepoint corresponding to the character's position in the String's encoding" do
    "\u{787}".send(@method).to_a.should == [1927]
  end

  it "round-trips to the original String using Integer#chr" do
    s = "\u{13}\u{7711}\u{1010}"
    s2 = ""
    s.send(@method) {|n| s2 << n.chr(Encoding::UTF_8)}
    s.should == s2
  end

  it "is synonomous with #bytes for Strings which are single-byte optimisable" do
    s = "(){}".encode('ascii')
    s.ascii_only?.should be_true
    s.send(@method).to_a.should == s.bytes.to_a
  end
end