mirror of
https://github.com/ruby/ruby.git
synced 2022-11-09 12:17:21 -05:00
55 lines
1.6 KiB
Ruby
55 lines
1.6 KiB
Ruby
# encoding: utf-8
|
|
|
|
# Shared examples for String methods that report the number of characters in
# the receiver. Every length assertion dispatches through `send(@method)` so
# the examples exercise whichever method name @method holds, rather than
# always testing one hard-coded method.
# NOTE(review): @method is expected to be supplied by the spec that includes
# these shared examples; it is not assigned anywhere in this file.
describe :string_length, shared: true do
  it "returns the length of self" do
    "".send(@method).should == 0
    "\x00".send(@method).should == 1
    "one".send(@method).should == 3
    "two".send(@method).should == 3
    "three".send(@method).should == 5
    "four".send(@method).should == 4
  end

  it "returns the length of a string in different encodings" do
    # Four characters repeated 100 times: the character count must stay at 400
    # regardless of how many bytes each target encoding uses per character.
    utf8_str = 'こにちわ' * 100
    utf8_str.send(@method).should == 400
    utf8_str.encode(Encoding::UTF_32BE).send(@method).should == 400
    utf8_str.encode(Encoding::SHIFT_JIS).send(@method).should == 400
  end

  it "returns the length of the new self after encoding is changed" do
    str = 'こにちわ'
    # The result of this first call is deliberately not asserted. It measures
    # the string once before the encoding is re-tagged, presumably so that a
    # stale cached result would be caught by the assertion below (confirm).
    str.send(@method)

    str.force_encoding('BINARY').send(@method).should == 12
  end

  it "returns the correct length after force_encoding(BINARY)" do
    utf8 = "あ"
    ascii = "a"
    concat = utf8 + ascii

    # Preconditions: the concatenation is still UTF-8 and occupies 4 bytes.
    concat.encoding.should == Encoding::UTF_8
    concat.bytesize.should == 4

    # Two characters as UTF-8; four once the same bytes are tagged as binary.
    concat.send(@method).should == 2
    concat.force_encoding(Encoding::ASCII_8BIT)
    concat.send(@method).should == 4
  end

  it "adds 1 for every invalid byte in UTF-8" do
    "\xF4\x90\x80\x80".send(@method).should == 4
    "a\xF4\x90\x80\x80b".send(@method).should == 6
    "é\xF4\x90\x80\x80è".send(@method).should == 6
  end

  it "adds 1 (and not 2) for a incomplete surrogate in UTF-16" do
    "\x00\xd8".force_encoding("UTF-16LE").send(@method).should == 1
    "\xd8\x00".force_encoding("UTF-16BE").send(@method).should == 1
  end

  it "adds 1 for a broken sequence in UTF-32" do
    "\x04\x03\x02\x01".force_encoding("UTF-32LE").send(@method).should == 1
    "\x01\x02\x03\x04".force_encoding("UTF-32BE").send(@method).should == 1
  end
end
|