mirror of
https://github.com/ruby/ruby.git
synced 2022-11-09 12:17:21 -05:00
string.c: respect the actual encoding
* string.c (rb_enc_str_coderange): respect the actual encoding of if a BOM presents, and scan for the actual code range. [ruby-core:91662] [Bug #15635] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@67167 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
This commit is contained in:
parent
4045cb8222
commit
593505ac6f
2 changed files with 10 additions and 2 deletions
5
string.c
5
string.c
|
@ -655,12 +655,13 @@ rb_enc_str_coderange(VALUE str)
|
|||
if (cr == ENC_CODERANGE_UNKNOWN) {
|
||||
int encidx = ENCODING_GET(str);
|
||||
rb_encoding *enc = rb_enc_from_index(encidx);
|
||||
if (rb_enc_mbminlen(enc) > 1 && rb_enc_dummy_p(enc)) {
|
||||
if (rb_enc_mbminlen(enc) > 1 && rb_enc_dummy_p(enc) &&
|
||||
rb_enc_mbminlen(enc = get_actual_encoding(encidx, str)) == 1) {
|
||||
cr = ENC_CODERANGE_BROKEN;
|
||||
}
|
||||
else {
|
||||
cr = coderange_scan(RSTRING_PTR(str), RSTRING_LEN(str),
|
||||
get_actual_encoding(encidx, str));
|
||||
enc);
|
||||
}
|
||||
ENC_CODERANGE_SET(str, cr);
|
||||
}
|
||||
|
|
|
@ -269,6 +269,13 @@ class TestM17N < Test::Unit::TestCase
|
|||
assert_empty(encs, bug10598)
|
||||
end
|
||||
|
||||
def test_utf_without_bom_valid
|
||||
encs = [Encoding::UTF_16, Encoding::UTF_32].find_all {|enc|
|
||||
!(+"abcd").encode!(enc).force_encoding(enc).valid_encoding?
|
||||
}
|
||||
assert_empty(encs)
|
||||
end
|
||||
|
||||
def test_object_utf16_32_inspect
|
||||
EnvUtil.suppress_warning do
|
||||
begin
|
||||
|
|
Loading…
Reference in a new issue