1
0
Fork 0
mirror of https://github.com/ruby/ruby.git synced 2022-11-09 12:17:21 -05:00
ruby--ruby/lib/rexml/encodings/UTF-16.rb
matz f2ad09d5b7 * lib/rexml/source.rb (REXML::Source::encoding): should not
convert the body twice.  [ruby-core:08828]

* lib/rexml/encoding.rb (REXML::Encoding::encoding):
  Encoding#encoding= to return boolean value to tell if the body
  is really converted or not.

* lib/rexml/encoding.rb (REXML::Encoding::encoding): Specific
  conversion library (e.g. rexml/encodings/UTF-16.rb) to have
  higher preceding.

* lib/rexml/encodings/UTF-16.rb (REXML::Encoding::decode_utf16):
  UTF-16#decode_utf16 should work strings without BOM.


git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@10910 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
2006-09-11 02:48:17 +00:00

35 lines
792 B
Ruby

module REXML
module Encoding
def encode_utf16 content
array_utf8 = content.unpack("U*")
array_enc = []
array_utf8.each do |num|
if ((num>>16) > 0)
array_enc << 0
array_enc << ??
else
array_enc << (num >> 8)
array_enc << (num & 0xFF)
end
end
array_enc.pack('C*')
end
def decode_utf16(str)
str = str[2..-1] if /^\376\377/ =~ str
array_enc=str.unpack('C*')
array_utf8 = []
0.step(array_enc.size-1, 2){|i|
array_utf8 << (array_enc.at(i+1) + array_enc.at(i)*0x100)
}
array_utf8.pack('U*')
end
register(UTF_16) do |obj|
class << obj
alias decode decode_utf16
alias encode encode_utf16
end
end
end
end