mirror of
https://github.com/ruby/ruby.git
synced 2022-11-09 12:17:21 -05:00
7a77e12488
git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@40049 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
258 lines
6.3 KiB
Ruby
258 lines
6.3 KiB
Ruby
# -*- coding: utf-8 -*-
|
|
|
|
require_relative 'helper'
|
|
|
|
module Psych
|
|
class TestEncoding < TestCase
|
|
class EncodingCatcher < Handler
|
|
attr_reader :strings
|
|
def initialize
|
|
@strings = []
|
|
end
|
|
|
|
(Handler.instance_methods(true) -
|
|
Object.instance_methods).each do |m|
|
|
class_eval %{
|
|
def #{m} *args
|
|
@strings += args.flatten.find_all { |a|
|
|
String === a
|
|
}
|
|
end
|
|
}
|
|
end
|
|
end
|
|
|
|
def setup
|
|
super
|
|
@buffer = StringIO.new
|
|
@handler = EncodingCatcher.new
|
|
@parser = Psych::Parser.new @handler
|
|
@utf8 = Encoding.find('UTF-8')
|
|
@emitter = Psych::Emitter.new @buffer
|
|
end
|
|
|
|
def test_transcode_shiftjis
|
|
str = "こんにちは!"
|
|
loaded = Psych.load("--- こんにちは!".encode('SHIFT_JIS'))
|
|
assert_equal str, loaded
|
|
end
|
|
|
|
def test_transcode_utf16le
|
|
str = "こんにちは!"
|
|
loaded = Psych.load("--- こんにちは!".encode('UTF-16LE'))
|
|
assert_equal str, loaded
|
|
end
|
|
|
|
def test_transcode_utf16be
|
|
str = "こんにちは!"
|
|
loaded = Psych.load("--- こんにちは!".encode('UTF-16BE'))
|
|
assert_equal str, loaded
|
|
end
|
|
|
|
def test_io_shiftjis
|
|
t = Tempfile.new(['shiftjis', 'yml'], :encoding => 'SHIFT_JIS')
|
|
t.write '--- こんにちは!'
|
|
t.close
|
|
|
|
# If the external encoding isn't utf8, utf16le, or utf16be, we cannot
|
|
# process the file.
|
|
File.open(t.path, 'r', :encoding => 'SHIFT_JIS') do |f|
|
|
assert_raises Psych::SyntaxError do
|
|
Psych.load(f)
|
|
end
|
|
end
|
|
|
|
t.close(true)
|
|
end
|
|
|
|
def test_io_utf16le
|
|
t = Tempfile.new(['utf16le', 'yml'])
|
|
t.binmode
|
|
t.write '--- こんにちは!'.encode('UTF-16LE')
|
|
t.close
|
|
|
|
File.open(t.path, 'rb', :encoding => 'UTF-16LE') do |f|
|
|
assert_equal "こんにちは!", Psych.load(f)
|
|
end
|
|
|
|
t.close(true)
|
|
end
|
|
|
|
def test_io_utf16be
|
|
t = Tempfile.new(['utf16be', 'yml'])
|
|
t.binmode
|
|
t.write '--- こんにちは!'.encode('UTF-16BE')
|
|
t.close
|
|
|
|
File.open(t.path, 'rb', :encoding => 'UTF-16BE') do |f|
|
|
assert_equal "こんにちは!", Psych.load(f)
|
|
end
|
|
|
|
t.close(true)
|
|
end
|
|
|
|
def test_io_utf8
|
|
t = Tempfile.new(['utf8', 'yml'])
|
|
t.binmode
|
|
t.write '--- こんにちは!'.encode('UTF-8')
|
|
t.close
|
|
|
|
File.open(t.path, 'rb', :encoding => 'UTF-8') do |f|
|
|
assert_equal "こんにちは!", Psych.load(f)
|
|
end
|
|
|
|
t.close(true)
|
|
end
|
|
|
|
def test_emit_alias
|
|
@emitter.start_stream Psych::Parser::UTF8
|
|
@emitter.start_document [], [], true
|
|
e = assert_raises(RuntimeError) do
|
|
@emitter.alias 'ドラえもん'.encode('EUC-JP')
|
|
end
|
|
assert_match(/alias value/, e.message)
|
|
end
|
|
|
|
def test_to_yaml_is_valid
|
|
EnvUtil.with_default_external(Encoding::US_ASCII) do
|
|
EnvUtil.with_default_internal(nil) do
|
|
s = "こんにちは!"
|
|
# If no encoding is specified, use UTF-8
|
|
assert_equal Encoding::UTF_8, Psych.dump(s).encoding
|
|
assert_equal s, Psych.load(Psych.dump(s))
|
|
end
|
|
end
|
|
end
|
|
|
|
def test_start_mapping
|
|
foo = 'foo'
|
|
bar = 'バー'
|
|
|
|
@emitter.start_stream Psych::Parser::UTF8
|
|
@emitter.start_document [], [], true
|
|
@emitter.start_mapping(
|
|
foo.encode('Shift_JIS'),
|
|
bar.encode('UTF-16LE'),
|
|
false, Nodes::Sequence::ANY)
|
|
@emitter.end_mapping
|
|
@emitter.end_document false
|
|
@emitter.end_stream
|
|
|
|
@parser.parse @buffer.string
|
|
assert_encodings @utf8, @handler.strings
|
|
assert_equal [foo, bar], @handler.strings
|
|
end
|
|
|
|
def test_start_sequence
|
|
foo = 'foo'
|
|
bar = 'バー'
|
|
|
|
@emitter.start_stream Psych::Parser::UTF8
|
|
@emitter.start_document [], [], true
|
|
@emitter.start_sequence(
|
|
foo.encode('Shift_JIS'),
|
|
bar.encode('UTF-16LE'),
|
|
false, Nodes::Sequence::ANY)
|
|
@emitter.end_sequence
|
|
@emitter.end_document false
|
|
@emitter.end_stream
|
|
|
|
@parser.parse @buffer.string
|
|
assert_encodings @utf8, @handler.strings
|
|
assert_equal [foo, bar], @handler.strings
|
|
end
|
|
|
|
def test_doc_tag_encoding
|
|
key = '鍵'
|
|
@emitter.start_stream Psych::Parser::UTF8
|
|
@emitter.start_document(
|
|
[1, 1],
|
|
[['!'.encode('EUC-JP'), key.encode('EUC-JP')]],
|
|
true
|
|
)
|
|
@emitter.scalar 'foo', nil, nil, true, false, Nodes::Scalar::ANY
|
|
@emitter.end_document false
|
|
@emitter.end_stream
|
|
|
|
@parser.parse @buffer.string
|
|
assert_encodings @utf8, @handler.strings
|
|
assert_equal key, @handler.strings[1]
|
|
end
|
|
|
|
def test_emitter_encoding
|
|
str = "壁に耳あり、障子に目あり"
|
|
thing = Psych.load Psych.dump str.encode('EUC-JP')
|
|
assert_equal str, thing
|
|
end
|
|
|
|
def test_default_internal
|
|
EnvUtil.with_default_internal(Encoding::EUC_JP) do
|
|
str = "壁に耳あり、障子に目あり"
|
|
assert_equal @utf8, str.encoding
|
|
|
|
@parser.parse str
|
|
assert_encodings Encoding::EUC_JP, @handler.strings
|
|
assert_equal str, @handler.strings.first.encode('UTF-8')
|
|
end
|
|
end
|
|
|
|
def test_scalar
|
|
@parser.parse("--- a")
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_alias
|
|
@parser.parse(<<-eoyml)
|
|
%YAML 1.1
|
|
---
|
|
!!seq [
|
|
!!str "Without properties",
|
|
&A !!str "Anchored",
|
|
!!str "Tagged",
|
|
*A,
|
|
!!str "",
|
|
]
|
|
eoyml
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_list_anchor
|
|
list = %w{ a b }
|
|
list << list
|
|
@parser.parse(Psych.dump(list))
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_map_anchor
|
|
h = {}
|
|
h['a'] = h
|
|
@parser.parse(Psych.dump(h))
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_map_tag
|
|
@parser.parse(<<-eoyml)
|
|
%YAML 1.1
|
|
---
|
|
!!map { a : b }
|
|
eoyml
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_doc_tag
|
|
@parser.parse(<<-eoyml)
|
|
%YAML 1.1
|
|
%TAG ! tag:tenderlovemaking.com,2009:
|
|
--- !fun
|
|
eoyml
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
private
|
|
def assert_encodings encoding, strings
|
|
strings.each do |str|
|
|
assert_equal encoding, str.encoding, str
|
|
end
|
|
end
|
|
end
|
|
end
|