mirror of
https://github.com/ruby/ruby.git
synced 2022-11-09 12:17:21 -05:00
281 lines
7 KiB
Ruby
281 lines
7 KiB
Ruby
# -*- coding: utf-8 -*-
|
|
# frozen_string_literal: true
|
|
|
|
require_relative 'helper'
|
|
|
|
module Psych
|
|
class TestEncoding < TestCase
|
|
class EncodingCatcher < Handler
|
|
attr_reader :strings
|
|
def initialize
|
|
@strings = []
|
|
end
|
|
|
|
(Handler.instance_methods(true) -
|
|
Object.instance_methods).each do |m|
|
|
class_eval %{
|
|
def #{m} *args
|
|
@strings += args.flatten.find_all { |a|
|
|
String === a
|
|
}
|
|
end
|
|
}
|
|
end
|
|
end
|
|
|
|
def setup
|
|
super
|
|
@buffer = StringIO.new
|
|
@handler = EncodingCatcher.new
|
|
@parser = Psych::Parser.new @handler
|
|
@utf8 = Encoding.find('UTF-8')
|
|
@emitter = Psych::Emitter.new @buffer
|
|
end
|
|
|
|
def test_dump_load_encoding_object
|
|
assert_cycle Encoding::US_ASCII
|
|
assert_cycle Encoding::UTF_8
|
|
end
|
|
|
|
def test_transcode_shiftjis
|
|
str = "こんにちは!"
|
|
loaded = Psych.load("--- こんにちは!".encode('SHIFT_JIS'))
|
|
assert_equal str, loaded
|
|
end
|
|
|
|
def test_transcode_utf16le
|
|
str = "こんにちは!"
|
|
loaded = Psych.load("--- こんにちは!".encode('UTF-16LE'))
|
|
assert_equal str, loaded
|
|
end
|
|
|
|
def test_transcode_utf16be
|
|
str = "こんにちは!"
|
|
loaded = Psych.load("--- こんにちは!".encode('UTF-16BE'))
|
|
assert_equal str, loaded
|
|
end
|
|
|
|
def test_io_shiftjis
|
|
Tempfile.create(['shiftjis', 'yml'], :encoding => 'SHIFT_JIS') {|t|
|
|
t.write '--- こんにちは!'
|
|
t.close
|
|
|
|
# If the external encoding isn't utf8, utf16le, or utf16be, we cannot
|
|
# process the file.
|
|
File.open(t.path, 'r', :encoding => 'SHIFT_JIS') do |f|
|
|
assert_raise Psych::SyntaxError do
|
|
Psych.load(f)
|
|
end
|
|
end
|
|
}
|
|
end
|
|
|
|
def test_io_utf16le
|
|
Tempfile.create(['utf16le', 'yml']) {|t|
|
|
t.binmode
|
|
t.write '--- こんにちは!'.encode('UTF-16LE')
|
|
t.close
|
|
|
|
File.open(t.path, 'rb', :encoding => 'UTF-16LE') do |f|
|
|
assert_equal "こんにちは!", Psych.load(f)
|
|
end
|
|
}
|
|
end
|
|
|
|
def test_io_utf16be
|
|
Tempfile.create(['utf16be', 'yml']) {|t|
|
|
t.binmode
|
|
t.write '--- こんにちは!'.encode('UTF-16BE')
|
|
t.close
|
|
|
|
File.open(t.path, 'rb', :encoding => 'UTF-16BE') do |f|
|
|
assert_equal "こんにちは!", Psych.load(f)
|
|
end
|
|
}
|
|
end
|
|
|
|
def test_io_utf8
|
|
Tempfile.create(['utf8', 'yml']) {|t|
|
|
t.binmode
|
|
t.write '--- こんにちは!'.encode('UTF-8')
|
|
t.close
|
|
|
|
File.open(t.path, 'rb', :encoding => 'UTF-8') do |f|
|
|
assert_equal "こんにちは!", Psych.load(f)
|
|
end
|
|
}
|
|
end
|
|
|
|
def test_io_utf8_read_as_binary
|
|
Tempfile.create(['utf8', 'yml']) {|t|
|
|
t.binmode
|
|
t.write '--- こんにちは!'.encode('UTF-8')
|
|
t.close
|
|
|
|
File.open(t.path, 'rb', :encoding => 'ascii-8bit') do |f|
|
|
assert_equal "こんにちは!", Psych.load(f)
|
|
end
|
|
}
|
|
end
|
|
|
|
def test_emit_alias
|
|
@emitter.start_stream Psych::Parser::UTF8
|
|
@emitter.start_document [], [], true
|
|
e = assert_raise(RuntimeError) do
|
|
@emitter.alias 'ドラえもん'.encode('EUC-JP')
|
|
end
|
|
assert_match(/alias value/, e.message)
|
|
end
|
|
|
|
def test_to_yaml_is_valid
|
|
with_default_external(Encoding::US_ASCII) do
|
|
with_default_internal(nil) do
|
|
s = "こんにちは!"
|
|
# If no encoding is specified, use UTF-8
|
|
assert_equal Encoding::UTF_8, Psych.dump(s).encoding
|
|
assert_equal s, Psych.load(Psych.dump(s))
|
|
end
|
|
end
|
|
end
|
|
|
|
def test_start_mapping
|
|
foo = 'foo'
|
|
bar = 'バー'
|
|
|
|
@emitter.start_stream Psych::Parser::UTF8
|
|
@emitter.start_document [], [], true
|
|
@emitter.start_mapping(
|
|
foo.encode('Shift_JIS'),
|
|
bar.encode('UTF-16LE'),
|
|
false, Nodes::Sequence::ANY)
|
|
@emitter.end_mapping
|
|
@emitter.end_document false
|
|
@emitter.end_stream
|
|
|
|
@parser.parse @buffer.string
|
|
assert_encodings @utf8, @handler.strings
|
|
assert_equal [foo, bar], @handler.strings
|
|
end
|
|
|
|
def test_start_sequence
|
|
foo = 'foo'
|
|
bar = 'バー'
|
|
|
|
@emitter.start_stream Psych::Parser::UTF8
|
|
@emitter.start_document [], [], true
|
|
@emitter.start_sequence(
|
|
foo.encode('Shift_JIS'),
|
|
bar.encode('UTF-16LE'),
|
|
false, Nodes::Sequence::ANY)
|
|
@emitter.end_sequence
|
|
@emitter.end_document false
|
|
@emitter.end_stream
|
|
|
|
@parser.parse @buffer.string
|
|
assert_encodings @utf8, @handler.strings
|
|
assert_equal [foo, bar], @handler.strings
|
|
end
|
|
|
|
def test_doc_tag_encoding
|
|
key = '鍵'
|
|
@emitter.start_stream Psych::Parser::UTF8
|
|
@emitter.start_document(
|
|
[1, 1],
|
|
[['!'.encode('EUC-JP'), key.encode('EUC-JP')]],
|
|
true
|
|
)
|
|
@emitter.scalar 'foo', nil, nil, true, false, Nodes::Scalar::ANY
|
|
@emitter.end_document false
|
|
@emitter.end_stream
|
|
|
|
@parser.parse @buffer.string
|
|
assert_encodings @utf8, @handler.strings
|
|
assert_equal key, @handler.strings[1]
|
|
end
|
|
|
|
def test_emitter_encoding
|
|
str = "壁に耳あり、障子に目あり"
|
|
thing = Psych.load Psych.dump str.encode('EUC-JP')
|
|
assert_equal str, thing
|
|
end
|
|
|
|
def test_default_internal
|
|
with_default_internal(Encoding::EUC_JP) do
|
|
str = "壁に耳あり、障子に目あり"
|
|
assert_equal @utf8, str.encoding
|
|
|
|
@parser.parse str
|
|
assert_encodings Encoding::EUC_JP, @handler.strings
|
|
assert_equal str, @handler.strings.first.encode('UTF-8')
|
|
end
|
|
end
|
|
|
|
def test_scalar
|
|
@parser.parse("--- a")
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_alias
|
|
@parser.parse(<<-eoyml)
|
|
%YAML 1.1
|
|
---
|
|
!!seq [
|
|
!!str "Without properties",
|
|
&A !!str "Anchored",
|
|
!!str "Tagged",
|
|
*A,
|
|
!!str "",
|
|
]
|
|
eoyml
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_list_anchor
|
|
list = %w{ a b }
|
|
list << list
|
|
@parser.parse(Psych.dump(list))
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_map_anchor
|
|
h = {}
|
|
h['a'] = h
|
|
@parser.parse(Psych.dump(h))
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_map_tag
|
|
@parser.parse(<<-eoyml)
|
|
%YAML 1.1
|
|
---
|
|
!!map { a : b }
|
|
eoyml
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_doc_tag
|
|
@parser.parse(<<-eoyml)
|
|
%YAML 1.1
|
|
%TAG ! tag:tenderlovemaking.com,2009:
|
|
--- !fun
|
|
eoyml
|
|
assert_encodings @utf8, @handler.strings
|
|
end
|
|
|
|
def test_dump_non_ascii_string_to_file
|
|
Tempfile.create(['utf8', 'yml'], :encoding => 'UTF-8') do |t|
|
|
h = {'one' => 'いち'}
|
|
Psych.dump(h, t)
|
|
t.close
|
|
assert_equal h, Psych.load_file(t.path)
|
|
end
|
|
end
|
|
|
|
private
|
|
def assert_encodings encoding, strings
|
|
strings.each do |str|
|
|
assert_equal encoding, str.encoding, str
|
|
end
|
|
end
|
|
end
|
|
end
|