2010-04-14 09:11:11 -04:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
|
2008-09-01 09:41:38 -04:00
|
|
|
require "rexml/document"
|
|
|
|
require "test/unit"
|
|
|
|
|
|
|
|
class REXML::TestDocument < Test::Unit::TestCase
|
2009-11-28 16:40:59 -05:00
|
|
|
def test_version_attributes_to_s
|
|
|
|
doc = REXML::Document.new(<<-eoxml)
|
|
|
|
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
|
|
|
|
<svg id="svg2"
|
|
|
|
xmlns:sodipodi="foo"
|
|
|
|
xmlns:inkscape="bar"
|
|
|
|
sodipodi:version="0.32"
|
|
|
|
inkscape:version="0.44.1"
|
|
|
|
>
|
|
|
|
</svg>
|
|
|
|
eoxml
|
|
|
|
|
|
|
|
string = doc.to_s
|
|
|
|
assert_match('xmlns:sodipodi', string)
|
|
|
|
assert_match('xmlns:inkscape', string)
|
|
|
|
assert_match('sodipodi:version', string)
|
|
|
|
assert_match('inkscape:version', string)
|
|
|
|
end
|
|
|
|
|
2008-09-01 09:41:38 -04:00
|
|
|
def test_new
|
|
|
|
doc = REXML::Document.new(<<EOF)
|
|
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOF
|
|
|
|
assert_equal("Hello world!", doc.root.children.first.value)
|
|
|
|
end
|
|
|
|
|
|
|
|
XML_WITH_NESTED_ENTITY = <<EOF
|
|
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
|
|
<!DOCTYPE member [
|
|
|
|
<!ENTITY a "&b;&b;&b;&b;&b;&b;&b;&b;&b;&b;">
|
|
|
|
<!ENTITY b "&c;&c;&c;&c;&c;&c;&c;&c;&c;&c;">
|
|
|
|
<!ENTITY c "&d;&d;&d;&d;&d;&d;&d;&d;&d;&d;">
|
|
|
|
<!ENTITY d "&e;&e;&e;&e;&e;&e;&e;&e;&e;&e;">
|
|
|
|
<!ENTITY e "&f;&f;&f;&f;&f;&f;&f;&f;&f;&f;">
|
|
|
|
<!ENTITY f "&g;&g;&g;&g;&g;&g;&g;&g;&g;&g;">
|
|
|
|
<!ENTITY g "xxxxxxxxxxxxxxxxxxxxxxxxxxxxxx">
|
|
|
|
]>
|
|
|
|
<member>
|
|
|
|
&a;
|
|
|
|
</member>
|
2008-09-12 21:40:36 -04:00
|
|
|
EOF
|
|
|
|
|
|
|
|
XML_WITH_4_ENTITY_EXPANSION = <<EOF
|
|
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
|
|
<!DOCTYPE member [
|
|
|
|
<!ENTITY a "a">
|
|
|
|
<!ENTITY a2 "&a; &a;">
|
|
|
|
]>
|
|
|
|
<member>
|
|
|
|
&a;
|
|
|
|
&a2;
|
2008-11-06 12:03:40 -05:00
|
|
|
<
|
2008-09-12 21:40:36 -04:00
|
|
|
</member>
|
2008-09-01 09:41:38 -04:00
|
|
|
EOF
|
|
|
|
|
|
|
|
def test_entity_expansion_limit
|
|
|
|
doc = REXML::Document.new(XML_WITH_NESTED_ENTITY)
|
|
|
|
assert_raise(RuntimeError) do
|
|
|
|
doc.root.children.first.value
|
|
|
|
end
|
2013-02-27 07:24:31 -05:00
|
|
|
REXML::Security.entity_expansion_limit = 100
|
|
|
|
assert_equal(100, REXML::Security.entity_expansion_limit)
|
2008-09-01 09:41:38 -04:00
|
|
|
doc = REXML::Document.new(XML_WITH_NESTED_ENTITY)
|
|
|
|
assert_raise(RuntimeError) do
|
|
|
|
doc.root.children.first.value
|
|
|
|
end
|
|
|
|
assert_equal(101, doc.entity_expansion_count)
|
2008-09-12 21:40:36 -04:00
|
|
|
|
2013-02-27 07:24:31 -05:00
|
|
|
REXML::Security.entity_expansion_limit = 4
|
2008-09-12 21:40:36 -04:00
|
|
|
doc = REXML::Document.new(XML_WITH_4_ENTITY_EXPANSION)
|
2008-11-06 12:03:40 -05:00
|
|
|
assert_equal("\na\na a\n<\n", doc.root.children.first.value)
|
2013-02-27 07:24:31 -05:00
|
|
|
REXML::Security.entity_expansion_limit = 3
|
2008-09-12 21:40:36 -04:00
|
|
|
doc = REXML::Document.new(XML_WITH_4_ENTITY_EXPANSION)
|
|
|
|
assert_raise(RuntimeError) do
|
|
|
|
doc.root.children.first.value
|
|
|
|
end
|
|
|
|
ensure
|
2013-02-27 07:24:31 -05:00
|
|
|
REXML::Security.entity_expansion_limit = 10000
|
2008-09-01 09:41:38 -04:00
|
|
|
end
|
2009-12-28 20:36:26 -05:00
|
|
|
|
2010-04-14 09:11:11 -04:00
|
|
|
def test_tag_in_cdata_with_not_ascii_only_but_ascii8bit_encoding_source
|
|
|
|
tag = "<b>...</b>"
|
|
|
|
message = "こんにちは、世界!" # Hello world! in Japanese
|
|
|
|
xml = <<EOX
|
|
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
|
|
<message><![CDATA[#{tag}#{message}]]></message>
|
|
|
|
EOX
|
|
|
|
xml.force_encoding(Encoding::ASCII_8BIT)
|
|
|
|
doc = REXML::Document.new(xml)
|
|
|
|
assert_equal("#{tag}#{message}", doc.root.children.first.value)
|
|
|
|
end
|
|
|
|
|
2009-12-28 20:36:26 -05:00
|
|
|
def test_xml_declaration_standalone
|
|
|
|
bug2539 = '[ruby-core:27345]'
|
|
|
|
doc = REXML::Document.new('<?xml version="1.0" standalone="no" ?>')
|
|
|
|
assert_equal('no', doc.stand_alone?, bug2539)
|
|
|
|
doc = REXML::Document.new('<?xml version="1.0" standalone= "no" ?>')
|
|
|
|
assert_equal('no', doc.stand_alone?, bug2539)
|
|
|
|
doc = REXML::Document.new('<?xml version="1.0" standalone= "no" ?>')
|
|
|
|
assert_equal('no', doc.stand_alone?, bug2539)
|
|
|
|
end
|
2012-10-28 01:59:59 -04:00
|
|
|
|
|
|
|
class WriteTest < Test::Unit::TestCase
|
|
|
|
def setup
|
|
|
|
@document = REXML::Document.new(<<-EOX)
|
|
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
|
|
|
end
|
|
|
|
|
|
|
|
class ArgumentsTest < self
|
|
|
|
def test_output
|
|
|
|
output = ""
|
|
|
|
@document.write(output)
|
|
|
|
assert_equal(<<-EOX, output)
|
|
|
|
<?xml version='1.0' encoding='UTF-8'?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_indent
|
|
|
|
output = ""
|
|
|
|
indent = 2
|
|
|
|
@document.write(output, indent)
|
|
|
|
assert_equal(<<-EOX.chomp, output)
|
|
|
|
<?xml version='1.0' encoding='UTF-8'?>
|
|
|
|
<message>
|
|
|
|
Hello world!
|
|
|
|
</message>
|
|
|
|
EOX
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_transitive
|
|
|
|
output = ""
|
|
|
|
indent = 2
|
|
|
|
transitive = true
|
|
|
|
@document.write(output, indent, transitive)
|
|
|
|
assert_equal(<<-EOX, output)
|
|
|
|
<?xml version='1.0' encoding='UTF-8'?>
|
|
|
|
<message
|
|
|
|
>Hello world!</message
|
|
|
|
>
|
|
|
|
EOX
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_ie_hack
|
|
|
|
output = ""
|
|
|
|
indent = -1
|
|
|
|
transitive = false
|
|
|
|
ie_hack = true
|
|
|
|
document = REXML::Document.new("<empty/>")
|
|
|
|
document.write(output, indent, transitive, ie_hack)
|
|
|
|
assert_equal("<empty />", output)
|
|
|
|
end
|
2012-10-28 02:43:38 -04:00
|
|
|
|
|
|
|
def test_encoding
|
|
|
|
output = ""
|
|
|
|
indent = -1
|
|
|
|
transitive = false
|
|
|
|
ie_hack = false
|
2012-11-02 23:53:09 -04:00
|
|
|
encoding = "Windows-31J"
|
|
|
|
|
2012-11-03 00:58:03 -04:00
|
|
|
@document.xml_decl.encoding = "Shift_JIS"
|
2012-11-02 23:53:09 -04:00
|
|
|
japanese_text = "こんにちは"
|
|
|
|
@document.root.text = japanese_text
|
2012-10-28 02:43:38 -04:00
|
|
|
@document.write(output, indent, transitive, ie_hack, encoding)
|
2012-11-02 23:53:09 -04:00
|
|
|
assert_equal(<<-EOX.encode(encoding), output)
|
2012-11-03 00:58:03 -04:00
|
|
|
<?xml version='1.0' encoding='SHIFT_JIS'?>
|
2012-11-02 23:53:09 -04:00
|
|
|
<message>#{japanese_text}</message>
|
2012-10-28 02:43:38 -04:00
|
|
|
EOX
|
|
|
|
end
|
2012-10-28 01:59:59 -04:00
|
|
|
end
|
|
|
|
|
|
|
|
class OptionsTest < self
|
|
|
|
def test_output
|
|
|
|
output = ""
|
|
|
|
@document.write(:output => output)
|
|
|
|
assert_equal(<<-EOX, output)
|
|
|
|
<?xml version='1.0' encoding='UTF-8'?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_indent
|
|
|
|
output = ""
|
|
|
|
@document.write(:output => output, :indent => 2)
|
|
|
|
assert_equal(<<-EOX.chomp, output)
|
|
|
|
<?xml version='1.0' encoding='UTF-8'?>
|
|
|
|
<message>
|
|
|
|
Hello world!
|
|
|
|
</message>
|
|
|
|
EOX
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_transitive
|
|
|
|
output = ""
|
|
|
|
@document.write(:output => output, :indent => 2, :transitive => true)
|
|
|
|
assert_equal(<<-EOX, output)
|
|
|
|
<?xml version='1.0' encoding='UTF-8'?>
|
|
|
|
<message
|
|
|
|
>Hello world!</message
|
|
|
|
>
|
|
|
|
EOX
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_ie_hack
|
|
|
|
output = ""
|
|
|
|
document = REXML::Document.new("<empty/>")
|
|
|
|
document.write(:output => output, :ie_hack => true)
|
|
|
|
assert_equal("<empty />", output)
|
|
|
|
end
|
2012-10-28 02:43:38 -04:00
|
|
|
|
|
|
|
def test_encoding
|
|
|
|
output = ""
|
2012-11-02 23:53:09 -04:00
|
|
|
encoding = "Windows-31J"
|
2012-11-03 00:58:03 -04:00
|
|
|
@document.xml_decl.encoding = "Shift_JIS"
|
2012-11-02 23:53:09 -04:00
|
|
|
japanese_text = "こんにちは"
|
|
|
|
@document.root.text = japanese_text
|
|
|
|
@document.write(:output => output, :encoding => encoding)
|
|
|
|
assert_equal(<<-EOX.encode(encoding), output)
|
2012-11-03 00:58:03 -04:00
|
|
|
<?xml version='1.0' encoding='SHIFT_JIS'?>
|
2012-11-02 23:53:09 -04:00
|
|
|
<message>#{japanese_text}</message>
|
2012-10-28 02:43:38 -04:00
|
|
|
EOX
|
|
|
|
end
|
2012-10-28 01:59:59 -04:00
|
|
|
end
|
|
|
|
end
|
2012-10-28 08:19:58 -04:00
|
|
|
|
|
|
|
class BomTest < self
|
2012-10-28 08:39:37 -04:00
|
|
|
class HaveEncodingTest < self
|
2012-10-28 10:53:07 -04:00
|
|
|
def test_utf_8
|
|
|
|
xml = <<-EOX.force_encoding("ASCII-8BIT")
|
|
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
|
|
|
bom = "\ufeff".force_encoding("ASCII-8BIT")
|
|
|
|
document = REXML::Document.new(bom + xml)
|
|
|
|
assert_equal("UTF-8", document.encoding)
|
|
|
|
end
|
|
|
|
|
2012-10-28 08:39:37 -04:00
|
|
|
def test_utf_16le
|
|
|
|
xml = <<-EOX.encode("UTF-16LE").force_encoding("ASCII-8BIT")
|
2012-10-28 08:19:58 -04:00
|
|
|
<?xml version="1.0" encoding="UTF-16"?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
2012-10-28 08:39:37 -04:00
|
|
|
bom = "\ufeff".encode("UTF-16LE").force_encoding("ASCII-8BIT")
|
|
|
|
document = REXML::Document.new(bom + xml)
|
|
|
|
assert_equal("UTF-16", document.encoding)
|
|
|
|
end
|
2012-10-28 08:19:58 -04:00
|
|
|
|
2012-10-28 08:39:37 -04:00
|
|
|
def test_utf_16be
|
|
|
|
xml = <<-EOX.encode("UTF-16BE").force_encoding("ASCII-8BIT")
|
2012-10-28 10:54:59 -04:00
|
|
|
<?xml version="1.0" encoding="UTF-16"?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
2012-10-28 08:39:37 -04:00
|
|
|
bom = "\ufeff".encode("UTF-16BE").force_encoding("ASCII-8BIT")
|
|
|
|
document = REXML::Document.new(bom + xml)
|
|
|
|
assert_equal("UTF-16", document.encoding)
|
|
|
|
end
|
2012-10-28 08:19:58 -04:00
|
|
|
end
|
2012-10-28 08:42:37 -04:00
|
|
|
|
|
|
|
class NoEncodingTest < self
|
2012-10-28 10:53:07 -04:00
|
|
|
def test_utf_8
|
|
|
|
xml = <<-EOX.force_encoding("ASCII-8BIT")
|
|
|
|
<?xml version="1.0"?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
|
|
|
bom = "\ufeff".force_encoding("ASCII-8BIT")
|
|
|
|
document = REXML::Document.new(bom + xml)
|
|
|
|
assert_equal("UTF-8", document.encoding)
|
|
|
|
end
|
|
|
|
|
2012-10-28 08:42:37 -04:00
|
|
|
def test_utf_16le
|
|
|
|
xml = <<-EOX.encode("UTF-16LE").force_encoding("ASCII-8BIT")
|
|
|
|
<?xml version="1.0"?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
|
|
|
bom = "\ufeff".encode("UTF-16LE").force_encoding("ASCII-8BIT")
|
|
|
|
document = REXML::Document.new(bom + xml)
|
|
|
|
assert_equal("UTF-16", document.encoding)
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_utf_16be
|
|
|
|
xml = <<-EOX.encode("UTF-16BE").force_encoding("ASCII-8BIT")
|
|
|
|
<?xml version="1.0"?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
|
|
|
bom = "\ufeff".encode("UTF-16BE").force_encoding("ASCII-8BIT")
|
|
|
|
document = REXML::Document.new(bom + xml)
|
|
|
|
assert_equal("UTF-16", document.encoding)
|
|
|
|
end
|
|
|
|
end
|
2012-11-03 01:42:40 -04:00
|
|
|
|
|
|
|
class WriteTest < self
|
|
|
|
def test_utf_16
|
|
|
|
xml = <<-EOX.encode("UTF-16LE").force_encoding("ASCII-8BIT")
|
|
|
|
<?xml version="1.0"?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
|
|
|
bom = "\ufeff".encode("UTF-16LE").force_encoding("ASCII-8BIT")
|
|
|
|
document = REXML::Document.new(bom + xml)
|
|
|
|
|
|
|
|
actual_xml = ""
|
|
|
|
document.write(actual_xml)
|
|
|
|
expected_xml = <<-EOX.encode("UTF-16BE")
|
|
|
|
\ufeff<?xml version='1.0' encoding='UTF-16'?>
|
|
|
|
<message>Hello world!</message>
|
|
|
|
EOX
|
|
|
|
assert_equal(expected_xml, actual_xml)
|
|
|
|
end
|
|
|
|
end
|
2012-10-28 08:19:58 -04:00
|
|
|
end
|
2008-09-01 09:41:38 -04:00
|
|
|
end
|