ruby--ruby/test/csv/test_csv.rb

1521 lines
37 KiB
Ruby
Raw Normal View History

require 'test/unit'
require 'tempfile'
require 'fileutils'
require 'csv'
class CSV
class StreamBuf
# Let buffer work hard.
remove_const("BufSize")
BufSize = 2
end
end
class TestCSV < Test::Unit::TestCase
class << self
def d(data, is_null = false)
CSV::Cell.new(data.to_s, is_null)
end
end
@@colData = ['', nil, true, false, 'foo', '!' * 1000]
@@simpleCSVData = {
[nil] => '',
[''] => '""',
[nil, nil] => ',',
[nil, nil, nil] => ',,',
['foo'] => 'foo',
[','] => '","',
[',', ','] => '",",","',
[';'] => ';',
[';', ';'] => ';,;',
["\"\r", "\"\r"] => "\"\"\"\r\",\"\"\"\r\"",
["\"\n", "\"\n"] => "\"\"\"\n\",\"\"\"\n\"",
["\t"] => "\t",
["\t", "\t"] => "\t,\t",
['foo', 'bar'] => 'foo,bar',
['foo', '"bar"', 'baz'] => 'foo,"""bar""",baz',
['foo', 'foo,bar', 'baz'] => 'foo,"foo,bar",baz',
['foo', '""', 'baz'] => 'foo,"""""",baz',
['foo', '', 'baz'] => 'foo,"",baz',
['foo', nil, 'baz'] => 'foo,,baz',
[nil, 'foo', 'bar'] => ',foo,bar',
['foo', 'bar', nil] => 'foo,bar,',
['foo', "\r", 'baz'] => "foo,\"\r\",baz",
['foo', "\n", 'baz'] => "foo,\"\n\",baz",
['foo', "\r\n\r", 'baz'] => "foo,\"\r\n\r\",baz",
['foo', "\r\n", 'baz'] => "foo,\"\r\n\",baz",
['foo', "\r.\n", 'baz'] => "foo,\"\r.\n\",baz",
['foo', "\r\n\n", 'baz'] => "foo,\"\r\n\n\",baz",
['foo', '"', 'baz'] => 'foo,"""",baz',
}
@@fullCSVData = {
[d('', true)] => '',
[d('')] => '""',
[d('', true), d('', true)] => ',',
[d('', true), d('', true), d('', true)] => ',,',
[d('foo')] => 'foo',
[d('foo'), d('bar')] => 'foo,bar',
[d('foo'), d('"bar"'), d('baz')] => 'foo,"""bar""",baz',
[d('foo'), d('foo,bar'), d('baz')] => 'foo,"foo,bar",baz',
[d('foo'), d('""'), d('baz')] => 'foo,"""""",baz',
[d('foo'), d(''), d('baz')] => 'foo,"",baz',
[d('foo'), d('', true), d('baz')] => 'foo,,baz',
[d('foo'), d("\r"), d('baz')] => "foo,\"\r\",baz",
[d('foo'), d("\n"), d('baz')] => "foo,\"\n\",baz",
[d('foo'), d("\r\n"), d('baz')] => "foo,\"\r\n\",baz",
[d('foo'), d("\r.\n"), d('baz')] => "foo,\"\r.\n\",baz",
[d('foo'), d("\r\n\n"), d('baz')] => "foo,\"\r\n\n\",baz",
[d('foo'), d('"'), d('baz')] => 'foo,"""",baz',
}
@@fullCSVDataArray = @@fullCSVData.collect { |key, value| key }
def ssv2csv(ssvStr)
sepConv(ssvStr, ?;, ?,)
end
def csv2ssv(csvStr)
sepConv(csvStr, ?,, ?;)
end
def tsv2csv(tsvStr)
sepConv(tsvStr, ?\t, ?,)
end
def csv2tsv(csvStr)
sepConv(csvStr, ?,, ?\t)
end
def sepConv(srcStr, srcSep, destSep)
rows = CSV::Row.new
cols, idx = CSV.parse_row(srcStr, 0, rows, srcSep)
destStr = ''
cols = CSV.generate_row(rows, rows.size, destStr, destSep)
destStr
end
public
def setup
@tmpdir = File.join(Dir.tmpdir, "ruby_test_csv_tmp_#{$$}")
Dir.mkdir(@tmpdir)
@infile = File.join(@tmpdir, 'in.csv')
@infiletsv = File.join(@tmpdir, 'in.tsv')
@emptyfile = File.join(@tmpdir, 'empty.csv')
@outfile = File.join(@tmpdir, 'out.csv')
@bomfile = File.join(File.dirname(__FILE__), "bom.csv")
CSV.open(@infile, "w") do |writer|
@@fullCSVDataArray.each do |row|
writer.add_row(row)
end
end
CSV.open(@infiletsv, "w", ?\t) do |writer|
@@fullCSVDataArray.each do |row|
writer.add_row(row)
end
end
CSV.generate(@emptyfile) do |writer|
# Create empty file.
end
end
def teardown
FileUtils.rm_rf(@tmpdir)
end
def d(*arg)
TestCSV.d(*arg)
end
#### CSV::Cell unit test
def test_Cell_EQUAL # '=='
d1 = CSV::Cell.new('d', false)
d2 = CSV::Cell.new('d', false)
d3 = CSV::Cell.new('d', true)
d4 = CSV::Cell.new('d', true)
assert(d1 == d2, "Normal case.")
assert(d1 != d3, "RHS is null.")
assert(d4 != d1, "LHS is null.")
assert(d3 != d4, "Either is null.")
end
def test_Cell_match
d1 = CSV::Cell.new('d', false)
d2 = CSV::Cell.new('d', false)
d3 = CSV::Cell.new('d', true)
d4 = CSV::Cell.new('d', true)
assert(d1.match(d2), "Normal case.")
assert(!d1.match(d3), "RHS is null.")
assert(!d4.match(d1), "LHS is null.")
assert(d3.match(d4), "Either is null.")
end
def test_Cell_data
d = CSV::Cell.new()
@@colData.each do |v|
d.data = v
assert_equal(d.data, v, "Case: #{ v }.")
end
end
def test_Cell_data=
d = CSV::Cell.new()
@@colData.each do |v|
d.data = v
assert_equal(d.data, v, "Case: #{ v }.")
end
end
def test_Cell_is_null
d = CSV::Cell.new()
d.is_null = true
assert_equal(d.is_null, true, "Case: true.")
d.is_null = false
assert_equal(d.is_null, false, "Case: false.")
end
def test_Cell_is_null=
d = CSV::Cell.new()
d.is_null = true
assert_equal(d.is_null, true, "Case: true.")
d.is_null = false
assert_equal(d.is_null, false, "Case: false.")
end
def test_Cell_s_new
d1 = CSV::Cell.new()
assert_equal(d1.data, '', "Default: data.")
assert_equal(d1.is_null, true, "Default: is_null.")
@@colData.each do |v|
d = CSV::Cell.new(v)
assert_equal(d.data, v, "Data: #{ v }.")
end
d2 = CSV::Cell.new(nil, true)
assert_equal(d2.is_null, true, "Data: true.")
d3 = CSV::Cell.new(nil, false)
assert_equal(d3.is_null, false, "Data: false.")
end
#### CSV::Row unit test
def test_Row_s_match
c1 = CSV::Row[d(1), d(2), d(3)]
c2 = CSV::Row[d(1, false), d(2, false), d(3, false)]
assert(c1.match(c2), "Normal case.")
c1 = CSV::Row[d(1), d('foo', true), d(3)]
c2 = CSV::Row[d(1, false), d('bar', true), d(3, false)]
assert(c1.match(c2), "Either is null.")
c1 = CSV::Row[d(1), d('foo', true), d(3)]
c2 = CSV::Row[d(1, false), d('bar', false), d(3, false)]
assert(!c1.match(c2), "LHS is null.")
c1 = CSV::Row[d(1), d('foo'), d(3)]
c2 = CSV::Row[d(1, false), d('bar', true), d(3, false)]
assert(!c1.match(c2), "RHS is null.")
c1 = CSV::Row[d(1), d('', true), d(3)]
c2 = CSV::Row[d(1, false), d('', true), d(3, false)]
assert(c1.match(c2), "Either is null(empty data).")
c1 = CSV::Row[d(1), d('', true), d(3)]
c2 = CSV::Row[d(1, false), d('', false), d(3, false)]
assert(!c1.match(c2), "LHS is null(empty data).")
c1 = CSV::Row[d(1), d(''), d(3)]
c2 = CSV::Row[d(1, false), d('', true), d(3, false)]
assert(!c1.match(c2), "RHS is null(empty data).")
c1 = CSV::Row[]
c2 = CSV::Row[]
assert(c1.match(c2))
c1 = CSV::Row[]
c2 = CSV::Row[d(1)]
assert(!c1.match(c2))
end
def test_Row_to_a
r = CSV::Row[d(1), d(2), d(3)]
assert_equal(['1', '2', '3'], r.to_a, 'Normal case')
r = CSV::Row[d(1)]
assert_equal(['1'], r.to_a, '1 item')
r = CSV::Row[d(nil, true), d(2), d(3)]
assert_equal([nil, '2', '3'], r.to_a, 'Null in data')
r = CSV::Row[d(nil, true), d(nil, true), d(nil, true)]
assert_equal([nil, nil, nil], r.to_a, 'Nulls')
r = CSV::Row[d(nil, true)]
assert_equal([nil], r.to_a, '1 Null')
r = CSV::Row[]
assert_equal([], r.to_a, 'Empty')
end
#### CSV::Reader unit test
def test_Reader_each
file = File.open(@infile, "rb")
begin
reader = CSV::Reader.create(file)
expectedArray = @@fullCSVDataArray.dup
first = true
ret = reader.each { |row|
if first
assert_instance_of(CSV::Row, row)
first = false
end
expected = expectedArray.shift
assert(row.match(expected))
}
assert_nil(ret, "Return is nil")
assert(expectedArray.empty?)
ensure
file.close
end
# Illegal format.
reader = CSV::Reader.create("a,b\r\na,b,\"c\"\ra")
assert_raises(CSV::IllegalFormatError) do
reader.each do |row|
end
end
reader = CSV::Reader.create("a,b\r\n\"")
assert_raises(CSV::IllegalFormatError) do
reader.each do |row|
end
end
end
def test_Reader_shift
file = File.open(@infile, "rb")
begin
reader = CSV::Reader.create(file)
first = true
checked = 0
@@fullCSVDataArray.each do |expected|
actual = reader.shift
if first
assert_instance_of(CSV::Row, actual)
first = false
end
assert(actual.match(expected))
checked += 1
end
assert(checked == @@fullCSVDataArray.size)
ensure
file.close
end
# Illegal format.
reader = CSV::Reader.create("a,b\r\na,b,\"c\"\ra")
assert_raises(CSV::IllegalFormatError) do
reader.shift
reader.shift
end
reader = CSV::Reader.create("a,b\r\na,b,\"c\"\ra")
assert_raises(CSV::IllegalFormatError) do
reader.shift
reader.shift
end
end
def test_Reader_getRow
if CSV::Reader.respond_to?(:allocate)
obj = CSV::Reader.allocate
assert_raises(NotImplementedError) do
row = []
obj.shift
end
end
end
def test_IOReader_close_on_terminate
f = File.open(@infile, "r")
reader = CSV::IOReader.create(f)
reader.close
assert(!f.closed?)
f.close
f = File.open(@infile, "r")
writer = CSV::IOReader.create(f)
writer.close_on_terminate
writer.close
assert(f.closed?)
end
def test_Reader_close
f = File.open(@infile, "r")
reader = CSV::IOReader.create(f)
reader.close_on_terminate
reader.close
assert(f.closed?)
end
def test_Reader_s_new
assert_raises(RuntimeError) do
CSV::Reader.new(nil)
end
end
def test_Reader_s_create
reader = CSV::Reader.create("abc")
assert_instance_of(CSV::StringReader, reader, "With a String")
file = File.open(@infile, "rb")
reader = CSV::Reader.create(file)
assert_instance_of(CSV::IOReader, reader, 'With an IO')
obj = Object.new
def obj.sysread(size)
"abc"
end
def obj.read(size)
"abc"
end
reader = CSV::Reader.create(obj)
assert_instance_of(CSV::IOReader, reader, "With not an IO or String")
# No need to test Tempfile because it's a pseudo IO. I test this here
# fors other tests.
reader = CSV::Reader.create(Tempfile.new("in.csv"))
assert_instance_of(CSV::IOReader, reader, "With an pseudo IO.")
file.close
end
def test_Reader_s_parse
ret = CSV::Reader.parse("a,b,c") { |row|
assert_instance_of(CSV::Row, row, "Block parameter")
}
assert_nil(ret, "Return is nil")
ret = CSV::Reader.parse("a;b;c", ?;) { |row|
assert_instance_of(CSV::Row, row, "Block parameter")
}
file = Tempfile.new("in.csv")
file << "a,b,c"
file.open
ret = CSV::Reader.parse(file) { |row|
assert_instance_of(CSV::Row, row, "Block parameter")
}
assert_nil(ret, "Return is nil")
file = Tempfile.new("in.csv")
file << "a,b,c"
file.open
ret = CSV::Reader.parse(file, ?,) { |row|
assert_instance_of(CSV::Row, row, "Block parameter")
}
# Illegal format.
assert_raises(CSV::IllegalFormatError) do
CSV::Reader.parse("a,b\r\na,b,\"c\"\ra") do |row|
end
end
assert_raises(CSV::IllegalFormatError) do
CSV::Reader.parse("a,b\r\na,b\"") do |row|
end
end
end
#### CSV::Writer unit test
def test_Writer_s_new
assert_raises(RuntimeError) do
CSV::Writer.new(nil)
end
end
def test_Writer_s_generate
ret = CSV::Writer.generate(STDOUT) { |writer|
assert_instance_of(CSV::BasicWriter, writer, "Block parameter")
}
ret = CSV::Writer.generate(STDOUT, ?;) { |writer|
assert_instance_of(CSV::BasicWriter, writer, "Block parameter")
}
assert_nil(ret, "Return is nil")
end
def test_Writer_s_create
writer = CSV::Writer.create(STDERR)
assert_instance_of(CSV::BasicWriter, writer, "String")
writer = CSV::Writer.create(STDERR, ?;)
assert_instance_of(CSV::BasicWriter, writer, "String")
writer = CSV::Writer.create(Tempfile.new("out.csv"))
assert_instance_of(CSV::BasicWriter, writer, "IO")
end
def test_Writer_LSHIFT # '<<'
file = Tempfile.new("out.csv")
CSV::Writer.generate(file) do |writer|
ret = writer << ['a', 'b', 'c']
assert_instance_of(CSV::BasicWriter, ret, 'Return is self')
writer << [nil, 'e', 'f'] << [nil, nil, '']
end
str = file.open.read
assert_equal("a,b,c\r\n,e,f\r\n,,\"\"\r\n", str, 'Normal')
file = Tempfile.new("out2.csv")
CSV::Writer.generate(file) do |writer|
ret = writer << [d('a'), d('b'), d('c')]
assert_instance_of(CSV::BasicWriter, ret, 'Return is self')
writer << [d(nil, true), d('e'), d('f')] << [d(nil, true), d(nil, true), d('')]
end
str = file.open.read
assert_equal("a,b,c\r\n,e,f\r\n,,\"\"\r\n", str, 'Normal')
end
def test_Writer_add_row
file = Tempfile.new("out.csv")
CSV::Writer.generate(file) do |writer|
ret = writer.add_row(
[d('a', false), d('b', false), d('c', false)])
assert_instance_of(CSV::BasicWriter, ret, 'Return is self')
writer.add_row(
[d('dummy', true), d('e', false), d('f', false)]
).add_row(
[d('a', true), d('b', true), d('', false)]
)
end
str = file.open.read
assert_equal("a,b,c\r\n,e,f\r\n,,\"\"\r\n", str, 'Normal')
end
def test_Writer_close
f = File.open(@outfile, "w")
writer = CSV::BasicWriter.create(f)
writer.close_on_terminate
writer.close
assert(f.closed?)
end
def test_BasicWriter_close_on_terminate
f = File.open(@outfile, "w")
writer = CSV::BasicWriter.create(f)
writer.close
assert(!f.closed?)
f.close
f = File.open(@outfile, "w")
writer = CSV::BasicWriter.create(f)
writer.close_on_terminate
writer.close
assert(f.closed?)
end
#### CSV unit test
def test_s_open_reader
assert_raises(ArgumentError, 'Illegal mode') do
CSV.open("temp", "a")
end
assert_raises(ArgumentError, 'Illegal mode') do
CSV.open("temp", "a", ?;)
end
reader = CSV.open(@infile, "r")
assert_instance_of(CSV::IOReader, reader)
reader.close
reader = CSV.open(@infile, "rb")
assert_instance_of(CSV::IOReader, reader)
reader.close
reader = CSV.open(@infile, "r", ?;)
assert_instance_of(CSV::IOReader, reader)
reader.close
CSV.open(@infile, "r") do |row|
assert_instance_of(CSV::Row, row)
break
end
CSV.open(@infiletsv, "r", ?\t) do |row|
assert_instance_of(CSV::Row, row)
break
end
assert_raises(Errno::ENOENT) do
CSV.open("NoSuchFileOrDirectory", "r")
end
assert_raises(Errno::ENOENT) do
CSV.open("NoSuchFileOrDirectory", "r", ?;)
end
# Illegal format.
File.open(@outfile, "w") do |f|
f << "a,b\r\na,b,\"c\"\ra"
end
assert_raises(CSV::IllegalFormatError) do
CSV.open(@outfile, "r") do |row|
end
end
File.open(@outfile, "w") do |f|
f << "a,b\r\na,b\""
end
assert_raises(CSV::IllegalFormatError) do
CSV.open(@outfile, "r") do |row|
end
end
CSV.open(@emptyfile, "r") do |row|
assert_fail("Must not reach here")
end
end
def test_s_parse
reader = CSV.parse(@infile)
assert_instance_of(CSV::IOReader, reader)
reader.close
reader = CSV.parse(@infile)
assert_instance_of(CSV::IOReader, reader)
reader.close
reader = CSV.parse(@infile, ?;)
assert_instance_of(CSV::IOReader, reader)
reader.close
CSV.parse(@infile) do |row|
assert_instance_of(CSV::Row, row)
break
end
CSV.parse(@infiletsv, ?\t) do |row|
assert_instance_of(CSV::Row, row)
break
end
assert_raises(Errno::ENOENT) do
CSV.parse("NoSuchFileOrDirectory")
end
assert_raises(Errno::ENOENT) do
CSV.parse("NoSuchFileOrDirectory", ?;)
end
CSV.parse(@emptyfile) do |row|
assert_fail("Must not reach here")
end
end
def test_s_open_writer
writer = CSV.open(@outfile, "w")
assert_instance_of(CSV::BasicWriter, writer)
writer.close
writer = CSV.open(@outfile, "wb")
assert_instance_of(CSV::BasicWriter, writer)
writer.close
writer = CSV.open(@outfile, "wb", ?;)
assert_instance_of(CSV::BasicWriter, writer)
writer.close
CSV.open(@outfile, "w") do |writer|
assert_instance_of(CSV::BasicWriter, writer)
end
CSV.open(@outfile, "w", ?;) do |writer|
assert_instance_of(CSV::BasicWriter, writer)
end
begin
CSV.open(@tmpdir, "w")
assert(false)
rescue Exception => ex
assert(ex.is_a?(Errno::EEXIST) || ex.is_a?(Errno::EISDIR) || ex.is_a?(Errno::EACCES))
end
end
def test_s_generate
writer = CSV.generate(@outfile)
assert_instance_of(CSV::BasicWriter, writer)
writer.close
writer = CSV.generate(@outfile, ?;)
assert_instance_of(CSV::BasicWriter, writer)
writer.close
CSV.generate(@outfile) do |writer|
assert_instance_of(CSV::BasicWriter, writer)
end
CSV.generate(@outfile, ?;) do |writer|
assert_instance_of(CSV::BasicWriter, writer)
end
begin
CSV.generate(@tmpdir)
assert(false)
rescue Exception => ex
assert(ex.is_a?(Errno::EEXIST) || ex.is_a?(Errno::EISDIR) || ex.is_a?(Errno::EACCES))
end
end
def test_s_generate_line
str = CSV.generate_line([])
assert_equal('', str, "Extra boundary check.")
str = CSV.generate_line([], ?;)
assert_equal('', str, "Extra boundary check.")
@@simpleCSVData.each do |col, str|
buf = CSV.generate_line(col)
assert_equal(str, buf)
end
@@simpleCSVData.each do |col, str|
buf = CSV.generate_line(col, ?;)
assert_equal(str + "\r\n", ssv2csv(buf))
end
@@simpleCSVData.each do |col, str|
buf = CSV.generate_line(col, ?\t)
assert_equal(str + "\r\n", tsv2csv(buf))
end
end
def test_s_generate_row
buf = ''
cols = CSV.generate_row([], 0, buf)
assert_equal(0, cols)
assert_equal("\r\n", buf, "Extra boundary check.")
buf = ''
cols = CSV.generate_row([], 0, buf, ?;)
assert_equal(0, cols)
assert_equal("\r\n", buf, "Extra boundary check.")
buf = ''
cols = CSV.generate_row([], 0, buf, ?\t)
assert_equal(0, cols)
assert_equal("\r\n", buf, "Extra boundary check.")
buf = ''
cols = CSV.generate_row([d(1)], 2, buf)
assert_equal('1,', buf)
buf = ''
cols = CSV.generate_row([d(1)], 2, buf, ?;)
assert_equal('1;', buf)
buf = ''
cols = CSV.generate_row([d(1)], 2, buf, ?\t)
assert_equal("1\t", buf)
buf = ''
cols = CSV.generate_row([d(1), d(2)], 1, buf)
assert_equal("1\r\n", buf)
buf = ''
cols = CSV.generate_row([d(1), d(2)], 1, buf, ?;)
assert_equal("1\r\n", buf)
buf = ''
cols = CSV.generate_row([d(1), d(2)], 1, buf, ?\t)
assert_equal("1\r\n", buf)
@@fullCSVData.each do |col, str|
buf = ''
cols = CSV.generate_row(col, col.size, buf)
assert_equal(col.size, cols)
assert_equal(str + "\r\n", buf)
end
@@fullCSVData.each do |col, str|
buf = ''
cols = CSV.generate_row(col, col.size, buf, ?;)
assert_equal(col.size, cols)
assert_equal(str + "\r\n", ssv2csv(buf))
end
@@fullCSVData.each do |col, str|
buf = ''
cols = CSV.generate_row(col, col.size, buf, ?\t)
assert_equal(col.size, cols)
assert_equal(str + "\r\n", tsv2csv(buf))
end
buf = ''
toBe = ''
cols = 0
colsToBe = 0
@@fullCSVData.each do |col, str|
cols += CSV.generate_row(col, col.size, buf)
toBe << str << "\r\n"
colsToBe += col.size
end
assert_equal(colsToBe, cols)
assert_equal(toBe, buf)
buf = ''
toBe = ''
cols = 0
colsToBe = 0
@@fullCSVData.each do |col, str|
lineBuf = ''
cols += CSV.generate_row(col, col.size, lineBuf, ?;)
buf << ssv2csv(lineBuf) << "\r\n"
toBe << ssv2csv(lineBuf) << "\r\n"
colsToBe += col.size
end
assert_equal(colsToBe, cols)
assert_equal(toBe, buf)
buf = ''
toBe = ''
cols = 0
colsToBe = 0
@@fullCSVData.each do |col, str|
lineBuf = ''
cols += CSV.generate_row(col, col.size, lineBuf, ?\t)
buf << tsv2csv(lineBuf) << "\r\n"
toBe << tsv2csv(lineBuf) << "\r\n"
colsToBe += col.size
end
assert_equal(colsToBe, cols)
assert_equal(toBe, buf)
end
def test_s_parse_line
@@simpleCSVData.each do |col, str|
row = CSV.parse_line(str)
assert_instance_of(CSV::Row, row)
assert_equal(col.size, row.size)
assert_equal(col, row)
end
@@simpleCSVData.each do |col, str|
str = csv2ssv(str)
row = CSV.parse_line(str, ?;)
assert_instance_of(CSV::Row, row)
assert_equal(col.size, row.size)
assert_equal(col, row)
end
@@simpleCSVData.each do |col, str|
str = csv2tsv(str)
row = CSV.parse_line(str, ?\t)
assert_instance_of(CSV::Row, row)
assert_equal(col.size, row.size)
assert_equal(col, row)
end
# Illegal format.
buf = CSV::Row.new
row = CSV.parse_line("a,b,\"c\"\ra")
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
buf = CSV::Row.new
row = CSV.parse_line("a;b;\"c\"\ra", ?;)
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
buf = CSV::Row.new
row = CSV.parse_line("a\tb\t\"c\"\ra", ?\t)
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
row = CSV.parse_line("a,b\"")
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
row = CSV.parse_line("a;b\"", ?;)
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
row = CSV.parse_line("a\tb\"", ?\t)
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
row = CSV.parse_line("\"a,b\"\r,")
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
row = CSV.parse_line("\"a;b\"\r;", ?;)
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
row = CSV.parse_line("\"a\tb\"\r\t", ?\t)
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
row = CSV.parse_line("\"a,b\"\r\"")
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
row = CSV.parse_line("\"a;b\"\r\"", ?;)
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
row = CSV.parse_line("\"a\tb\"\r\"", ?\t)
assert_instance_of(CSV::Row, row)
assert_equal(0, row.size)
end
def test_s_parse_row
@@fullCSVData.each do |col, str|
buf = CSV::Row.new
cols, idx = CSV.parse_row(str + "\r\n", 0, buf)
assert_equal(cols, buf.size, "Reported size.")
assert_equal(col.size, buf.size, "Size.")
assert(buf.match(col))
buf = CSV::Row.new
cols, idx = CSV.parse_row(str + "\n", 0, buf)
assert_equal(cols, buf.size, "Reported size.")
assert_equal(col.size, buf.size, "Size.")
assert(buf.match(col))
end
@@fullCSVData.each do |col, str|
str = csv2ssv(str)
buf = CSV::Row.new
cols, idx = CSV.parse_row(str + "\r\n", 0, buf, ?;)
assert_equal(cols, buf.size, "Reported size.")
assert_equal(col.size, buf.size, "Size.")
assert(buf.match(col))
end
@@fullCSVData.each do |col, str|
str = csv2tsv(str)
buf = CSV::Row.new
cols, idx = CSV.parse_row(str + "\r\n", 0, buf, ?\t)
assert_equal(cols, buf.size, "Reported size.")
assert_equal(col.size, buf.size, "Size.")
assert(buf.match(col))
end
buf = CSV::Row.new
cols, idx = CSV.parse_row("a,b,\"c\r\"", 0, buf)
assert_equal(["a", "b", "c\r"], buf.to_a)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a;b;\"c\r\"", 0, buf, ?;)
assert_equal(["a", "b", "c\r"], buf.to_a)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a\tb\t\"c\r\"", 0, buf, ?\t)
assert_equal(["a", "b", "c\r"], buf.to_a)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a,b,c\n", 0, buf)
assert_equal(["a", "b", "c"], buf.to_a)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a\tb\tc\n", 0, buf, ?\t)
assert_equal(["a", "b", "c"], buf.to_a)
# Illegal format.
buf = CSV::Row.new
cols, idx = CSV.parse_row("a,b,c\"", 0, buf)
assert_equal(0, cols, "Illegal format; unbalanced double-quote.")
buf = CSV::Row.new
cols, idx = CSV.parse_row("a;b;c\"", 0, buf, ?;)
assert_equal(0, cols, "Illegal format; unbalanced double-quote.")
buf = CSV::Row.new
cols, idx = CSV.parse_row("a,b,\"c\"\ra", 0, buf)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a,b,\"c\"\ra", 0, buf, ?;)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a,b\"", 0, buf)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a;b\"", 0, buf, ?;)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("\"a,b\"\r,", 0, buf)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a\r,", 0, buf)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a\r", 0, buf)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a\rbc", 0, buf)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a\r\"\"", 0, buf)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("a\r\rabc,", 0, buf)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("\"a;b\"\r;", 0, buf, ?;)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("\"a,b\"\r\"", 0, buf)
assert_equal(0, cols)
assert_equal(0, idx)
buf = CSV::Row.new
cols, idx = CSV.parse_row("\"a;b\"\r\"", 0, buf, ?;)
assert_equal(0, cols)
assert_equal(0, idx)
end
def test_s_parse_rowEOF
@@fullCSVData.each do |col, str|
if str == ''
# String "" is not allowed.
next
end
buf = CSV::Row.new
cols, idx = CSV.parse_row(str, 0, buf)
assert_equal(col.size, cols, "Reported size.")
assert_equal(col.size, buf.size, "Size.")
assert(buf.match(col))
end
end
def test_s_parse_rowConcat
buf = ''
toBe = []
@@fullCSVData.each do |col, str|
buf << str << "\r\n"
toBe.concat(col)
end
idx = 0
cols = 0
parsed = CSV::Row.new
parsedCols = 0
begin
cols, idx = CSV.parse_row(buf, idx, parsed)
parsedCols += cols
end while cols > 0
assert_equal(toBe.size, parsedCols)
assert_equal(toBe.size, parsed.size)
assert(parsed.match(toBe))
buf = ''
toBe = []
@@fullCSVData.each do |col, str|
buf << str << "\n"
toBe.concat(col)
end
idx = 0
cols = 0
parsed = CSV::Row.new
parsedCols = 0
begin
cols, idx = CSV.parse_row(buf, idx, parsed)
parsedCols += cols
end while cols > 0
assert_equal(toBe.size, parsedCols)
assert_equal(toBe.size, parsed.size)
assert(parsed.match(toBe))
buf = ''
toBe = []
@@fullCSVData.sort { |a, b|
a[0].length <=> b[0].length
}.each do |col, str|
buf << str << "\n"
toBe.concat(col)
end
idx = 0
cols = 0
parsed = CSV::Row.new
parsedCols = 0
begin
cols, idx = CSV.parse_row(buf, idx, parsed)
parsedCols += cols
end while cols > 0
assert_equal(toBe.size, parsedCols)
assert_equal(toBe.size, parsed.size)
assert(parsed.match(toBe))
end
def test_utf8
rows = []
CSV.open(@bomfile, "r") do |row|
rows << row.to_a
end
assert_equal([["foo"], ["bar"]], rows)
rows = []
file = File.open(@bomfile)
CSV::Reader.parse(file.read) do |row|
rows << row.to_a
end
assert_equal([["foo"], ["bar"]], rows)
file.close
end
#### CSV unit test
InputStreamPattern = '0123456789'
InputStreamPatternSize = InputStreamPattern.size
def expChar(idx)
InputStreamPattern[idx % InputStreamPatternSize]
end
def expStr(idx, n)
if n > InputStreamPatternSize
InputStreamPattern + expStr(0, n - InputStreamPatternSize)
else
InputStreamPattern[idx % InputStreamPatternSize, n]
end
end
def setupInputStream(size, bufSize = nil)
setBufSize(bufSize) if bufSize
m = ((size / InputStreamPatternSize) + 1).to_i
File.open(@outfile, "wb") do |f|
f << (InputStreamPattern * m)[0, size]
end
file = File.open(@outfile, "rb")
buf = CSV::IOBuf.new(file)
if block_given?
yield(buf)
file.close
nil
else
buf
end
end
def setBufSize(size)
CSV::StreamBuf.module_eval('remove_const("BufSize")')
CSV::StreamBuf.module_eval("BufSize = #{ size }")
end
class StrBuf < CSV::StreamBuf
private
def initialize(string)
@str = string
@idx = 0
super()
end
def read(size)
str = @str[@idx, size]
if str.empty?
nil
else
@idx += str.size
str
end
end
end
class ErrBuf < CSV::StreamBuf
class Error < RuntimeError; end
private
def initialize
@first = true
super()
end
def read(size)
if @first
@first = false
"a" * size
else
raise ErrBuf::Error.new
end
end
end
def test_StreamBuf_MyBuf
# At first, check ruby's behaviour.
s = "abc"
assert_equal(?a, s[0])
assert_equal(?b, s[1])
assert_equal(?c, s[2])
assert_equal(nil, s[3])
assert_equal("a", s[0, 1])
assert_equal("b", s[1, 1])
assert_equal("c", s[2, 1])
assert_equal("", s[3, 1])
assert_equal(nil, s[4, 1])
s = StrBuf.new("abc")
assert_equal(?a, s[0])
assert_equal(?b, s.get(1))
assert_equal(?c, s[2])
assert_equal(nil, s.get(3))
assert_equal("a", s[0, 1])
assert_equal("b", s.get(1, 1))
assert_equal("c", s[2, 1])
assert_equal("", s.get(3, 1))
assert_equal(nil, s[4, 1])
dropped = s.drop(1)
assert_equal(1, dropped)
assert_equal(?b, s[0])
assert(!s.is_eos?)
dropped = s.drop(1)
assert_equal(1, dropped)
assert_equal(?c, s[0])
assert(!s.is_eos?)
dropped = s.drop(1)
assert_equal(1, dropped)
assert_equal(nil, s[0])
assert(s.is_eos?)
dropped = s.drop(1)
assert_equal(0, dropped)
assert_equal(nil, s[0])
assert(s.is_eos?)
s = StrBuf.new("")
assert_equal(nil, s[0])
s = StrBuf.new("")
dropped = s.drop(1)
assert_equal(0, dropped)
assert_raises(TestCSV::ErrBuf::Error) do
s = ErrBuf.new
s[1024]
end
assert_raises(TestCSV::ErrBuf::Error) do
s = ErrBuf.new
s.drop(1024)
end
end
def test_StreamBuf_AREF # '[idx]'
setupInputStream(22, 1024) do |s|
[0, 1, 9, 10, 19, 20, 21].each do |idx|
assert_equal(expChar(idx), s[idx], idx.to_s)
end
[22, 23].each do |idx|
assert_equal(nil, s[idx], idx.to_s)
end
assert_equal(nil, s[-1])
end
setupInputStream(22, 1) do |s|
[0, 1, 9, 10, 19, 20, 21].each do |idx|
assert_equal(expChar(idx), s[idx], idx.to_s)
end
[22, 23].each do |idx|
assert_equal(nil, s[idx], idx.to_s)
end
end
setupInputStream(1024, 1) do |s|
[1023, 0].each do |idx|
assert_equal(expChar(idx), s[idx], idx.to_s)
end
[1024, 1025].each do |idx|
assert_equal(nil, s[idx], idx.to_s)
end
end
setupInputStream(1, 1) do |s|
[0].each do |idx|
assert_equal(expChar(idx), s[idx], idx.to_s)
end
[1, 2].each do |idx|
assert_equal(nil, s[idx], idx.to_s)
end
end
end
def test_StreamBuf_AREF_n # '[idx, n]'
# At first, check ruby's behaviour.
assert_equal("", "abc"[3, 1])
assert_equal(nil, "abc"[4, 1])
setupInputStream(22, 1024) do |s|
[0, 1, 9, 10, 19, 20, 21].each do |idx|
assert_equal(expStr(idx, 1), s[idx, 1], idx.to_s)
end
assert_equal("", s[22, 1])
assert_equal(nil, s[23, 1])
end
setupInputStream(22, 1) do |s|
[0, 1, 9, 10, 19, 20, 21].each do |idx|
assert_equal(expStr(idx, 1), s[idx, 1], idx.to_s)
end
assert_equal("", s[22, 1])
assert_equal(nil, s[23, 1])
end
setupInputStream(1024, 1) do |s|
[1023, 0].each do |idx|
assert_equal(expStr(idx, 1), s[idx, 1], idx.to_s)
end
assert_equal("", s[1024, 1])
assert_equal(nil, s[1025, 1])
end
setupInputStream(1, 1) do |s|
[0].each do |idx|
assert_equal(expStr(idx, 1), s[idx, 1], idx.to_s)
end
assert_equal("", s[1, 1])
assert_equal(nil, s[2, 1])
end
setupInputStream(22, 11) do |s|
[0, 1, 10, 11, 20].each do |idx|
assert_equal(expStr(idx, 2), s[idx, 2], idx.to_s)
end
assert_equal(expStr(21, 1), s[21, 2])
assert_equal(expStr(0, 12), s[0, 12])
assert_equal(expStr(10, 12), s[10, 12])
assert_equal(expStr(10, 12), s[10, 13])
assert_equal(expStr(10, 12), s[10, 14])
assert_equal(expStr(10, 12), s[10, 1024])
assert_equal(nil, s[0, -1])
assert_equal(nil, s[21, -1])
assert_equal(nil, s[-1, 10])
assert_equal(nil, s[-1, -1])
end
end
def test_StreamBuf_get
setupInputStream(22, 1024) do |s|
[0, 1, 9, 10, 19, 20, 21].each do |idx|
assert_equal(expChar(idx), s.get(idx), idx.to_s)
end
[22, 23].each do |idx|
assert_equal(nil, s.get(idx), idx.to_s)
end
assert_equal(nil, s.get(-1))
end
end
def test_StreamBuf_get_n
setupInputStream(22, 1024) do |s|
[0, 1, 9, 10, 19, 20, 21].each do |idx|
assert_equal(expStr(idx, 1), s.get(idx, 1), idx.to_s)
end
assert_equal("", s.get(22, 1))
assert_equal(nil, s.get(23, 1))
assert_equal(nil, s.get(-1, 1))
assert_equal(nil, s.get(-1, -1))
end
end
def test_StreamBuf_drop
setupInputStream(22, 1024) do |s|
assert_equal(expChar(0), s[0])
assert_equal(expChar(21), s[21])
assert_equal(nil, s[22])
dropped = s.drop(-1)
assert_equal(0, dropped)
assert_equal(expChar(0), s[0])
dropped = s.drop(0)
assert_equal(0, dropped)
assert_equal(expChar(0), s[0])
dropped = s.drop(1)
assert_equal(1, dropped)
assert_equal(expChar(1), s[0])
assert_equal(expChar(2), s[1])
dropped = s.drop(1)
assert_equal(1, dropped)
assert_equal(expChar(2), s[0])
assert_equal(expChar(3), s[1])
end
setupInputStream(4, 2) do |s|
dropped = s.drop(2)
assert_equal(2, dropped)
assert_equal(expChar(2), s[0])
assert_equal(expChar(3), s[1])
dropped = s.drop(1)
assert_equal(1, dropped)
assert_equal(expChar(3), s[0])
assert_equal(nil, s[1])
dropped = s.drop(1)
assert_equal(1, dropped)
assert_equal(nil, s[0])
assert_equal(nil, s[1])
dropped = s.drop(0)
assert_equal(0, dropped)
assert_equal(nil, s[0])
assert_equal(nil, s[1])
end
setupInputStream(6, 3) do |s|
dropped = s.drop(2)
assert_equal(2, dropped)
dropped = s.drop(2)
assert_equal(2, dropped)
assert_equal(expChar(4), s[0])
assert_equal(expChar(5), s[1])
dropped = s.drop(3)
assert_equal(2, dropped)
assert_equal(nil, s[0])
assert_equal(nil, s[1])
end
end
def test_StreamBuf_is_eos?
setupInputStream(3, 1024) do |s|
assert(!s.is_eos?)
s.drop(1)
assert(!s.is_eos?)
s.drop(1)
assert(!s.is_eos?)
s.drop(1)
assert(s.is_eos?)
s.drop(1)
assert(s.is_eos?)
end
setupInputStream(3, 2) do |s|
assert(!s.is_eos?)
s.drop(1)
assert(!s.is_eos?)
s.drop(1)
assert(!s.is_eos?)
s.drop(1)
assert(s.is_eos?)
s.drop(1)
assert(s.is_eos?)
end
end
def test_StreamBuf_s_new
# NotImplementedError should be raised from StreamBuf#read.
assert_raises(NotImplementedError) do
CSV::StreamBuf.new
end
end
def test_IOBuf_close
f = File.open(@outfile, "wb")
f << "tst"
f.close
f = File.open(@outfile, "rb")
iobuf = CSV::IOBuf.new(f)
iobuf.close
assert(true) # iobuf.close does not raise any exception.
f.close
end
def test_IOBuf_s_new
iobuf = CSV::IOBuf.new(Tempfile.new("in.csv"))
assert_instance_of(CSV::IOBuf, iobuf)
end
#### CSV functional test
# sample data
#
# 1 2 3 4 5 6 7 8
# +------+-------+---------+-------+--------+------+----+------+
# | foo | "foo" | foo,bar | "" |(empty) |(null)| \r | \r\n |
# +------+-------+---------+-------+--------+------+----+------+
# | NaHi | "Na" | Na,Hi | \r.\n | \r\n\n | " | \n | \r\n |
# +------+-------+---------+-------+--------+------+----+------+
#
def test_s_parseAndCreate
colSize = 8
csvStr = "foo,!!!foo!!!,!foo,bar!,!!!!!!,!!,,!\r!,!\r\n!\r\nNaHi,!!!Na!!!,!Na,Hi!,!\r.\n!,!\r\n\n!,!!!!,!\n!,!\r\n!".gsub!('!', '"')
csvStrTerminated = csvStr + "\r\n"
myStr = csvStr.dup
res1 = []; res2 = []
idx = 0
col, idx = CSV::parse_row(myStr, 0, res1)
col, idx = CSV::parse_row(myStr, idx, res2)
buf = ''
col = CSV::generate_row(res1, colSize, buf)
col = CSV::generate_row(res2, colSize, buf)
assert_equal(csvStrTerminated, buf)
parsed = []
CSV::Reader.parse(csvStrTerminated) do |row|
parsed << row
end
buf = ''
CSV::Writer.generate(buf) do |writer|
parsed.each do |row|
writer.add_row(row)
end
end
assert_equal(csvStrTerminated, buf)
buf = ''
CSV::Writer.generate(buf) do |writer|
parsed.each do |row|
writer << row.collect { |e| e.is_null ? nil : e.data }
end
end
assert_equal(csvStrTerminated, buf)
end
end