require 'test/unit/testsuite' require 'test/unit/testcase' require 'tempfile' require 'fileutils' require 'csv' class CSV class StreamBuf # Let buffer work hard. remove_const("BufSize") BufSize = 2 end end module CSVTestSupport def d(data, is_null = false) CSV::Cell.new(data.to_s, is_null) end end class TestCSVCell < Test::Unit::TestCase @@colData = ['', nil, true, false, 'foo', '!' * 1000] def test_Cell_EQUAL # '==' d1 = CSV::Cell.new('d', false) d2 = CSV::Cell.new('d', false) d3 = CSV::Cell.new('d', true) d4 = CSV::Cell.new('d', true) assert(d1 == d2, "Normal case.") assert(d1 != d3, "RHS is null.") assert(d4 != d1, "LHS is null.") assert(d3 != d4, "Either is null.") end def test_Cell_match d1 = CSV::Cell.new('d', false) d2 = CSV::Cell.new('d', false) d3 = CSV::Cell.new('d', true) d4 = CSV::Cell.new('d', true) assert(d1.match(d2), "Normal case.") assert(!d1.match(d3), "RHS is null.") assert(!d4.match(d1), "LHS is null.") assert(d3.match(d4), "Either is null.") end def test_Cell_data d = CSV::Cell.new() @@colData.each do |v| d.data = v assert_equal(d.data, v, "Case: #{ v }.") end end def test_Cell_data= d = CSV::Cell.new() @@colData.each do |v| d.data = v assert_equal(d.data, v, "Case: #{ v }.") end end def test_Cell_is_null d = CSV::Cell.new() d.is_null = true assert_equal(d.is_null, true, "Case: true.") d.is_null = false assert_equal(d.is_null, false, "Case: false.") end def test_Cell_is_null= d = CSV::Cell.new() d.is_null = true assert_equal(d.is_null, true, "Case: true.") d.is_null = false assert_equal(d.is_null, false, "Case: false.") end def test_Cell_s_new d1 = CSV::Cell.new() assert_equal(d1.data, '', "Default: data.") assert_equal(d1.is_null, true, "Default: is_null.") @@colData.each do |v| d = CSV::Cell.new(v) assert_equal(d.data, v, "Data: #{ v }.") end d2 = CSV::Cell.new(nil, true) assert_equal(d2.is_null, true, "Data: true.") d3 = CSV::Cell.new(nil, false) assert_equal(d3.is_null, false, "Data: false.") end end class TestCSVRow < Test::Unit::TestCase include CSVTestSupport def test_Row_s_match c1 = CSV::Row[d(1), d(2), d(3)] c2 = CSV::Row[d(1, false), d(2, false), d(3, false)] assert(c1.match(c2), "Normal case.") c1 = CSV::Row[d(1), d('foo', true), d(3)] c2 = CSV::Row[d(1, false), d('bar', true), d(3, false)] assert(c1.match(c2), "Either is null.") c1 = CSV::Row[d(1), d('foo', true), d(3)] c2 = CSV::Row[d(1, false), d('bar', false), d(3, false)] assert(!c1.match(c2), "LHS is null.") c1 = CSV::Row[d(1), d('foo'), d(3)] c2 = CSV::Row[d(1, false), d('bar', true), d(3, false)] assert(!c1.match(c2), "RHS is null.") c1 = CSV::Row[d(1), d('', true), d(3)] c2 = CSV::Row[d(1, false), d('', true), d(3, false)] assert(c1.match(c2), "Either is null(empty data).") c1 = CSV::Row[d(1), d('', true), d(3)] c2 = CSV::Row[d(1, false), d('', false), d(3, false)] assert(!c1.match(c2), "LHS is null(empty data).") c1 = CSV::Row[d(1), d(''), d(3)] c2 = CSV::Row[d(1, false), d('', true), d(3, false)] assert(!c1.match(c2), "RHS is null(empty data).") c1 = CSV::Row[] c2 = CSV::Row[] assert(c1.match(c2)) c1 = CSV::Row[] c2 = CSV::Row[d(1)] assert(!c1.match(c2)) end def test_Row_to_a r = CSV::Row[d(1), d(2), d(3)] assert_equal(['1', '2', '3'], r.to_a, 'Normal case') r = CSV::Row[d(1)] assert_equal(['1'], r.to_a, '1 item') r = CSV::Row[d(nil, true), d(2), d(3)] assert_equal([nil, '2', '3'], r.to_a, 'Null in data') r = CSV::Row[d(nil, true), d(nil, true), d(nil, true)] assert_equal([nil, nil, nil], r.to_a, 'Nulls') r = CSV::Row[d(nil, true)] assert_equal([nil], r.to_a, '1 Null') r = CSV::Row[] assert_equal([], r.to_a, 'Empty') end end class TestCSV < Test::Unit::TestCase include CSVTestSupport class << self include CSVTestSupport end @@simpleCSVData = { [nil] => '', [''] => '""', [nil, nil] => ',', [nil, nil, nil] => ',,', ['foo'] => 'foo', [','] => '","', [',', ','] => '",",","', [';'] => ';', [';', ';'] => ';,;', ["\"\r", "\"\r"] => "\"\"\"\r\",\"\"\"\r\"", ["\"\n", "\"\n"] => "\"\"\"\n\",\"\"\"\n\"", ["\t"] => "\t", ["\t", "\t"] => "\t,\t", ['foo', 'bar'] => 'foo,bar', ['foo', '"bar"', 'baz'] => 'foo,"""bar""",baz', ['foo', 'foo,bar', 'baz'] => 'foo,"foo,bar",baz', ['foo', '""', 'baz'] => 'foo,"""""",baz', ['foo', '', 'baz'] => 'foo,"",baz', ['foo', nil, 'baz'] => 'foo,,baz', [nil, 'foo', 'bar'] => ',foo,bar', ['foo', 'bar', nil] => 'foo,bar,', ['foo', "\r", 'baz'] => "foo,\"\r\",baz", ['foo', "\n", 'baz'] => "foo,\"\n\",baz", ['foo', "\r\n\r", 'baz'] => "foo,\"\r\n\r\",baz", ['foo', "\r\n", 'baz'] => "foo,\"\r\n\",baz", ['foo', "\r.\n", 'baz'] => "foo,\"\r.\n\",baz", ['foo', "\r\n\n", 'baz'] => "foo,\"\r\n\n\",baz", ['foo', '"', 'baz'] => 'foo,"""",baz', } @@fullCSVData = { [d('', true)] => '', [d('')] => '""', [d('', true), d('', true)] => ',', [d('', true), d('', true), d('', true)] => ',,', [d('foo')] => 'foo', [d('foo'), d('bar')] => 'foo,bar', [d('foo'), d('"bar"'), d('baz')] => 'foo,"""bar""",baz', [d('foo'), d('foo,bar'), d('baz')] => 'foo,"foo,bar",baz', [d('foo'), d('""'), d('baz')] => 'foo,"""""",baz', [d('foo'), d(''), d('baz')] => 'foo,"",baz', [d('foo'), d('', true), d('baz')] => 'foo,,baz', [d('foo'), d("\r"), d('baz')] => "foo,\"\r\",baz", [d('foo'), d("\n"), d('baz')] => "foo,\"\n\",baz", [d('foo'), d("\r\n"), d('baz')] => "foo,\"\r\n\",baz", [d('foo'), d("\r.\n"), d('baz')] => "foo,\"\r.\n\",baz", [d('foo'), d("\r\n\n"), d('baz')] => "foo,\"\r\n\n\",baz", [d('foo'), d('"'), d('baz')] => 'foo,"""",baz', } @@fullCSVDataArray = @@fullCSVData.collect { |key, value| key } def ssv2csv(ssvStr, row_sep = nil) sepConv(ssvStr, ?;, ?,, row_sep) end def csv2ssv(csvStr, row_sep = nil) sepConv(csvStr, ?,, ?;, row_sep) end def tsv2csv(tsvStr, row_sep = nil) sepConv(tsvStr, ?\t, ?,, row_sep) end def csv2tsv(csvStr, row_sep = nil) sepConv(csvStr, ?,, ?\t, row_sep) end def sepConv(srcStr, srcSep, destSep, row_sep = nil) rows = CSV::Row.new cols, idx = CSV.parse_row(srcStr, 0, rows, srcSep, row_sep) destStr = '' cols = CSV.generate_row(rows, rows.size, destStr, destSep, row_sep) destStr end public def setup @tmpdir = File.join(Dir.tmpdir, "ruby_test_csv_tmp_#{$$}") Dir.mkdir(@tmpdir) @infile = File.join(@tmpdir, 'in.csv') @infiletsv = File.join(@tmpdir, 'in.tsv') @emptyfile = File.join(@tmpdir, 'empty.csv') @outfile = File.join(@tmpdir, 'out.csv') @bomfile = File.join(File.dirname(__FILE__), "bom.csv") @macfile = File.join(File.dirname(__FILE__), "mac.csv") CSV.open(@infile, "w") do |writer| @@fullCSVDataArray.each do |row| writer.add_row(row) end end CSV.open(@infiletsv, "w", ?\t) do |writer| @@fullCSVDataArray.each do |row| writer.add_row(row) end end CSV.generate(@emptyfile) do |writer| # Create empty file. end end def teardown FileUtils.rm_rf(@tmpdir) end #### CSV::Reader unit test def test_Reader_each file = File.open(@infile, "rb") begin reader = CSV::Reader.create(file) expectedArray = @@fullCSVDataArray.dup first = true ret = reader.each { |row| if first assert_instance_of(CSV::Row, row) first = false end expected = expectedArray.shift assert(row.match(expected)) } assert_nil(ret, "Return is nil") assert(expectedArray.empty?) ensure file.close end # Illegal format. reader = CSV::Reader.create("a,b\r\na,b,\"c\"\ra") assert_raises(CSV::IllegalFormatError) do reader.each do |row| end end reader = CSV::Reader.create("a,b\r\n\"") assert_raises(CSV::IllegalFormatError) do reader.each do |row| end end end def test_Reader_shift file = File.open(@infile, "rb") begin reader = CSV::Reader.create(file) first = true checked = 0 @@fullCSVDataArray.each do |expected| actual = reader.shift if first assert_instance_of(CSV::Row, actual) first = false end assert(actual.match(expected)) checked += 1 end assert(checked == @@fullCSVDataArray.size) ensure file.close end # Illegal format. reader = CSV::Reader.create("a,b\r\na,b,\"c\"\ra") assert_raises(CSV::IllegalFormatError) do reader.shift reader.shift end reader = CSV::Reader.create("a,b\r\na,b,\"c\"\ra") assert_raises(CSV::IllegalFormatError) do reader.shift reader.shift end end def test_Reader_getRow if CSV::Reader.respond_to?(:allocate) obj = CSV::Reader.allocate assert_raises(NotImplementedError) do row = [] obj.shift end end end def test_IOReader_close_on_terminate f = File.open(@infile, "r") reader = CSV::IOReader.create(f) reader.close assert(!f.closed?) f.close f = File.open(@infile, "r") writer = CSV::IOReader.create(f) writer.close_on_terminate writer.close assert(f.closed?) end def test_Reader_close f = File.open(@infile, "r") reader = CSV::IOReader.create(f) reader.close_on_terminate reader.close assert(f.closed?) end def test_Reader_s_new assert_raises(RuntimeError) do CSV::Reader.new(nil) end end def test_Reader_s_create reader = CSV::Reader.create("abc") assert_instance_of(CSV::StringReader, reader, "With a String") file = File.open(@infile, "rb") reader = CSV::Reader.create(file) assert_instance_of(CSV::IOReader, reader, 'With an IO') obj = Object.new def obj.sysread(size) "abc" end def obj.read(size) "abc" end reader = CSV::Reader.create(obj) assert_instance_of(CSV::IOReader, reader, "With not an IO or String") # No need to test Tempfile because it's a pseudo IO. I test this here # fors other tests. reader = CSV::Reader.create(Tempfile.new("in.csv")) assert_instance_of(CSV::IOReader, reader, "With an pseudo IO.") file.close end def test_Reader_s_parse ret = CSV::Reader.parse("a,b,c") { |row| assert_instance_of(CSV::Row, row, "Block parameter") } assert_nil(ret, "Return is nil") ret = CSV::Reader.parse("a;b;c", ?;) { |row| assert_instance_of(CSV::Row, row, "Block parameter") } file = Tempfile.new("in.csv") file << "a,b,c" file.open ret = CSV::Reader.parse(file) { |row| assert_instance_of(CSV::Row, row, "Block parameter") } assert_nil(ret, "Return is nil") file = Tempfile.new("in.csv") file << "a,b,c" file.open ret = CSV::Reader.parse(file, ?,) { |row| assert_instance_of(CSV::Row, row, "Block parameter") } # Illegal format. assert_raises(CSV::IllegalFormatError) do CSV::Reader.parse("a,b\r\na,b,\"c\"\ra") do |row| end end assert_raises(CSV::IllegalFormatError) do CSV::Reader.parse("a,b\r\na,b\"") do |row| end end end #### CSV::Writer unit test def test_Writer_s_new assert_raises(RuntimeError) do CSV::Writer.new(nil) end end def test_Writer_s_generate ret = CSV::Writer.generate(STDOUT) { |writer| assert_instance_of(CSV::BasicWriter, writer, "Block parameter") } ret = CSV::Writer.generate(STDOUT, ?;) { |writer| assert_instance_of(CSV::BasicWriter, writer, "Block parameter") } assert_nil(ret, "Return is nil") end def test_Writer_s_create writer = CSV::Writer.create(STDERR) assert_instance_of(CSV::BasicWriter, writer, "String") writer = CSV::Writer.create(STDERR, ?;) assert_instance_of(CSV::BasicWriter, writer, "String") writer = CSV::Writer.create(Tempfile.new("out.csv")) assert_instance_of(CSV::BasicWriter, writer, "IO") end def test_Writer_LSHIFT # '<<' file = Tempfile.new("out.csv") CSV::Writer.generate(file) do |writer| ret = writer << ['a', 'b', 'c'] assert_instance_of(CSV::BasicWriter, ret, 'Return is self') writer << [nil, 'e', 'f'] << [nil, nil, ''] end str = file.open.read assert_equal("a,b,c\r\n,e,f\r\n,,\"\"\r\n", str, 'Normal') file = Tempfile.new("out2.csv") CSV::Writer.generate(file) do |writer| ret = writer << [d('a'), d('b'), d('c')] assert_instance_of(CSV::BasicWriter, ret, 'Return is self') writer << [d(nil, true), d('e'), d('f')] << [d(nil, true), d(nil, true), d('')] end str = file.open.read assert_equal("a,b,c\r\n,e,f\r\n,,\"\"\r\n", str, 'Normal') end def test_Writer_add_row file = Tempfile.new("out.csv") CSV::Writer.generate(file) do |writer| ret = writer.add_row( [d('a', false), d('b', false), d('c', false)]) assert_instance_of(CSV::BasicWriter, ret, 'Return is self') writer.add_row( [d('dummy', true), d('e', false), d('f', false)] ).add_row( [d('a', true), d('b', true), d('', false)] ) end str = file.open.read assert_equal("a,b,c\r\n,e,f\r\n,,\"\"\r\n", str, 'Normal') end def test_Writer_close f = File.open(@outfile, "w") writer = CSV::BasicWriter.create(f) writer.close_on_terminate writer.close assert(f.closed?) end def test_BasicWriter_close_on_terminate f = File.open(@outfile, "w") writer = CSV::BasicWriter.create(f) writer.close assert(!f.closed?) f.close f = File.open(@outfile, "w") writer = CSV::BasicWriter.create(f) writer.close_on_terminate writer.close assert(f.closed?) end #### CSV unit test def test_s_open_reader assert_raises(ArgumentError, 'Illegal mode') do CSV.open("temp", "a") end assert_raises(ArgumentError, 'Illegal mode') do CSV.open("temp", "a", ?;) end reader = CSV.open(@infile, "r") assert_instance_of(CSV::IOReader, reader) reader.close reader = CSV.open(@infile, "rb") assert_instance_of(CSV::IOReader, reader) reader.close reader = CSV.open(@infile, "r", ?;) assert_instance_of(CSV::IOReader, reader) reader.close CSV.open(@infile, "r") do |row| assert_instance_of(CSV::Row, row) break end CSV.open(@infiletsv, "r", ?\t) do |row| assert_instance_of(CSV::Row, row) break end assert_raises(Errno::ENOENT) do CSV.open("NoSuchFileOrDirectory", "r") end assert_raises(Errno::ENOENT) do CSV.open("NoSuchFileOrDirectory", "r", ?;) end # Illegal format. File.open(@outfile, "w") do |f| f << "a,b\r\na,b,\"c\"\ra" end assert_raises(CSV::IllegalFormatError) do CSV.open(@outfile, "r") do |row| end end File.open(@outfile, "w") do |f| f << "a,b\r\na,b\"" end assert_raises(CSV::IllegalFormatError) do CSV.open(@outfile, "r") do |row| end end CSV.open(@emptyfile, "r") do |row| assert_fail("Must not reach here") end end def test_s_parse reader = CSV.parse(@infile) assert_instance_of(CSV::IOReader, reader) reader.close reader = CSV.parse(@infile) assert_instance_of(CSV::IOReader, reader) reader.close reader = CSV.parse(@infile, ?;) assert_instance_of(CSV::IOReader, reader) reader.close CSV.parse(@infile) do |row| assert_instance_of(CSV::Row, row) break end CSV.parse(@infiletsv, ?\t) do |row| assert_instance_of(CSV::Row, row) break end assert_raises(Errno::ENOENT) do CSV.parse("NoSuchFileOrDirectory") end assert_raises(Errno::ENOENT) do CSV.parse("NoSuchFileOrDirectory", ?;) end CSV.parse(@emptyfile) do |row| assert_fail("Must not reach here") end end def test_s_open_writer writer = CSV.open(@outfile, "w") assert_instance_of(CSV::BasicWriter, writer) writer.close writer = CSV.open(@outfile, "wb") assert_instance_of(CSV::BasicWriter, writer) writer.close writer = CSV.open(@outfile, "wb", ?;) assert_instance_of(CSV::BasicWriter, writer) writer.close CSV.open(@outfile, "w") do |writer| assert_instance_of(CSV::BasicWriter, writer) end CSV.open(@outfile, "w", ?;) do |writer| assert_instance_of(CSV::BasicWriter, writer) end begin CSV.open(@tmpdir, "w") assert(false) rescue Exception => ex assert(ex.is_a?(Errno::EEXIST) || ex.is_a?(Errno::EISDIR) || ex.is_a?(Errno::EACCES)) end end def test_s_generate writer = CSV.generate(@outfile) assert_instance_of(CSV::BasicWriter, writer) writer.close writer = CSV.generate(@outfile, ?;) assert_instance_of(CSV::BasicWriter, writer) writer.close CSV.generate(@outfile) do |writer| assert_instance_of(CSV::BasicWriter, writer) end CSV.generate(@outfile, ?;) do |writer| assert_instance_of(CSV::BasicWriter, writer) end begin CSV.generate(@tmpdir) assert(false) rescue Exception => ex assert(ex.is_a?(Errno::EEXIST) || ex.is_a?(Errno::EISDIR) || ex.is_a?(Errno::EACCES)) end end def test_s_generate_line str = CSV.generate_line([]) assert_equal('', str, "Extra boundary check.") str = CSV.generate_line([], ?;) assert_equal('', str, "Extra boundary check.") @@simpleCSVData.each do |col, str| buf = CSV.generate_line(col) assert_equal(str, buf) end @@simpleCSVData.each do |col, str| buf = CSV.generate_line(col, ?;) assert_equal(str + "\r\n", ssv2csv(buf)) end @@simpleCSVData.each do |col, str| buf = CSV.generate_line(col, ?\t) assert_equal(str + "\r\n", tsv2csv(buf)) end end def test_s_generate_row buf = '' cols = CSV.generate_row([], 0, buf) assert_equal(0, cols) assert_equal("\r\n", buf, "Extra boundary check.") buf = '' cols = CSV.generate_row([], 0, buf, ?;) assert_equal(0, cols) assert_equal("\r\n", buf, "Extra boundary check.") buf = '' cols = CSV.generate_row([], 0, buf, ?\t) assert_equal(0, cols) assert_equal("\r\n", buf, "Extra boundary check.") buf = '' cols = CSV.generate_row([], 0, buf, ?\t, ?|) assert_equal(0, cols) assert_equal("|", buf, "Extra boundary check.") buf = '' cols = CSV.generate_row([d(1)], 2, buf) assert_equal('1,', buf) buf = '' cols = CSV.generate_row([d(1)], 2, buf, ?;) assert_equal('1;', buf) buf = '' cols = CSV.generate_row([d(1)], 2, buf, ?\t) assert_equal("1\t", buf) buf = '' cols = CSV.generate_row([d(1)], 2, buf, ?\t, ?|) assert_equal("1\t", buf) buf = '' cols = CSV.generate_row([d(1), d(2)], 1, buf) assert_equal("1\r\n", buf) buf = '' cols = CSV.generate_row([d(1), d(2)], 1, buf, ?;) assert_equal("1\r\n", buf) buf = '' cols = CSV.generate_row([d(1), d(2)], 1, buf, ?\t) assert_equal("1\r\n", buf) buf = '' cols = CSV.generate_row([d(1), d(2)], 1, buf, ?\t, ?\n) assert_equal("1\n", buf) buf = '' cols = CSV.generate_row([d(1), d(2)], 1, buf, ?\t, ?\r) assert_equal("1\r", buf) buf = '' cols = CSV.generate_row([d(1), d(2)], 1, buf, ?\t, ?|) assert_equal("1|", buf) @@fullCSVData.each do |col, str| buf = '' cols = CSV.generate_row(col, col.size, buf) assert_equal(col.size, cols) assert_equal(str + "\r\n", buf) end @@fullCSVData.each do |col, str| buf = '' cols = CSV.generate_row(col, col.size, buf, ?;) assert_equal(col.size, cols) assert_equal(str + "\r\n", ssv2csv(buf)) end @@fullCSVData.each do |col, str| buf = '' cols = CSV.generate_row(col, col.size, buf, ?\t) assert_equal(col.size, cols) assert_equal(str + "\r\n", tsv2csv(buf)) end # row separator @@fullCSVData.each do |col, str| buf = '' cols = CSV.generate_row(col, col.size, buf, ?,, ?|) assert_equal(col.size, cols) assert_equal(str + "|", buf) end # col and row separator @@fullCSVData.each do |col, str| buf = '' cols = CSV.generate_row(col, col.size, buf, ?\t, ?|) assert_equal(col.size, cols) assert_equal(str + "|", tsv2csv(buf, ?|)) end buf = '' toBe = '' cols = 0 colsToBe = 0 @@fullCSVData.each do |col, str| cols += CSV.generate_row(col, col.size, buf) toBe << str << "\r\n" colsToBe += col.size end assert_equal(colsToBe, cols) assert_equal(toBe, buf) buf = '' toBe = '' cols = 0 colsToBe = 0 @@fullCSVData.each do |col, str| lineBuf = '' cols += CSV.generate_row(col, col.size, lineBuf, ?;) buf << ssv2csv(lineBuf) << "\r\n" toBe << ssv2csv(lineBuf) << "\r\n" colsToBe += col.size end assert_equal(colsToBe, cols) assert_equal(toBe, buf) buf = '' toBe = '' cols = 0 colsToBe = 0 @@fullCSVData.each do |col, str| lineBuf = '' cols += CSV.generate_row(col, col.size, lineBuf, ?\t) buf << tsv2csv(lineBuf) << "\r\n" toBe << tsv2csv(lineBuf) << "\r\n" colsToBe += col.size end assert_equal(colsToBe, cols) assert_equal(toBe, buf) buf = '' toBe = '' cols = 0 colsToBe = 0 @@fullCSVData.each do |col, str| lineBuf = '' cols += CSV.generate_row(col, col.size, lineBuf, ?|) buf << tsv2csv(lineBuf, ?|) toBe << tsv2csv(lineBuf, ?|) colsToBe += col.size end assert_equal(colsToBe, cols) assert_equal(toBe, buf) end def test_s_parse_line @@simpleCSVData.each do |col, str| row = CSV.parse_line(str) assert_instance_of(CSV::Row, row) assert_equal(col.size, row.size) assert_equal(col, row) end @@simpleCSVData.each do |col, str| str = csv2ssv(str) row = CSV.parse_line(str, ?;) assert_instance_of(CSV::Row, row) assert_equal(col.size, row.size) assert_equal(col, row) end @@simpleCSVData.each do |col, str| str = csv2tsv(str) row = CSV.parse_line(str, ?\t) assert_instance_of(CSV::Row, row) assert_equal(col.size, row.size) assert_equal(col, row) end # Illegal format. buf = CSV::Row.new row = CSV.parse_line("a,b,\"c\"\ra") assert_instance_of(CSV::Row, row) assert_equal(0, row.size) buf = CSV::Row.new row = CSV.parse_line("a;b;\"c\"\ra", ?;) assert_instance_of(CSV::Row, row) assert_equal(0, row.size) buf = CSV::Row.new row = CSV.parse_line("a\tb\t\"c\"\ra", ?\t) assert_instance_of(CSV::Row, row) assert_equal(0, row.size) row = CSV.parse_line("a,b\"") assert_instance_of(CSV::Row, row) assert_equal(0, row.size) row = CSV.parse_line("a;b\"", ?;) assert_instance_of(CSV::Row, row) assert_equal(0, row.size) row = CSV.parse_line("a\tb\"", ?\t) assert_instance_of(CSV::Row, row) assert_equal(0, row.size) row = CSV.parse_line("\"a,b\"\r,") assert_instance_of(CSV::Row, row) assert_equal(0, row.size) row = CSV.parse_line("\"a;b\"\r;", ?;) assert_instance_of(CSV::Row, row) assert_equal(0, row.size) row = CSV.parse_line("\"a\tb\"\r\t", ?\t) assert_instance_of(CSV::Row, row) assert_equal(0, row.size) row = CSV.parse_line("\"a,b\"\r\"") assert_instance_of(CSV::Row, row) assert_equal(0, row.size) row = CSV.parse_line("\"a;b\"\r\"", ?;) assert_instance_of(CSV::Row, row) assert_equal(0, row.size) row = CSV.parse_line("\"a\tb\"\r\"", ?\t) assert_instance_of(CSV::Row, row) assert_equal(0, row.size) end def test_s_parse_row @@fullCSVData.each do |col, str| buf = CSV::Row.new cols, idx = CSV.parse_row(str + "\r\n", 0, buf) assert_equal(cols, buf.size, "Reported size.") assert_equal(col.size, buf.size, "Size.") assert(buf.match(col)) buf = CSV::Row.new cols, idx = CSV.parse_row(str + "\n", 0, buf) assert_equal(cols, buf.size, "Reported size.") assert_equal(col.size, buf.size, "Size.") assert(buf.match(col)) # separator: | buf = CSV::Row.new cols, idx = CSV.parse_row(str + "|", 0, buf, ?,) assert(!buf.match(col)) buf = CSV::Row.new cols, idx = CSV.parse_row(str + "|", 0, buf, ?,, ?|) assert_equal(cols, buf.size, "Reported size.") assert_equal(col.size, buf.size, "Size.") assert(buf.match(col)) end @@fullCSVData.each do |col, str| str = csv2ssv(str) buf = CSV::Row.new cols, idx = CSV.parse_row(str + "\r\n", 0, buf, ?;) assert_equal(cols, buf.size, "Reported size.") assert_equal(col.size, buf.size, "Size.") assert(buf.match(col)) end @@fullCSVData.each do |col, str| str = csv2tsv(str) buf = CSV::Row.new cols, idx = CSV.parse_row(str + "\r\n", 0, buf, ?\t) assert_equal(cols, buf.size, "Reported size.") assert_equal(col.size, buf.size, "Size.") assert(buf.match(col)) end @@fullCSVData.each do |col, str| str = csv2tsv(str, ?|) buf = CSV::Row.new cols, idx = CSV.parse_row(str + "|", 0, buf, ?\t, ?|) assert_equal(cols, buf.size, "Reported size.") assert_equal(col.size, buf.size, "Size.") assert(buf.match(col), str) end buf = CSV::Row.new cols, idx = CSV.parse_row("a,b,\"c\r\"", 0, buf) assert_equal(["a", "b", "c\r"], buf.to_a) buf = CSV::Row.new cols, idx = CSV.parse_row("a;b;\"c\r\"", 0, buf, ?;) assert_equal(["a", "b", "c\r"], buf.to_a) buf = CSV::Row.new cols, idx = CSV.parse_row("a\tb\t\"c\r\"", 0, buf, ?\t) assert_equal(["a", "b", "c\r"], buf.to_a) buf = CSV::Row.new cols, idx = CSV.parse_row("a,b,c\n", 0, buf) assert_equal(["a", "b", "c"], buf.to_a) buf = CSV::Row.new cols, idx = CSV.parse_row("a\tb\tc\n", 0, buf, ?\t) assert_equal(["a", "b", "c"], buf.to_a) # Illegal format. buf = CSV::Row.new cols, idx = CSV.parse_row("a,b,c\"", 0, buf) assert_equal(0, cols, "Illegal format; unbalanced double-quote.") buf = CSV::Row.new cols, idx = CSV.parse_row("a;b;c\"", 0, buf, ?;) assert_equal(0, cols, "Illegal format; unbalanced double-quote.") buf = CSV::Row.new cols, idx = CSV.parse_row("a,b,\"c\"\ra", 0, buf) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("a,b,\"c\"\ra", 0, buf, ?;) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("a,b\"", 0, buf) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("a;b\"", 0, buf, ?;) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("\"a,b\"\r,", 0, buf) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("a\r,", 0, buf) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("a\r", 0, buf) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("a\rbc", 0, buf) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("a\r\"\"", 0, buf) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("a\r\rabc,", 0, buf) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("\"a;b\"\r;", 0, buf, ?;) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("\"a,b\"\r\"", 0, buf) assert_equal(0, cols) assert_equal(0, idx) buf = CSV::Row.new cols, idx = CSV.parse_row("\"a;b\"\r\"", 0, buf, ?;) assert_equal(0, cols) assert_equal(0, idx) end def test_s_parse_rowEOF @@fullCSVData.each do |col, str| if str == '' # String "" is not allowed. next end buf = CSV::Row.new cols, idx = CSV.parse_row(str, 0, buf) assert_equal(col.size, cols, "Reported size.") assert_equal(col.size, buf.size, "Size.") assert(buf.match(col)) end end def test_s_parse_rowConcat buf = '' toBe = [] @@fullCSVData.each do |col, str| buf << str << "\r\n" toBe.concat(col) end idx = 0 cols = 0 parsed = CSV::Row.new parsedCols = 0 begin cols, idx = CSV.parse_row(buf, idx, parsed) parsedCols += cols end while cols > 0 assert_equal(toBe.size, parsedCols) assert_equal(toBe.size, parsed.size) assert(parsed.match(toBe)) buf = '' toBe = [] @@fullCSVData.each do |col, str| buf << str << "\n" toBe.concat(col) end idx = 0 cols = 0 parsed = CSV::Row.new parsedCols = 0 begin cols, idx = CSV.parse_row(buf, idx, parsed) parsedCols += cols end while cols > 0 assert_equal(toBe.size, parsedCols) assert_equal(toBe.size, parsed.size) assert(parsed.match(toBe)) buf = '' toBe = [] @@fullCSVData.sort { |a, b| a[0].length <=> b[0].length }.each do |col, str| buf << str << "\n" toBe.concat(col) end idx = 0 cols = 0 parsed = CSV::Row.new parsedCols = 0 begin cols, idx = CSV.parse_row(buf, idx, parsed) parsedCols += cols end while cols > 0 assert_equal(toBe.size, parsedCols) assert_equal(toBe.size, parsed.size) assert(parsed.match(toBe)) buf = '' toBe = [] @@fullCSVData.each do |col, str| buf << str << "|" toBe.concat(col) end idx = 0 cols = 0 parsed = CSV::Row.new parsedCols = 0 begin cols, idx = CSV.parse_row(buf, idx, parsed, ?,, ?|) parsedCols += cols end while cols > 0 assert_equal(toBe.size, parsedCols) assert_equal(toBe.size, parsed.size) assert(parsed.match(toBe)) end def test_utf8 rows = [] CSV.open(@bomfile, "r") do |row| rows << row.to_a end assert_equal([["foo"], ["bar"]], rows) rows = [] file = File.open(@bomfile) CSV::Reader.parse(file.read) do |row| rows << row.to_a end assert_equal([["foo"], ["bar"]], rows) file.close end def test_macCR rows = [] CSV.open(@macfile, "r", ?,, ?\r) do |row| rows << row.to_a end assert_equal([["Avenches", "aus Umgebung"], ["Bad Hersfeld", "Ausgrabung"]], rows) rows = [] assert_raises(CSV::IllegalFormatError) do CSV.open(@macfile, "r") do |row| rows << row.to_a end end rows = [] file = File.open(@macfile) CSV::Reader.parse(file.read, ?,, ?\r) do |row| rows << row.to_a end assert_equal([["Avenches", "aus Umgebung"], ["Bad Hersfeld", "Ausgrabung"]], rows) file.close rows = [] file = File.open(@macfile) assert_raises(CSV::IllegalFormatError) do CSV::Reader.parse(file.read, ?,) do |row| rows << row.to_a end end file.close end #### CSV unit test InputStreamPattern = '0123456789' InputStreamPatternSize = InputStreamPattern.size def expChar(idx) InputStreamPattern[idx % InputStreamPatternSize] end def expStr(idx, n) if n > InputStreamPatternSize InputStreamPattern + expStr(0, n - InputStreamPatternSize) else InputStreamPattern[idx % InputStreamPatternSize, n] end end def setupInputStream(size, bufSize = nil) setBufSize(bufSize) if bufSize m = ((size / InputStreamPatternSize) + 1).to_i File.open(@outfile, "wb") do |f| f << (InputStreamPattern * m)[0, size] end file = File.open(@outfile, "rb") buf = CSV::IOBuf.new(file) if block_given? yield(buf) file.close nil else buf end end def setBufSize(size) CSV::StreamBuf.module_eval('remove_const("BufSize")') CSV::StreamBuf.module_eval("BufSize = #{ size }") end class StrBuf < CSV::StreamBuf private def initialize(string) @str = string @idx = 0 super() end def read(size) str = @str[@idx, size] if str.empty? nil else @idx += str.size str end end end class ErrBuf < CSV::StreamBuf class Error < RuntimeError; end private def initialize @first = true super() end def read(size) if @first @first = false "a" * size else raise ErrBuf::Error.new end end end def test_StreamBuf_MyBuf # At first, check ruby's behaviour. s = "abc" assert_equal(?a, s[0]) assert_equal(?b, s[1]) assert_equal(?c, s[2]) assert_equal(nil, s[3]) assert_equal("a", s[0, 1]) assert_equal("b", s[1, 1]) assert_equal("c", s[2, 1]) assert_equal("", s[3, 1]) assert_equal(nil, s[4, 1]) s = StrBuf.new("abc") assert_equal(?a, s[0]) assert_equal(?b, s.get(1)) assert_equal(?c, s[2]) assert_equal(nil, s.get(3)) assert_equal("a", s[0, 1]) assert_equal("b", s.get(1, 1)) assert_equal("c", s[2, 1]) assert_equal("", s.get(3, 1)) assert_equal(nil, s[4, 1]) dropped = s.drop(1) assert_equal(1, dropped) assert_equal(?b, s[0]) assert(!s.is_eos?) dropped = s.drop(1) assert_equal(1, dropped) assert_equal(?c, s[0]) assert(!s.is_eos?) dropped = s.drop(1) assert_equal(1, dropped) assert_equal(nil, s[0]) assert(s.is_eos?) dropped = s.drop(1) assert_equal(0, dropped) assert_equal(nil, s[0]) assert(s.is_eos?) s = StrBuf.new("") assert_equal(nil, s[0]) s = StrBuf.new("") dropped = s.drop(1) assert_equal(0, dropped) assert_raises(TestCSV::ErrBuf::Error) do s = ErrBuf.new s[1024] end assert_raises(TestCSV::ErrBuf::Error) do s = ErrBuf.new s.drop(1024) end end def test_StreamBuf_AREF # '[idx]' setupInputStream(22, 1024) do |s| [0, 1, 9, 10, 19, 20, 21].each do |idx| assert_equal(expChar(idx), s[idx], idx.to_s) end [22, 23].each do |idx| assert_equal(nil, s[idx], idx.to_s) end assert_equal(nil, s[-1]) end setupInputStream(22, 1) do |s| [0, 1, 9, 10, 19, 20, 21].each do |idx| assert_equal(expChar(idx), s[idx], idx.to_s) end [22, 23].each do |idx| assert_equal(nil, s[idx], idx.to_s) end end setupInputStream(1024, 1) do |s| [1023, 0].each do |idx| assert_equal(expChar(idx), s[idx], idx.to_s) end [1024, 1025].each do |idx| assert_equal(nil, s[idx], idx.to_s) end end setupInputStream(1, 1) do |s| [0].each do |idx| assert_equal(expChar(idx), s[idx], idx.to_s) end [1, 2].each do |idx| assert_equal(nil, s[idx], idx.to_s) end end end def test_StreamBuf_AREF_n # '[idx, n]' # At first, check ruby's behaviour. assert_equal("", "abc"[3, 1]) assert_equal(nil, "abc"[4, 1]) setupInputStream(22, 1024) do |s| [0, 1, 9, 10, 19, 20, 21].each do |idx| assert_equal(expStr(idx, 1), s[idx, 1], idx.to_s) end assert_equal("", s[22, 1]) assert_equal(nil, s[23, 1]) end setupInputStream(22, 1) do |s| [0, 1, 9, 10, 19, 20, 21].each do |idx| assert_equal(expStr(idx, 1), s[idx, 1], idx.to_s) end assert_equal("", s[22, 1]) assert_equal(nil, s[23, 1]) end setupInputStream(1024, 1) do |s| [1023, 0].each do |idx| assert_equal(expStr(idx, 1), s[idx, 1], idx.to_s) end assert_equal("", s[1024, 1]) assert_equal(nil, s[1025, 1]) end setupInputStream(1, 1) do |s| [0].each do |idx| assert_equal(expStr(idx, 1), s[idx, 1], idx.to_s) end assert_equal("", s[1, 1]) assert_equal(nil, s[2, 1]) end setupInputStream(22, 11) do |s| [0, 1, 10, 11, 20].each do |idx| assert_equal(expStr(idx, 2), s[idx, 2], idx.to_s) end assert_equal(expStr(21, 1), s[21, 2]) assert_equal(expStr(0, 12), s[0, 12]) assert_equal(expStr(10, 12), s[10, 12]) assert_equal(expStr(10, 12), s[10, 13]) assert_equal(expStr(10, 12), s[10, 14]) assert_equal(expStr(10, 12), s[10, 1024]) assert_equal(nil, s[0, -1]) assert_equal(nil, s[21, -1]) assert_equal(nil, s[-1, 10]) assert_equal(nil, s[-1, -1]) end end def test_StreamBuf_get setupInputStream(22, 1024) do |s| [0, 1, 9, 10, 19, 20, 21].each do |idx| assert_equal(expChar(idx), s.get(idx), idx.to_s) end [22, 23].each do |idx| assert_equal(nil, s.get(idx), idx.to_s) end assert_equal(nil, s.get(-1)) end end def test_StreamBuf_get_n setupInputStream(22, 1024) do |s| [0, 1, 9, 10, 19, 20, 21].each do |idx| assert_equal(expStr(idx, 1), s.get(idx, 1), idx.to_s) end assert_equal("", s.get(22, 1)) assert_equal(nil, s.get(23, 1)) assert_equal(nil, s.get(-1, 1)) assert_equal(nil, s.get(-1, -1)) end end def test_StreamBuf_drop setupInputStream(22, 1024) do |s| assert_equal(expChar(0), s[0]) assert_equal(expChar(21), s[21]) assert_equal(nil, s[22]) dropped = s.drop(-1) assert_equal(0, dropped) assert_equal(expChar(0), s[0]) dropped = s.drop(0) assert_equal(0, dropped) assert_equal(expChar(0), s[0]) dropped = s.drop(1) assert_equal(1, dropped) assert_equal(expChar(1), s[0]) assert_equal(expChar(2), s[1]) dropped = s.drop(1) assert_equal(1, dropped) assert_equal(expChar(2), s[0]) assert_equal(expChar(3), s[1]) end setupInputStream(4, 2) do |s| dropped = s.drop(2) assert_equal(2, dropped) assert_equal(expChar(2), s[0]) assert_equal(expChar(3), s[1]) dropped = s.drop(1) assert_equal(1, dropped) assert_equal(expChar(3), s[0]) assert_equal(nil, s[1]) dropped = s.drop(1) assert_equal(1, dropped) assert_equal(nil, s[0]) assert_equal(nil, s[1]) dropped = s.drop(0) assert_equal(0, dropped) assert_equal(nil, s[0]) assert_equal(nil, s[1]) end setupInputStream(6, 3) do |s| dropped = s.drop(2) assert_equal(2, dropped) dropped = s.drop(2) assert_equal(2, dropped) assert_equal(expChar(4), s[0]) assert_equal(expChar(5), s[1]) dropped = s.drop(3) assert_equal(2, dropped) assert_equal(nil, s[0]) assert_equal(nil, s[1]) end end def test_StreamBuf_is_eos? setupInputStream(3, 1024) do |s| assert(!s.is_eos?) s.drop(1) assert(!s.is_eos?) s.drop(1) assert(!s.is_eos?) s.drop(1) assert(s.is_eos?) s.drop(1) assert(s.is_eos?) end setupInputStream(3, 2) do |s| assert(!s.is_eos?) s.drop(1) assert(!s.is_eos?) s.drop(1) assert(!s.is_eos?) s.drop(1) assert(s.is_eos?) s.drop(1) assert(s.is_eos?) end end def test_StreamBuf_s_new # NotImplementedError should be raised from StreamBuf#read. assert_raises(NotImplementedError) do CSV::StreamBuf.new end end def test_IOBuf_close f = File.open(@outfile, "wb") f << "tst" f.close f = File.open(@outfile, "rb") iobuf = CSV::IOBuf.new(f) iobuf.close assert(true) # iobuf.close does not raise any exception. f.close end def test_IOBuf_s_new iobuf = CSV::IOBuf.new(Tempfile.new("in.csv")) assert_instance_of(CSV::IOBuf, iobuf) end #### CSV functional test # sample data # # 1 2 3 4 5 6 7 8 # +------+-------+---------+-------+--------+------+----+------+ # | foo | "foo" | foo,bar | "" |(empty) |(null)| \r | \r\n | # +------+-------+---------+-------+--------+------+----+------+ # | NaHi | "Na" | Na,Hi | \r.\n | \r\n\n | " | \n | \r\n | # +------+-------+---------+-------+--------+------+----+------+ # def test_s_parseAndCreate colSize = 8 csvStr = "foo,!!!foo!!!,!foo,bar!,!!!!!!,!!,,!\r!,!\r\n!\r\nNaHi,!!!Na!!!,!Na,Hi!,!\r.\n!,!\r\n\n!,!!!!,!\n!,!\r\n!".gsub!('!', '"') csvStrTerminated = csvStr + "\r\n" myStr = csvStr.dup res1 = []; res2 = [] idx = 0 col, idx = CSV::parse_row(myStr, 0, res1) col, idx = CSV::parse_row(myStr, idx, res2) buf = '' col = CSV::generate_row(res1, colSize, buf) col = CSV::generate_row(res2, colSize, buf) assert_equal(csvStrTerminated, buf) parsed = [] CSV::Reader.parse(csvStrTerminated) do |row| parsed << row end buf = '' CSV::Writer.generate(buf) do |writer| parsed.each do |row| writer.add_row(row) end end assert_equal(csvStrTerminated, buf) buf = '' CSV::Writer.generate(buf) do |writer| parsed.each do |row| writer << row.collect { |e| e.is_null ? nil : e.data } end end assert_equal(csvStrTerminated, buf) end end if $0 == __FILE__ suite = Test::Unit::TestSuite.new('CSV') ObjectSpace.each_object(Class) do |klass| suite << klass.suite if (Test::Unit::TestCase > klass) end require 'test/unit/ui/console/testrunner' Test::Unit::UI::Console::TestRunner.run(suite).passed? end