Merge branch 'master' into 3453-arv-list-docker-images
[arvados.git] / sdk / ruby / test / test_keep_manifest.rb
1 require "minitest/autorun"
2 require "arvados/keep"
3
4 def random_block(size=nil)
5   sprintf("%032x+%d", rand(16 ** 32), size || rand(64 * 1024 * 1024))
6 end
7
8 class ManifestTest < Minitest::Test
9   SIMPLEST_MANIFEST = ". #{random_block(9)} 0:9:simple.txt\n"
10   MULTILEVEL_MANIFEST =
11     [". #{random_block(9)} 0:3:file1 3:3:file2 6:3:file3\n",
12      "./dir1 #{random_block(9)} 0:3:file1 3:3:file2 6:3:file3\n",
13      "./dir1/subdir #{random_block(9)} 0:3:file1 3:3:file2 6:3:file3\n",
14      "./dir2 #{random_block(9)} 0:3:file1 3:3:file2 6:3:file3\n"].join("")
15
16   def test_simple_each_stream_array
17     manifest = Keep::Manifest.new(SIMPLEST_MANIFEST)
18     stream_name, block_s, file = SIMPLEST_MANIFEST.strip.split
19     stream_a = manifest.each_stream.to_a
20     assert_equal(1, stream_a.size, "wrong number of streams")
21     assert_equal(stream_name, stream_a[0][0])
22     assert_equal([block_s], stream_a[0][1].map(&:to_s))
23     assert_equal([file], stream_a[0][2])
24   end
25
26   def test_simple_each_stream_block
27     manifest = Keep::Manifest.new(SIMPLEST_MANIFEST)
28     result = []
29     manifest.each_stream do |stream, blocks, files|
30       result << files
31     end
32     assert_equal([[SIMPLEST_MANIFEST.split.last]], result,
33                  "wrong result from each_stream block")
34   end
35
36   def test_multilevel_each_stream
37     manifest = Keep::Manifest.new(MULTILEVEL_MANIFEST)
38     seen = []
39     manifest.each_stream do |stream, blocks, files|
40       refute(seen.include?(stream),
41              "each_stream already yielded stream #{stream}")
42       seen << stream
43       assert_equal(3, files.size, "wrong file count for stream #{stream}")
44     end
45     assert_equal(4, seen.size, "wrong number of streams")
46   end
47
48   def test_empty_each_stream
49     assert_empty(Keep::Manifest.new("").each_stream.to_a)
50   end
51
52   def test_backslash_escape_parsing
53     m_text = "./dir\\040name #{random_block} 0:0:file\\\\name\\011\\here.txt\n"
54     manifest = Keep::Manifest.new(m_text)
55     streams = manifest.each_stream.to_a
56     assert_equal(1, streams.size, "wrong number of streams with whitespace")
57     assert_equal("./dir name", streams.first.first,
58                  "wrong stream name with whitespace")
59     assert_equal(["0:0:file\\name\t\\here.txt"], streams.first.last,
60                  "wrong filename(s) with whitespace")
61   end
62
63   def test_simple_each_file_array
64     manifest = Keep::Manifest.new(SIMPLEST_MANIFEST)
65     assert_equal([[".", "simple.txt", 9]], manifest.each_file.to_a)
66   end
67
68   def test_multilevel_each_file
69     manifest = Keep::Manifest.new(MULTILEVEL_MANIFEST)
70     seen = Hash.new { |this, key| this[key] = [] }
71     manifest.each_file do |stream, basename, size|
72       refute(seen[stream].include?(basename),
73              "each_file repeated #{stream}/#{basename}")
74       seen[stream] << basename
75       assert_equal(3, size, "wrong size for #{stream}/#{basename}")
76     end
77     seen.each_pair do |stream, basenames|
78       assert_equal(%w(file1 file2 file3), basenames.sort,
79                    "wrong file list for #{stream}")
80     end
81   end
82
83   def test_each_file_handles_filenames_with_colons
84     manifest = Keep::Manifest.new(". #{random_block(9)} 0:9:file:test.txt\n")
85     assert_equal([[".", "file:test.txt", 9]], manifest.each_file.to_a)
86   end
87 end