1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
|
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
# Save/load round-trip tests for Arrow::Table using Parquet output.
#
# Every test writes the fixture table built in #setup, reads it back and
# checks the result with Arrow::Table#equal_metadata.
class TestArrowTable < Test::Unit::TestCase
  # Builds the fixture table and a temporary ".parquet" file.
  #
  # The table has three columns ("count", "visible", "label"); each column
  # is a chunked array holding 8 values, and the chunk layouts differ
  # between columns. The temporary file is yielded and then removed with
  # Tempfile#close!, even when the yielded code raises.
  # NOTE(review): relies on the test framework running the test body
  # inside the yield -- confirm against the test-unit setup documentation.
  def setup
    @count_field = Arrow::Field.new("count", :uint8)
    @visible_field = Arrow::Field.new("visible", :boolean)
    @label_field = Arrow::Field.new("label", :string)
    fields = [@count_field, @visible_field, @label_field]
    schema = Arrow::Schema.new(fields)

    count_chunks = [[1, 2], [4, 8, 16], [32, 64], [128]].map do |values|
      Arrow::UInt8Array.new(values)
    end
    visible_chunks = [
      [true, false, nil],
      [true],
      [true, false],
      [nil],
      [nil],
    ].map do |values|
      Arrow::BooleanArray.new(values)
    end
    label_chunks = [["a"], ["b", "c"], ["d", nil, nil], ["e", "f"]].map do |values|
      Arrow::StringArray.new(values)
    end

    @count_array = Arrow::ChunkedArray.new(count_chunks)
    @visible_array = Arrow::ChunkedArray.new(visible_chunks)
    @label_array = Arrow::ChunkedArray.new(label_chunks)
    columns = [@count_array, @visible_array, @label_array]
    @table = Arrow::Table.new(schema, columns)

    @output = Tempfile.open(["red-parquet", ".parquet"])
    begin
      yield(@output)
    ensure
      # close! both closes and unlinks the temporary file.
      @output.close!
    end
  end

  # Round trip through a file path with no extra options.
  # NOTE(review): the `false` passed to equal_metadata here and in the
  # tests below presumably disables metadata comparison -- confirm against
  # the Arrow GLib documentation.
  def test_save_load_path
    path = @output.path
    @table.save(path)
    loaded = Arrow::Table.load(path)
    assert { @table.equal_metadata(loaded, false) }
  end

  # Round trip through an in-memory resizable buffer; the format is given
  # explicitly on both save and load.
  def test_save_load_buffer
    buffer = Arrow::ResizableBuffer.new(1024)
    @table.save(buffer, format: :parquet)
    loaded = Arrow::Table.load(buffer, format: :parquet)
    assert { @table.equal_metadata(loaded, false) }
  end

  # Round trip with a single compression option (:zstd) passed to save.
  def test_save_load_compression
    path = @output.path
    @table.save(path, compression: :zstd)
    loaded = Arrow::Table.load(path)
    assert { @table.equal_metadata(loaded, false) }
  end

  # Round trip with compression given as a hash.
  # NOTE(review): the key "count" matches a column name, so this looks
  # like per-column compression -- confirm against Table#save.
  def test_save_load_compression_path
    path = @output.path
    @table.save(path, compression: {"count" => :zstd})
    loaded = Arrow::Table.load(path)
    assert { @table.equal_metadata(loaded, false) }
  end

  # Round trip with the dictionary option set to false.
  def test_save_load_dictionary
    path = @output.path
    @table.save(path, dictionary: false)
    loaded = Arrow::Table.load(path)
    assert { @table.equal_metadata(loaded, false) }
  end

  # Round trip with the dictionary option given as [name, flag] pairs.
  # NOTE(review): "label" matches a column name, so this looks like a
  # per-column dictionary setting -- confirm against Table#save.
  def test_save_load_dictionary_path
    path = @output.path
    @table.save(path, dictionary: [["label", false]])
    loaded = Arrow::Table.load(path)
    assert { @table.equal_metadata(loaded, false) }
  end
end
|