summary refs log tree commit diff stats
path: root/src/arrow/ruby/red-parquet/test/test-arrow-table.rb
blob: 1ea2669e316d9f809c6b4faf5f60ae0dd2dcff27 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.

# Round-trip tests: save an Arrow::Table in Parquet form (to a file path or
# to an in-memory buffer) and check that loading it back yields an equal table.
class TestArrowTable < Test::Unit::TestCase
  # Builds the fixture table and wraps the test in a temporary ".parquet" file.
  #
  # The table has three columns ("count", "visible", "label"). Each column
  # holds eight values, and the chunk boundaries differ from column to column.
  def setup
    @count_field = Arrow::Field.new("count", :uint8)
    @visible_field = Arrow::Field.new("visible", :boolean)
    @label_field = Arrow::Field.new("label", :string)
    table_schema = Arrow::Schema.new([@count_field, @visible_field, @label_field])

    count_chunks = [[1, 2], [4, 8, 16], [32, 64], [128]].map do |values|
      Arrow::UInt8Array.new(values)
    end
    visible_chunks = [[true, false, nil], [true], [true, false], [nil], [nil]].map do |values|
      Arrow::BooleanArray.new(values)
    end
    label_chunks = [["a"], ["b", "c"], ["d", nil, nil], ["e", "f"]].map do |values|
      Arrow::StringArray.new(values)
    end

    @count_array = Arrow::ChunkedArray.new(count_chunks)
    @visible_array = Arrow::ChunkedArray.new(visible_chunks)
    @label_array = Arrow::ChunkedArray.new(label_chunks)
    columns = [@count_array, @visible_array, @label_array]
    @table = Arrow::Table.new(table_schema, columns)

    @output = Tempfile.open(["red-parquet", ".parquet"])
    begin
      # Yielding from setup hands control back to the framework (presumably
      # to run the test body), so the temporary file outlives the test.
      yield @output
    ensure
      # Tempfile#close! closes the file and unlinks it from disk.
      @output.close!
    end
  end

  # Save to a file path with default options, then load from the same path.
  def test_save_load_path
    @table.save(@output.path)
    reloaded = Arrow::Table.load(@output.path)
    assert { @table.equal_metadata(reloaded, false) }
  end

  # Save into a resizable in-memory buffer; the format is passed explicitly
  # on both save and load.
  def test_save_load_buffer
    buffer = Arrow::ResizableBuffer.new(1024)
    @table.save(buffer, format: :parquet)
    reloaded = Arrow::Table.load(buffer, format: :parquet)
    assert { @table.equal_metadata(reloaded, false) }
  end

  # Save with a single compression setting (:zstd) given as a bare symbol.
  def test_save_load_compression
    @table.save(@output.path, compression: :zstd)
    reloaded = Arrow::Table.load(@output.path)
    assert { @table.equal_metadata(reloaded, false) }
  end

  # Save with compression given as a hash keyed by column name ("count").
  def test_save_load_compression_path
    @table.save(@output.path, compression: {"count" => :zstd})
    reloaded = Arrow::Table.load(@output.path)
    assert { @table.equal_metadata(reloaded, false) }
  end

  # Save with the dictionary option given as a single boolean (false).
  def test_save_load_dictionary
    @table.save(@output.path, dictionary: false)
    reloaded = Arrow::Table.load(@output.path)
    assert { @table.equal_metadata(reloaded, false) }
  end

  # Save with the dictionary option given as [column name, boolean] pairs.
  def test_save_load_dictionary_path
    @table.save(@output.path, dictionary: [["label", false]])
    reloaded = Arrow::Table.load(@output.path)
    assert { @table.equal_metadata(reloaded, false) }
  end
end