# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.

# Exercises ArrowDataset::ScannerBuilder: construction from a record batch
# reader, filtering with an expression, and the use_async setter.
class TestDatasetScannerBuilder < Test::Unit::TestCase
  include Helper::Buildable
  include Helper::Writable

  # Writes a small two-column table ("visible", "point") to table.arrow in a
  # temporary directory, opens it as a dataset through the IPC file format and
  # starts a scan, exposing @table, @format, @dataset and @builder.
  #
  # The yield sits inside the Dir.mktmpdir block so that whatever the test
  # framework runs at that point still sees the temporary directory.
  def setup
    omit("Arrow Dataset is required") unless defined?(ArrowDataset)

    Dir.mktmpdir do |dir|
      @format = ArrowDataset::IPCFileFormat.new

      # Each column is given as two arrays: 3 values, then 4 values.
      visible_arrays = [
        build_boolean_array([true, false, true]),
        build_boolean_array([false, true, false, true]),
      ]
      point_arrays = [
        build_int32_array([1, 2, 3]),
        build_int32_array([-1, -2, -3, -4]),
      ]
      @table = build_table(visible: visible_arrays, point: point_arrays)

      arrow_path = File.join(dir, "table.arrow")
      write_table(@table, arrow_path)

      dataset_factory = ArrowDataset::FileSystemDatasetFactory.new(@format)
      dataset_factory.file_system_uri = build_file_uri(arrow_path)
      @dataset = dataset_factory.finish
      @builder = @dataset.begin_scan

      yield
    end
  end

  # A scanner built directly from a record batch reader over @table must
  # produce a table equal to @table.
  def test_new_record_batch_reader
    batch_reader = Arrow::TableBatchReader.new(@table)
    scanner_builder = ArrowDataset::ScannerBuilder.new(batch_reader)
    scanner = scanner_builder.finish

    assert_equal(@table, scanner.to_table)
  end

  # Applies the expression equal(visible, true) as the scan filter and checks
  # that only the rows whose "visible" value is true remain.
  def test_filter
    visible_field = Arrow::FieldExpression.new("visible")
    literal_true = Arrow::LiteralExpression.new(
      Arrow::ScalarDatum.new(Arrow::BooleanScalar.new(true))
    )
    @builder.filter = Arrow::CallExpression.new("equal",
                                                [visible_field, literal_true])
    scanner = @builder.finish

    expected_visible = [
      build_boolean_array([true, true]),
      build_boolean_array([true, true]),
    ]
    expected_point = [
      build_int32_array([1, 3]),
      build_int32_array([-2, -4]),
    ]
    expected = build_table(visible: expected_visible, point: expected_point)

    assert_equal(expected, scanner.to_table)
  end

  # Setting use_async to true must still yield a table equal to @table.
  def test_use_async
    @builder.use_async = true

    assert_equal(@table, @builder.finish.to_table)
  end
end