diff options
author | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-21 11:54:28 +0000 |
---|---|---|
committer | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-21 11:54:28 +0000 |
commit | e6918187568dbd01842d8d1d2c808ce16a894239 (patch) | |
tree | 64f88b554b444a49f656b6c656111a145cbbaa28 /src/arrow/ruby/red-arrow-dataset/lib/arrow-dataset/arrow-table-loadable.rb | |
parent | Initial commit. (diff) | |
download | ceph-upstream/18.2.2.tar.xz ceph-upstream/18.2.2.zip |
Adding upstream version 18.2.2. (ref: upstream/18.2.2)
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'src/arrow/ruby/red-arrow-dataset/lib/arrow-dataset/arrow-table-loadable.rb')
-rw-r--r-- | src/arrow/ruby/red-arrow-dataset/lib/arrow-dataset/arrow-table-loadable.rb | 61 |
1 files changed, 61 insertions, 0 deletions
# File: src/arrow/ruby/red-arrow-dataset/lib/arrow-dataset/arrow-table-loadable.rb
# (new file, mode 100644, index 000000000..14c8dce6f)
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.

module ArrowDataset
  # Mixin that loads a table through the dataset API. It is included into
  # Arrow::TableLoader at the bottom of this file and reads the including
  # object's @input and @options instance variables.
  module ArrowTableLoadable
    private

    # Converts a local filesystem path into a file:// URI.
    #
    # The path is expanded with File.expand_path, then every byte that is not
    # allowed verbatim in a URI path segment is percent-encoded. Without the
    # encoding, a path containing a space or a non-ASCII character makes
    # URI() raise, and a path containing "#" or "?" is split into a
    # fragment/query so the URI no longer names the same file.
    #
    # Characters kept as-is: RFC 3986 unreserved and sub-delims, ":", "@"
    # and the "/" separator. Paths that already formed a valid URI (for
    # example "year=2020" directories) therefore yield the same URI as before.
    #
    # @param path [String] absolute or relative filesystem path
    # @return [URI::Generic] URI using the "file" scheme
    def path_to_uri(path)
      absolute_path = ::File.expand_path(path)
      escaped_path = absolute_path.gsub(%r{[^A-Za-z0-9\-._~!$&'()*+,;=:@/]}) do |char|
        # Encode byte by byte so multi-byte characters become several %XX.
        char.each_byte.map { |byte| "%%%02X" % byte }.join
      end
      # An expanded path that does not start with "/" needs the extra slash
      # to keep the URI authority empty (presumably drive-letter paths such
      # as "C:/data" -- confirm on the target platform).
      prefix = escaped_path.start_with?("/") ? "file://" : "file:///"
      URI("#{prefix}#{escaped_path}")
    end

    # Loads a table treating @input as a local filesystem path.
    def load_from_directory
      internal_load_from_uri(path_to_uri(@input))
    end

    # Loads a table passing @input through unchanged as the dataset URI.
    def load_from_uri
      internal_load_from_uri(@input)
    end

    # Builds a file-system dataset for the given URI, scans it and returns
    # the scanner's table.
    #
    # @options[:format] is resolved with FileFormat.resolve. Every other
    # option with a non-nil value is forwarded to the scanner builder when
    # the builder responds to the matching "<key>=" setter; options without
    # a matching setter are skipped silently.
    #
    # @param uri [Object] value assigned to the factory's file_system_uri
    # @return [Object] the result of calling to_table on the finished scanner
    def internal_load_from_uri(uri)
      format = FileFormat.resolve(@options[:format])
      dataset = FileSystemDataset.build(format) do |factory|
        factory.file_system_uri = uri
      end
      scanner_builder = dataset.begin_scan
      @options.each do |key, value|
        # :format was consumed above; it is not a scanner option.
        next if key == :format
        next if value.nil?

        setter = "#{key}="
        next unless scanner_builder.respond_to?(setter)

        scanner_builder.public_send(setter, value)
      end
      scanner_builder.finish.to_table
    end
  end
end

module Arrow
  class TableLoader
    include ArrowDataset::ArrowTableLoadable
  end
end