// Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #include #include #include #include "parquet/api/reader.h" int main(int argc, char** argv) { if (argc > 5 || argc < 2) { std::cerr << "Usage: parquet-reader [--only-metadata] [--no-memory-map] [--json] " << "[--dump] [--print-key-value-metadata] [--columns=...] " << std::endl; return -1; } std::string filename; bool print_values = true; bool print_key_value_metadata = false; bool memory_map = true; bool format_json = false; bool format_dump = false; // Read command-line options const std::string COLUMNS_PREFIX = "--columns="; std::list columns; char *param, *value; for (int i = 1; i < argc; i++) { if ((param = std::strstr(argv[i], "--only-metadata"))) { print_values = false; } else if ((param = std::strstr(argv[i], "--print-key-value-metadata"))) { print_key_value_metadata = true; } else if ((param = std::strstr(argv[i], "--no-memory-map"))) { memory_map = false; } else if ((param = std::strstr(argv[i], "--json"))) { format_json = true; } else if ((param = std::strstr(argv[i], "--dump"))) { format_dump = true; } else if ((param = std::strstr(argv[i], COLUMNS_PREFIX.c_str()))) { value = std::strtok(param + COLUMNS_PREFIX.length(), ","); while (value) { columns.push_back(std::atoi(value)); value = std::strtok(nullptr, ","); } } else { filename = argv[i]; } } try { std::unique_ptr reader = parquet::ParquetFileReader::OpenFile(filename, memory_map); parquet::ParquetFilePrinter printer(reader.get()); if (format_json) { printer.JSONPrint(std::cout, columns, filename.c_str()); } else { printer.DebugPrint(std::cout, columns, print_values, format_dump, print_key_value_metadata, filename.c_str()); } } catch (const std::exception& e) { std::cerr << "Parquet error: " << e.what() << std::endl; return -1; } return 0; }