summaryrefslogtreecommitdiffstats
path: root/cmake/modules/BuildArrow.cmake
diff options
context:
space:
mode:
Diffstat (limited to 'cmake/modules/BuildArrow.cmake')
-rw-r--r--cmake/modules/BuildArrow.cmake167
1 files changed, 167 insertions, 0 deletions
diff --git a/cmake/modules/BuildArrow.cmake b/cmake/modules/BuildArrow.cmake
new file mode 100644
index 000000000..691108a40
--- /dev/null
+++ b/cmake/modules/BuildArrow.cmake
@@ -0,0 +1,167 @@
+# apache arrow and its parquet library are used in radosgw for s3 select
+
+function(build_arrow)
+ # only enable the parquet component
+ set(arrow_CMAKE_ARGS -DARROW_PARQUET=ON)
+
+ # only use preinstalled dependencies for arrow, don't fetch/build any
+ list(APPEND arrow_CMAKE_ARGS -DARROW_DEPENDENCY_SOURCE=SYSTEM)
+
+ # only build static version of arrow and parquet
+ list(APPEND arrow_CMAKE_ARGS -DARROW_BUILD_SHARED=OFF)
+ list(APPEND arrow_CMAKE_ARGS -DARROW_BUILD_STATIC=ON)
+
+ # arrow only supports its own bundled version of jemalloc, so can't
+ # share the version ceph is using
+ list(APPEND arrow_CMAKE_ARGS -DARROW_JEMALLOC=OFF)
+
+ # transitive dependencies
+ list(APPEND arrow_INTERFACE_LINK_LIBRARIES thrift)
+
+ if (NOT WITH_SYSTEM_UTF8PROC)
+ # forward utf8proc_ROOT from build_utf8proc()
+ list(APPEND arrow_CMAKE_ARGS -Dutf8proc_ROOT=${utf8proc_ROOT})
+ # non-system utf8proc is bundled as a static library
+ list(APPEND arrow_CMAKE_ARGS -DARROW_UTF8PROC_USE_SHARED=OFF)
+ # make sure utf8proc submodule builds first, so arrow can find its byproducts
+ list(APPEND arrow_DEPENDS utf8proc::utf8proc)
+ endif()
+
+ list(APPEND arrow_CMAKE_ARGS -DARROW_WITH_BROTLI=${HAVE_BROTLI})
+ if (HAVE_BROTLI) # optional, off by default
+ list(APPEND arrow_INTERFACE_LINK_LIBRARIES ${brotli_libs})
+ endif (HAVE_BROTLI)
+
+ list(APPEND arrow_CMAKE_ARGS -DARROW_WITH_BZ2=OFF)
+
+ list(APPEND arrow_CMAKE_ARGS -DARROW_WITH_LZ4=${HAVE_LZ4})
+ if (HAVE_LZ4) # optional, on by default
+ list(APPEND arrow_INTERFACE_LINK_LIBRARIES LZ4::LZ4)
+ endif (HAVE_LZ4)
+
+ list(APPEND arrow_CMAKE_ARGS -DARROW_WITH_SNAPPY=ON) # required
+ list(APPEND arrow_INTERFACE_LINK_LIBRARIES snappy::snappy)
+
+ if(WITH_RADOSGW_ARROW_FLIGHT)
+ message("building arrow flight; make sure grpc-plugins is installed on the system")
+ list(APPEND arrow_CMAKE_ARGS
+ -DARROW_FLIGHT=ON -DARROW_WITH_RE2=OFF)
+ find_package(gRPC REQUIRED)
+ find_package(Protobuf REQUIRED)
+ find_package(c-ares 1.13.0 QUIET REQUIRED)
+ endif(WITH_RADOSGW_ARROW_FLIGHT)
+
+ list(APPEND arrow_CMAKE_ARGS -DARROW_WITH_ZLIB=ON) # required
+ list(APPEND arrow_INTERFACE_LINK_LIBRARIES ZLIB::ZLIB)
+
+ list(APPEND arrow_CMAKE_ARGS -DARROW_WITH_ZSTD=${WITH_SYSTEM_ZSTD})
+ if (WITH_SYSTEM_ZSTD)
+ find_package(Zstd 1.4.4 REQUIRED)
+ list(APPEND arrow_INTERFACE_LINK_LIBRARIES Zstd::Zstd)
+ endif (WITH_SYSTEM_ZSTD)
+
+ list(APPEND arrow_CMAKE_ARGS -DBOOST_ROOT=${BOOST_ROOT})
+ list(APPEND arrow_CMAKE_ARGS -DBOOST_INCLUDEDIR=${Boost_INCLUDE_DIR})
+ list(APPEND arrow_CMAKE_ARGS -DBOOST_LIBRARYDIR=${BOOST_LIBRARYDIR})
+
+ if (NOT WITH_SYSTEM_BOOST)
+ # make sure boost submodule builds first, so arrow can find its byproducts
+ list(APPEND arrow_DEPENDS Boost)
+ endif()
+
+ # cmake doesn't properly handle arguments containing ";", such as
+ # CMAKE_PREFIX_PATH, for which reason we'll have to use some other separator.
+ string(REPLACE ";" "!" CMAKE_PREFIX_PATH_ALT_SEP "${CMAKE_PREFIX_PATH}")
+ list(APPEND arrow_CMAKE_ARGS -DCMAKE_PREFIX_PATH=${CMAKE_PREFIX_PATH_ALT_SEP})
+ if(CMAKE_TOOLCHAIN_FILE)
+ list(APPEND arrow_CMAKE_ARGS
+ -DCMAKE_TOOLCHAIN_FILE=${CMAKE_TOOLCHAIN_FILE})
+ endif()
+
+ list(APPEND arrow_CMAKE_ARGS -DCMAKE_C_COMPILER=${CMAKE_C_COMPILER})
+ list(APPEND arrow_CMAKE_ARGS -DCMAKE_CXX_COMPILER=${CMAKE_CXX_COMPILER})
+ list(APPEND arrow_CMAKE_ARGS -DCMAKE_AR=${CMAKE_AR})
+ if(CMAKE_BUILD_TYPE AND NOT CMAKE_BUILD_TYPE STREQUAL "None")
+ list(APPEND arrow_CMAKE_ARGS -DCMAKE_BUILD_TYPE=${CMAKE_BUILD_TYPE})
+ else()
+ list(APPEND arrow_CMAKE_ARGS -DCMAKE_BUILD_TYPE=Release)
+ endif()
+
+ # we use an external project and copy the sources to bin directory to ensure
+ # that object files are built outside of the source tree.
+ include(ExternalProject)
+ set(arrow_SOURCE_DIR "${CMAKE_CURRENT_SOURCE_DIR}/arrow/cpp")
+ set(arrow_BINARY_DIR "${CMAKE_CURRENT_BINARY_DIR}/arrow/cpp")
+
+ set(arrow_INSTALL_PREFIX "${CMAKE_CURRENT_BINARY_DIR}/arrow")
+ list(APPEND arrow_CMAKE_ARGS -DCMAKE_INSTALL_PREFIX=${arrow_INSTALL_PREFIX})
+
+ set(arrow_INSTALL_LIBDIR "lib") # force lib so we don't have to guess between lib/lib64
+ list(APPEND arrow_CMAKE_ARGS -DCMAKE_INSTALL_LIBDIR=${arrow_INSTALL_LIBDIR})
+ set(arrow_LIBRARY_DIR "${arrow_INSTALL_PREFIX}/${arrow_INSTALL_LIBDIR}")
+
+ set(arrow_LIBRARY "${arrow_LIBRARY_DIR}/libarrow.a")
+ set(parquet_LIBRARY "${arrow_LIBRARY_DIR}/libparquet.a")
+
+ set(arrow_INCLUDE_DIR "${arrow_INSTALL_PREFIX}/include")
+ # this include directory won't exist until the install step, but the
+ # imported targets need it early for INTERFACE_INCLUDE_DIRECTORIES
+ file(MAKE_DIRECTORY "${arrow_INCLUDE_DIR}")
+
+ set(arrow_BYPRODUCTS ${arrow_LIBRARY})
+ list(APPEND arrow_BYPRODUCTS ${parquet_LIBRARY})
+
+ if(WITH_RADOSGW_ARROW_FLIGHT)
+ set(arrow_flight_LIBRARY "${arrow_LIBRARY_DIR}/libarrow_flight.a")
+ list(APPEND arrow_BYPRODUCTS ${arrow_flight_LIBRARY})
+ endif(WITH_RADOSGW_ARROW_FLIGHT)
+
+ if(CMAKE_MAKE_PROGRAM MATCHES "make")
+ # try to inherit command line arguments passed by parent "make" job
+ set(make_cmd $(MAKE))
+ set(install_cmd $(MAKE) install)
+ else()
+ set(make_cmd ${CMAKE_COMMAND} --build <BINARY_DIR>)
+ set(install_cmd ${CMAKE_COMMAND} --build <BINARY_DIR> --target install)
+ endif()
+
+ # clear the DESTDIR environment variable from debian/rules,
+ # because it messes with the internal install paths of arrow's bundled deps
+ set(NO_DESTDIR_COMMAND ${CMAKE_COMMAND} -E env --unset=DESTDIR)
+
+ ExternalProject_Add(arrow_ext
+ SOURCE_DIR "${arrow_SOURCE_DIR}"
+ CMAKE_ARGS ${arrow_CMAKE_ARGS}
+ BINARY_DIR "${arrow_BINARY_DIR}"
+ BUILD_COMMAND ${NO_DESTDIR_COMMAND} ${make_cmd}
+ BUILD_BYPRODUCTS "${arrow_BYPRODUCTS}"
+ INSTALL_COMMAND ${NO_DESTDIR_COMMAND} ${install_cmd}
+ INSTALL_DIR "${arrow_INSTALL_PREFIX}"
+ DEPENDS "${arrow_DEPENDS}"
+ LIST_SEPARATOR !)
+
+ add_library(Arrow::Arrow STATIC IMPORTED)
+ add_dependencies(Arrow::Arrow arrow_ext)
+ set_target_properties(Arrow::Arrow PROPERTIES
+ INTERFACE_INCLUDE_DIRECTORIES "${arrow_INCLUDE_DIR}"
+ INTERFACE_LINK_LIBRARIES "${arrow_INTERFACE_LINK_LIBRARIES}"
+ IMPORTED_LINK_INTERFACE_LANGUAGES "CXX"
+ IMPORTED_LOCATION "${arrow_LIBRARY}")
+
+ add_library(Arrow::Parquet STATIC IMPORTED)
+ add_dependencies(Arrow::Parquet arrow_ext)
+ target_link_libraries(Arrow::Parquet INTERFACE Arrow::Arrow)
+ set_target_properties(Arrow::Parquet PROPERTIES
+ IMPORTED_LINK_INTERFACE_LANGUAGES "CXX"
+ IMPORTED_LOCATION "${parquet_LIBRARY}")
+
+ if(WITH_RADOSGW_ARROW_FLIGHT)
+ add_library(Arrow::Flight STATIC IMPORTED)
+ add_dependencies(Arrow::Flight arrow_ext)
+ target_link_libraries(Arrow::Flight INTERFACE Arrow::Arrow gRPC::grpc++)
+ set_target_properties(Arrow::Flight PROPERTIES
+ INTERFACE_INCLUDE_DIRECTORIES "${arrow_INCLUDE_DIR}" # flight is accessed via "arrow/flight"
+ IMPORTED_LINK_INTERFACE_LANGUAGES "CXX"
+ IMPORTED_LOCATION "${arrow_flight_LIBRARY}")
+ endif(WITH_RADOSGW_ARROW_FLIGHT)
+endfunction()