# Licensed to the Apache Software Foundation (ASF) under one # or more contributor license agreements. See the NOTICE file # distributed with this work for additional information # regarding copyright ownership. The ASF licenses this file # to you under the Apache License, Version 2.0 (the # "License"); you may not use this file except in compliance # with the License. You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, # software distributed under the License is distributed on an # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY # KIND, either express or implied. See the License for the # specific language governing permissions and limitations # under the License. from libcpp.memory cimport shared_ptr from pyarrow.includes.libarrow cimport (CArray, CDataType, CField, CRecordBatch, CSchema, CTable, CTensor, CSparseCOOTensor, CSparseCSRMatrix, CSparseCSCMatrix, CSparseCSFTensor) # You cannot assign something to a dereferenced pointer in Cython thus these # methods don't use Status to indicate a successful operation. cdef api bint pyarrow_is_buffer(object buffer): return isinstance(buffer, Buffer) cdef api shared_ptr[CBuffer] pyarrow_unwrap_buffer(object buffer): cdef Buffer buf if pyarrow_is_buffer(buffer): buf = (buffer) return buf.buffer return shared_ptr[CBuffer]() cdef api object pyarrow_wrap_buffer(const shared_ptr[CBuffer]& buf): cdef Buffer result = Buffer.__new__(Buffer) result.init(buf) return result cdef api object pyarrow_wrap_resizable_buffer( const shared_ptr[CResizableBuffer]& buf): cdef ResizableBuffer result = ResizableBuffer.__new__(ResizableBuffer) result.init_rz(buf) return result cdef api bint pyarrow_is_data_type(object type_): return isinstance(type_, DataType) cdef api shared_ptr[CDataType] pyarrow_unwrap_data_type( object data_type): cdef DataType type_ if pyarrow_is_data_type(data_type): type_ = (data_type) return type_.sp_type return shared_ptr[CDataType]() # Workaround for Cython parsing bug # https://github.com/cython/cython/issues/2143 ctypedef const CPyExtensionType* _CPyExtensionTypePtr cdef api object pyarrow_wrap_data_type( const shared_ptr[CDataType]& type): cdef: const CExtensionType* ext_type const CPyExtensionType* cpy_ext_type DataType out if type.get() == NULL: return None if type.get().id() == _Type_DICTIONARY: out = DictionaryType.__new__(DictionaryType) elif type.get().id() == _Type_LIST: out = ListType.__new__(ListType) elif type.get().id() == _Type_LARGE_LIST: out = LargeListType.__new__(LargeListType) elif type.get().id() == _Type_MAP: out = MapType.__new__(MapType) elif type.get().id() == _Type_FIXED_SIZE_LIST: out = FixedSizeListType.__new__(FixedSizeListType) elif type.get().id() == _Type_STRUCT: out = StructType.__new__(StructType) elif type.get().id() == _Type_SPARSE_UNION: out = SparseUnionType.__new__(SparseUnionType) elif type.get().id() == _Type_DENSE_UNION: out = DenseUnionType.__new__(DenseUnionType) elif type.get().id() == _Type_TIMESTAMP: out = TimestampType.__new__(TimestampType) elif type.get().id() == _Type_DURATION: out = DurationType.__new__(DurationType) elif type.get().id() == _Type_FIXED_SIZE_BINARY: out = FixedSizeBinaryType.__new__(FixedSizeBinaryType) elif type.get().id() == _Type_DECIMAL128: out = Decimal128Type.__new__(Decimal128Type) elif type.get().id() == _Type_DECIMAL256: out = Decimal256Type.__new__(Decimal256Type) elif type.get().id() == _Type_EXTENSION: ext_type = type.get() cpy_ext_type = dynamic_cast[_CPyExtensionTypePtr](ext_type) if cpy_ext_type != nullptr: return cpy_ext_type.GetInstance() else: out = BaseExtensionType.__new__(BaseExtensionType) else: out = DataType.__new__(DataType) out.init(type) return out cdef object pyarrow_wrap_metadata( const shared_ptr[const CKeyValueMetadata]& meta): if meta.get() == nullptr: return None else: return KeyValueMetadata.wrap(meta) cdef api bint pyarrow_is_metadata(object metadata): return isinstance(metadata, KeyValueMetadata) cdef shared_ptr[const CKeyValueMetadata] pyarrow_unwrap_metadata(object meta): cdef shared_ptr[const CKeyValueMetadata] c_meta if pyarrow_is_metadata(meta): c_meta = (meta).unwrap() return c_meta cdef api bint pyarrow_is_field(object field): return isinstance(field, Field) cdef api shared_ptr[CField] pyarrow_unwrap_field(object field): cdef Field field_ if pyarrow_is_field(field): field_ = (field) return field_.sp_field return shared_ptr[CField]() cdef api object pyarrow_wrap_field(const shared_ptr[CField]& field): if field.get() == NULL: return None cdef Field out = Field.__new__(Field) out.init(field) return out cdef api bint pyarrow_is_schema(object schema): return isinstance(schema, Schema) cdef api shared_ptr[CSchema] pyarrow_unwrap_schema(object schema): cdef Schema sch if pyarrow_is_schema(schema): sch = (schema) return sch.sp_schema return shared_ptr[CSchema]() cdef api object pyarrow_wrap_schema(const shared_ptr[CSchema]& schema): cdef Schema out = Schema.__new__(Schema) out.init_schema(schema) return out cdef api bint pyarrow_is_array(object array): return isinstance(array, Array) cdef api shared_ptr[CArray] pyarrow_unwrap_array(object array): cdef Array arr if pyarrow_is_array(array): arr = (array) return arr.sp_array return shared_ptr[CArray]() cdef api object pyarrow_wrap_array(const shared_ptr[CArray]& sp_array): if sp_array.get() == NULL: raise ValueError('Array was NULL') klass = get_array_class_from_type(sp_array.get().type()) cdef Array arr = klass.__new__(klass) arr.init(sp_array) return arr cdef api bint pyarrow_is_chunked_array(object array): return isinstance(array, ChunkedArray) cdef api shared_ptr[CChunkedArray] pyarrow_unwrap_chunked_array(object array): cdef ChunkedArray arr if pyarrow_is_chunked_array(array): arr = (array) return arr.sp_chunked_array return shared_ptr[CChunkedArray]() cdef api object pyarrow_wrap_chunked_array( const shared_ptr[CChunkedArray]& sp_array): if sp_array.get() == NULL: raise ValueError('ChunkedArray was NULL') cdef CDataType* data_type = sp_array.get().type().get() if data_type == NULL: raise ValueError('ChunkedArray data type was NULL') cdef ChunkedArray arr = ChunkedArray.__new__(ChunkedArray) arr.init(sp_array) return arr cdef api bint pyarrow_is_scalar(object value): return isinstance(value, Scalar) cdef api shared_ptr[CScalar] pyarrow_unwrap_scalar(object scalar): if pyarrow_is_scalar(scalar): return ( scalar).unwrap() return shared_ptr[CScalar]() cdef api object pyarrow_wrap_scalar(const shared_ptr[CScalar]& sp_scalar): if sp_scalar.get() == NULL: raise ValueError('Scalar was NULL') cdef CDataType* data_type = sp_scalar.get().type.get() if data_type == NULL: raise ValueError('Scalar data type was NULL') if data_type.id() == _Type_NA: return _NULL if data_type.id() not in _scalar_classes: raise ValueError('Scalar type not supported') klass = _scalar_classes[data_type.id()] cdef Scalar scalar = klass.__new__(klass) scalar.init(sp_scalar) return scalar cdef api bint pyarrow_is_tensor(object tensor): return isinstance(tensor, Tensor) cdef api shared_ptr[CTensor] pyarrow_unwrap_tensor(object tensor): cdef Tensor ten if pyarrow_is_tensor(tensor): ten = (tensor) return ten.sp_tensor return shared_ptr[CTensor]() cdef api object pyarrow_wrap_tensor( const shared_ptr[CTensor]& sp_tensor): if sp_tensor.get() == NULL: raise ValueError('Tensor was NULL') cdef Tensor tensor = Tensor.__new__(Tensor) tensor.init(sp_tensor) return tensor cdef api bint pyarrow_is_sparse_coo_tensor(object sparse_tensor): return isinstance(sparse_tensor, SparseCOOTensor) cdef api shared_ptr[CSparseCOOTensor] pyarrow_unwrap_sparse_coo_tensor( object sparse_tensor): cdef SparseCOOTensor sten if pyarrow_is_sparse_coo_tensor(sparse_tensor): sten = (sparse_tensor) return sten.sp_sparse_tensor return shared_ptr[CSparseCOOTensor]() cdef api object pyarrow_wrap_sparse_coo_tensor( const shared_ptr[CSparseCOOTensor]& sp_sparse_tensor): if sp_sparse_tensor.get() == NULL: raise ValueError('SparseCOOTensor was NULL') cdef SparseCOOTensor sparse_tensor = SparseCOOTensor.__new__( SparseCOOTensor) sparse_tensor.init(sp_sparse_tensor) return sparse_tensor cdef api bint pyarrow_is_sparse_csr_matrix(object sparse_tensor): return isinstance(sparse_tensor, SparseCSRMatrix) cdef api shared_ptr[CSparseCSRMatrix] pyarrow_unwrap_sparse_csr_matrix( object sparse_tensor): cdef SparseCSRMatrix sten if pyarrow_is_sparse_csr_matrix(sparse_tensor): sten = (sparse_tensor) return sten.sp_sparse_tensor return shared_ptr[CSparseCSRMatrix]() cdef api object pyarrow_wrap_sparse_csr_matrix( const shared_ptr[CSparseCSRMatrix]& sp_sparse_tensor): if sp_sparse_tensor.get() == NULL: raise ValueError('SparseCSRMatrix was NULL') cdef SparseCSRMatrix sparse_tensor = SparseCSRMatrix.__new__( SparseCSRMatrix) sparse_tensor.init(sp_sparse_tensor) return sparse_tensor cdef api bint pyarrow_is_sparse_csc_matrix(object sparse_tensor): return isinstance(sparse_tensor, SparseCSCMatrix) cdef api shared_ptr[CSparseCSCMatrix] pyarrow_unwrap_sparse_csc_matrix( object sparse_tensor): cdef SparseCSCMatrix sten if pyarrow_is_sparse_csc_matrix(sparse_tensor): sten = (sparse_tensor) return sten.sp_sparse_tensor return shared_ptr[CSparseCSCMatrix]() cdef api object pyarrow_wrap_sparse_csc_matrix( const shared_ptr[CSparseCSCMatrix]& sp_sparse_tensor): if sp_sparse_tensor.get() == NULL: raise ValueError('SparseCSCMatrix was NULL') cdef SparseCSCMatrix sparse_tensor = SparseCSCMatrix.__new__( SparseCSCMatrix) sparse_tensor.init(sp_sparse_tensor) return sparse_tensor cdef api bint pyarrow_is_sparse_csf_tensor(object sparse_tensor): return isinstance(sparse_tensor, SparseCSFTensor) cdef api shared_ptr[CSparseCSFTensor] pyarrow_unwrap_sparse_csf_tensor( object sparse_tensor): cdef SparseCSFTensor sten if pyarrow_is_sparse_csf_tensor(sparse_tensor): sten = (sparse_tensor) return sten.sp_sparse_tensor return shared_ptr[CSparseCSFTensor]() cdef api object pyarrow_wrap_sparse_csf_tensor( const shared_ptr[CSparseCSFTensor]& sp_sparse_tensor): if sp_sparse_tensor.get() == NULL: raise ValueError('SparseCSFTensor was NULL') cdef SparseCSFTensor sparse_tensor = SparseCSFTensor.__new__( SparseCSFTensor) sparse_tensor.init(sp_sparse_tensor) return sparse_tensor cdef api bint pyarrow_is_table(object table): return isinstance(table, Table) cdef api shared_ptr[CTable] pyarrow_unwrap_table(object table): cdef Table tab if pyarrow_is_table(table): tab = (table) return tab.sp_table return shared_ptr[CTable]() cdef api object pyarrow_wrap_table(const shared_ptr[CTable]& ctable): cdef Table table = Table.__new__(Table) table.init(ctable) return table cdef api bint pyarrow_is_batch(object batch): return isinstance(batch, RecordBatch) cdef api shared_ptr[CRecordBatch] pyarrow_unwrap_batch(object batch): cdef RecordBatch bat if pyarrow_is_batch(batch): bat = (batch) return bat.sp_batch return shared_ptr[CRecordBatch]() cdef api object pyarrow_wrap_batch( const shared_ptr[CRecordBatch]& cbatch): cdef RecordBatch batch = RecordBatch.__new__(RecordBatch) batch.init(cbatch) return batch