mirror of
https://github.com/aykhans/AzSuicideDataVisualization.git
synced 2025-04-21 10:15:45 +00:00
135 lines
5.6 KiB
Cython
135 lines
5.6 KiB
Cython
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.
|
|
# distutils: language = c++
|
|
# cython: language_level = 3
|
|
|
|
from libcpp cimport bool as c_bool
|
|
from libc.string cimport const_char
|
|
from libcpp.vector cimport vector as std_vector
|
|
from pyarrow.includes.common cimport *
|
|
from pyarrow.includes.libarrow cimport (CArray, CSchema, CStatus,
|
|
CResult, CTable, CMemoryPool,
|
|
CKeyValueMetadata,
|
|
CRecordBatch,
|
|
CTable, CCompressionType,
|
|
CRandomAccessFile, COutputStream,
|
|
TimeUnit)
|
|
|
|
# Declarations taken from the Arrow C++ ORC adapter's options header.
# Every name below is resolved inside the C++ namespace
# arrow::adapters::orc, and the whole block is declared `nogil`.
#
# NOTE(review): each quoted C name starts with a single space. That is
# reproduced verbatim from the original text -- presumably deliberate;
# confirm before normalising it.
cdef extern from "arrow/adapters/orc/options.h" \
        namespace "arrow::adapters::orc" nogil:
    # Enumerators map onto CompressionStrategy::kSpeed / ::kCompression.
    cdef enum CompressionStrategy \
            " arrow::adapters::orc::CompressionStrategy":
        _CompressionStrategy_SPEED \
            " arrow::adapters::orc::CompressionStrategy::kSpeed"
        _CompressionStrategy_COMPRESSION \
            " arrow::adapters::orc::CompressionStrategy::kCompression"

    # One enumerator per WriterId value declared by the C++ header
    # (returned by ORCFileReader.GetWriterId()).
    cdef enum WriterId" arrow::adapters::orc::WriterId":
        _WriterId_ORC_JAVA_WRITER" arrow::adapters::orc::WriterId::kOrcJava"
        _WriterId_ORC_CPP_WRITER" arrow::adapters::orc::WriterId::kOrcCpp"
        _WriterId_PRESTO_WRITER" arrow::adapters::orc::WriterId::kPresto"
        _WriterId_SCRITCHLEY_GO \
            " arrow::adapters::orc::WriterId::kScritchleyGo"
        _WriterId_TRINO_WRITER" arrow::adapters::orc::WriterId::kTrino"
        _WriterId_UNKNOWN_WRITER" arrow::adapters::orc::WriterId::kUnknown"

    # One enumerator per WriterVersion value declared by the C++ header
    # (returned by ORCFileReader.GetWriterVersion()).
    cdef enum WriterVersion" arrow::adapters::orc::WriterVersion":
        _WriterVersion_ORIGINAL \
            " arrow::adapters::orc::WriterVersion::kOriginal"
        _WriterVersion_HIVE_8732 \
            " arrow::adapters::orc::WriterVersion::kHive8732"
        _WriterVersion_HIVE_4243 \
            " arrow::adapters::orc::WriterVersion::kHive4243"
        _WriterVersion_HIVE_12055 \
            " arrow::adapters::orc::WriterVersion::kHive12055"
        _WriterVersion_HIVE_13083 \
            " arrow::adapters::orc::WriterVersion::kHive13083"
        _WriterVersion_ORC_101" arrow::adapters::orc::WriterVersion::kOrc101"
        _WriterVersion_ORC_135" arrow::adapters::orc::WriterVersion::kOrc135"
        _WriterVersion_ORC_517" arrow::adapters::orc::WriterVersion::kOrc517"
        _WriterVersion_ORC_203" arrow::adapters::orc::WriterVersion::kOrc203"
        _WriterVersion_ORC_14" arrow::adapters::orc::WriterVersion::kOrc14"
        _WriterVersion_MAX" arrow::adapters::orc::WriterVersion::kMax"

    # C++ class built from a (major, minor) pair of uint32_t values; it
    # exposes both components and ToString(), which returns a c_string.
    cdef cppclass FileVersion" arrow::adapters::orc::FileVersion":
        FileVersion(uint32_t major_version, uint32_t minor_version)
        uint32_t major_version()
        uint32_t minor_version()
        c_string ToString()

    # Writer settings struct; ORCFileWriter.Open() takes it by const
    # reference. Field meanings and units are defined by the C++ header
    # and are intentionally not restated here.
    cdef struct WriteOptions" arrow::adapters::orc::WriteOptions":
        int64_t batch_size
        FileVersion file_version
        int64_t stripe_size
        CCompressionType compression
        int64_t compression_block_size
        CompressionStrategy compression_strategy
        int64_t row_index_stride
        double padding_tolerance
        double dictionary_key_size_threshold
        std_vector[int64_t] bloom_filter_columns
        double bloom_filter_fpp
|
|
|
|
|
|
# Declarations taken from the Arrow C++ ORC adapter header. Every name
# below is resolved inside the C++ namespace arrow::adapters::orc, and the
# whole block is declared `nogil`.
cdef extern from "arrow/adapters/orc/adapter.h" \
        namespace "arrow::adapters::orc" nogil:

    # Reader side of the adapter.
    cdef cppclass ORCFileReader:
        # Static factory: takes a shared RandomAccessFile plus a memory
        # pool and yields a CResult wrapping a unique_ptr to the reader.
        @staticmethod
        CResult[unique_ptr[ORCFileReader]] Open(
            const shared_ptr[CRandomAccessFile]& file,
            CMemoryPool* pool)

        CResult[shared_ptr[const CKeyValueMetadata]] ReadMetadata()

        CResult[shared_ptr[CSchema]] ReadSchema()

        # Two overloads: by stripe index alone, or with an extra vector of
        # strings. That parameter is unnamed here -- presumably the column
        # names to include; confirm against adapter.h.
        CResult[shared_ptr[CRecordBatch]] ReadStripe(int64_t stripe)
        CResult[shared_ptr[CRecordBatch]] ReadStripe(
            int64_t stripe, std_vector[c_string])

        # Same overload pair as ReadStripe, but returning a whole CTable.
        CResult[shared_ptr[CTable]] Read()
        CResult[shared_ptr[CTable]] Read(std_vector[c_string])

        # Accessors. Only GetCompression() is wrapped in CResult; the
        # others return their value directly.
        int64_t NumberOfStripes()
        int64_t NumberOfRows()
        FileVersion GetFileVersion()
        c_string GetSoftwareVersion()
        CResult[CCompressionType] GetCompression()
        int64_t GetCompressionSize()
        int64_t GetRowIndexStride()
        WriterId GetWriterId()
        int32_t GetWriterIdValue()
        WriterVersion GetWriterVersion()
        int64_t GetNumberOfStripeStatistics()
        int64_t GetContentLength()
        int64_t GetStripeStatisticsLength()
        int64_t GetFileFooterLength()
        int64_t GetFilePostscriptLength()
        int64_t GetFileLength()
        c_string GetSerializedFileTail()

    # Writer side of the adapter.
    cdef cppclass ORCFileWriter:
        # Static factory: takes a raw COutputStream pointer and the
        # WriteOptions by const reference; yields a CResult wrapping a
        # unique_ptr to the writer.
        @staticmethod
        CResult[unique_ptr[ORCFileWriter]] Open(
            COutputStream* output_stream, const WriteOptions& writer_options)

        # Takes the table by const reference; reports outcome as CStatus.
        CStatus Write(const CTable& table)

        CStatus Close()
|