// Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #pragma once #include #include #include #include #include "arrow/result.h" #include "arrow/status.h" #include "arrow/util/type_fwd.h" #include "arrow/util/visibility.h" namespace arrow { namespace util { constexpr int kUseDefaultCompressionLevel = std::numeric_limits::min(); /// \brief Streaming compressor interface /// class ARROW_EXPORT Compressor { public: virtual ~Compressor() = default; struct CompressResult { int64_t bytes_read; int64_t bytes_written; }; struct FlushResult { int64_t bytes_written; bool should_retry; }; struct EndResult { int64_t bytes_written; bool should_retry; }; /// \brief Compress some input. /// /// If bytes_read is 0 on return, then a larger output buffer should be supplied. virtual Result Compress(int64_t input_len, const uint8_t* input, int64_t output_len, uint8_t* output) = 0; /// \brief Flush part of the compressed output. /// /// If should_retry is true on return, Flush() should be called again /// with a larger buffer. virtual Result Flush(int64_t output_len, uint8_t* output) = 0; /// \brief End compressing, doing whatever is necessary to end the stream. /// /// If should_retry is true on return, End() should be called again /// with a larger buffer. Otherwise, the Compressor should not be used anymore. /// /// End() implies Flush(). virtual Result End(int64_t output_len, uint8_t* output) = 0; // XXX add methods for buffer size heuristics? }; /// \brief Streaming decompressor interface /// class ARROW_EXPORT Decompressor { public: virtual ~Decompressor() = default; struct DecompressResult { // XXX is need_more_output necessary? (Brotli?) int64_t bytes_read; int64_t bytes_written; bool need_more_output; }; /// \brief Decompress some input. /// /// If need_more_output is true on return, a larger output buffer needs /// to be supplied. virtual Result Decompress(int64_t input_len, const uint8_t* input, int64_t output_len, uint8_t* output) = 0; /// \brief Return whether the compressed stream is finished. /// /// This is a heuristic. If true is returned, then it is guaranteed /// that the stream is finished. If false is returned, however, it may /// simply be that the underlying library isn't able to provide the information. virtual bool IsFinished() = 0; /// \brief Reinitialize decompressor, making it ready for a new compressed stream. virtual Status Reset() = 0; // XXX add methods for buffer size heuristics? }; /// \brief Compression codec class ARROW_EXPORT Codec { public: virtual ~Codec() = default; /// \brief Return special value to indicate that a codec implementation /// should use its default compression level static int UseDefaultCompressionLevel(); /// \brief Return a string name for compression type static const std::string& GetCodecAsString(Compression::type t); /// \brief Return compression type for name (all lower case) static Result GetCompressionType(const std::string& name); /// \brief Create a codec for the given compression algorithm static Result> Create( Compression::type codec, int compression_level = kUseDefaultCompressionLevel); /// \brief Return true if support for indicated codec has been enabled static bool IsAvailable(Compression::type codec); /// \brief Return true if indicated codec supports setting a compression level static bool SupportsCompressionLevel(Compression::type codec); /// \brief Return the smallest supported compression level for the codec /// Note: This function creates a temporary Codec instance static Result MinimumCompressionLevel(Compression::type codec); /// \brief Return the largest supported compression level for the codec /// Note: This function creates a temporary Codec instance static Result MaximumCompressionLevel(Compression::type codec); /// \brief Return the default compression level /// Note: This function creates a temporary Codec instance static Result DefaultCompressionLevel(Compression::type codec); /// \brief Return the smallest supported compression level virtual int minimum_compression_level() const = 0; /// \brief Return the largest supported compression level virtual int maximum_compression_level() const = 0; /// \brief Return the default compression level virtual int default_compression_level() const = 0; /// \brief One-shot decompression function /// /// output_buffer_len must be correct and therefore be obtained in advance. /// The actual decompressed length is returned. /// /// \note One-shot decompression is not always compatible with streaming /// compression. Depending on the codec (e.g. LZ4), different formats may /// be used. virtual Result Decompress(int64_t input_len, const uint8_t* input, int64_t output_buffer_len, uint8_t* output_buffer) = 0; /// \brief One-shot compression function /// /// output_buffer_len must first have been computed using MaxCompressedLen(). /// The actual compressed length is returned. /// /// \note One-shot compression is not always compatible with streaming /// decompression. Depending on the codec (e.g. LZ4), different formats may /// be used. virtual Result Compress(int64_t input_len, const uint8_t* input, int64_t output_buffer_len, uint8_t* output_buffer) = 0; virtual int64_t MaxCompressedLen(int64_t input_len, const uint8_t* input) = 0; /// \brief Create a streaming compressor instance virtual Result> MakeCompressor() = 0; /// \brief Create a streaming compressor instance virtual Result> MakeDecompressor() = 0; /// \brief This Codec's compression type virtual Compression::type compression_type() const = 0; /// \brief The name of this Codec's compression type const std::string& name() const { return GetCodecAsString(compression_type()); } /// \brief This Codec's compression level, if applicable virtual int compression_level() const { return UseDefaultCompressionLevel(); } private: /// \brief Initializes the codec's resources. virtual Status Init(); }; } // namespace util } // namespace arrow