// Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. // This API is EXPERIMENTAL. #pragma once #include #include #include "arrow/dataset/file_base.h" #include "arrow/dataset/type_fwd.h" #include "arrow/dataset/visibility.h" #include "arrow/io/type_fwd.h" #include "arrow/ipc/type_fwd.h" #include "arrow/result.h" namespace arrow { namespace dataset { /// \addtogroup dataset-file-formats /// /// @{ constexpr char kIpcTypeName[] = "ipc"; /// \brief A FileFormat implementation that reads from and writes to Ipc files class ARROW_DS_EXPORT IpcFileFormat : public FileFormat { public: std::string type_name() const override { return kIpcTypeName; } bool Equals(const FileFormat& other) const override { return type_name() == other.type_name(); } Result IsSupported(const FileSource& source) const override; /// \brief Return the schema of the file if possible. Result> Inspect(const FileSource& source) const override; Result ScanBatchesAsync( const std::shared_ptr& options, const std::shared_ptr& file) const override; Future> CountRows( const std::shared_ptr& file, compute::Expression predicate, const std::shared_ptr& options) override; Result> MakeWriter( std::shared_ptr destination, std::shared_ptr schema, std::shared_ptr options, fs::FileLocator destination_locator) const override; std::shared_ptr DefaultWriteOptions() override; }; /// \brief Per-scan options for IPC fragments class ARROW_DS_EXPORT IpcFragmentScanOptions : public FragmentScanOptions { public: std::string type_name() const override { return kIpcTypeName; } /// Options passed to the IPC file reader. /// included_fields, memory_pool, and use_threads are ignored. std::shared_ptr options; /// If present, the async scanner will enable I/O coalescing. /// This is ignored by the sync scanner. std::shared_ptr cache_options; }; class ARROW_DS_EXPORT IpcFileWriteOptions : public FileWriteOptions { public: /// Options passed to ipc::MakeFileWriter. use_threads is ignored std::shared_ptr options; /// custom_metadata written to the file's footer std::shared_ptr metadata; protected: using FileWriteOptions::FileWriteOptions; friend class IpcFileFormat; }; class ARROW_DS_EXPORT IpcFileWriter : public FileWriter { public: Status Write(const std::shared_ptr& batch) override; private: IpcFileWriter(std::shared_ptr destination, std::shared_ptr writer, std::shared_ptr schema, std::shared_ptr options, fs::FileLocator destination_locator); Future<> FinishInternal() override; std::shared_ptr destination_; std::shared_ptr batch_writer_; friend class IpcFileFormat; }; /// @} } // namespace dataset } // namespace arrow