mirror of
https://github.com/aykhans/AzSuicideDataVisualization.git
synced 2025-07-02 06:22:25 +00:00
214 lines
6.4 KiB
C++
214 lines
6.4 KiB
C++
// Licensed to the Apache Software Foundation (ASF) under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing,
|
|
// software distributed under the License is distributed on an
|
|
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations
|
|
// under the License.
|
|
|
|
#pragma once
|
|
|
|
#include <cstdint>
|
|
#include <cstring>
|
|
#include <memory>
|
|
#include <type_traits>
|
|
|
|
#include "arrow/array/builder_base.h"
|
|
#include "arrow/buffer.h"
|
|
#include "arrow/status.h"
|
|
#include "arrow/type.h"
|
|
#include "arrow/util/macros.h"
|
|
#include "arrow/util/visibility.h"
|
|
|
|
namespace arrow {
|
|
|
|
/// \addtogroup numeric-builders
|
|
///
|
|
/// @{
|
|
|
|
namespace internal {
|
|
|
|
class ARROW_EXPORT AdaptiveIntBuilderBase : public ArrayBuilder {
|
|
public:
|
|
AdaptiveIntBuilderBase(uint8_t start_int_size, MemoryPool* pool);
|
|
|
|
explicit AdaptiveIntBuilderBase(MemoryPool* pool)
|
|
: AdaptiveIntBuilderBase(sizeof(uint8_t), pool) {}
|
|
|
|
/// \brief Append multiple nulls
|
|
/// \param[in] length the number of nulls to append
|
|
Status AppendNulls(int64_t length) final {
|
|
ARROW_RETURN_NOT_OK(CommitPendingData());
|
|
if (ARROW_PREDICT_TRUE(length > 0)) {
|
|
ARROW_RETURN_NOT_OK(Reserve(length));
|
|
memset(data_->mutable_data() + length_ * int_size_, 0, int_size_ * length);
|
|
UnsafeSetNull(length);
|
|
}
|
|
return Status::OK();
|
|
}
|
|
|
|
Status AppendNull() final {
|
|
pending_data_[pending_pos_] = 0;
|
|
pending_valid_[pending_pos_] = 0;
|
|
pending_has_nulls_ = true;
|
|
++pending_pos_;
|
|
++length_;
|
|
++null_count_;
|
|
|
|
if (ARROW_PREDICT_FALSE(pending_pos_ >= pending_size_)) {
|
|
return CommitPendingData();
|
|
}
|
|
return Status::OK();
|
|
}
|
|
|
|
Status AppendEmptyValues(int64_t length) final {
|
|
ARROW_RETURN_NOT_OK(CommitPendingData());
|
|
if (ARROW_PREDICT_TRUE(length > 0)) {
|
|
ARROW_RETURN_NOT_OK(Reserve(length));
|
|
memset(data_->mutable_data() + length_ * int_size_, 0, int_size_ * length);
|
|
UnsafeSetNotNull(length);
|
|
}
|
|
return Status::OK();
|
|
}
|
|
|
|
Status AppendEmptyValue() final {
|
|
pending_data_[pending_pos_] = 0;
|
|
pending_valid_[pending_pos_] = 1;
|
|
++pending_pos_;
|
|
++length_;
|
|
|
|
if (ARROW_PREDICT_FALSE(pending_pos_ >= pending_size_)) {
|
|
return CommitPendingData();
|
|
}
|
|
return Status::OK();
|
|
}
|
|
|
|
void Reset() override;
|
|
Status Resize(int64_t capacity) override;
|
|
|
|
protected:
|
|
Status AppendInternal(const uint64_t val) {
|
|
pending_data_[pending_pos_] = val;
|
|
pending_valid_[pending_pos_] = 1;
|
|
++pending_pos_;
|
|
++length_;
|
|
|
|
if (ARROW_PREDICT_FALSE(pending_pos_ >= pending_size_)) {
|
|
return CommitPendingData();
|
|
}
|
|
return Status::OK();
|
|
}
|
|
|
|
virtual Status CommitPendingData() = 0;
|
|
|
|
template <typename new_type, typename old_type>
|
|
typename std::enable_if<sizeof(old_type) >= sizeof(new_type), Status>::type
|
|
ExpandIntSizeInternal();
|
|
template <typename new_type, typename old_type>
|
|
typename std::enable_if<(sizeof(old_type) < sizeof(new_type)), Status>::type
|
|
ExpandIntSizeInternal();
|
|
|
|
std::shared_ptr<ResizableBuffer> data_;
|
|
uint8_t* raw_data_ = NULLPTR;
|
|
|
|
const uint8_t start_int_size_;
|
|
uint8_t int_size_;
|
|
|
|
static constexpr int32_t pending_size_ = 1024;
|
|
uint8_t pending_valid_[pending_size_];
|
|
uint64_t pending_data_[pending_size_];
|
|
int32_t pending_pos_ = 0;
|
|
bool pending_has_nulls_ = false;
|
|
};
|
|
|
|
} // namespace internal
|
|
|
|
class ARROW_EXPORT AdaptiveUIntBuilder : public internal::AdaptiveIntBuilderBase {
|
|
public:
|
|
explicit AdaptiveUIntBuilder(uint8_t start_int_size,
|
|
MemoryPool* pool = default_memory_pool());
|
|
|
|
explicit AdaptiveUIntBuilder(MemoryPool* pool = default_memory_pool())
|
|
: AdaptiveUIntBuilder(sizeof(uint8_t), pool) {}
|
|
|
|
using ArrayBuilder::Advance;
|
|
using internal::AdaptiveIntBuilderBase::Reset;
|
|
|
|
/// Scalar append
|
|
Status Append(const uint64_t val) { return AppendInternal(val); }
|
|
|
|
/// \brief Append a sequence of elements in one shot
|
|
/// \param[in] values a contiguous C array of values
|
|
/// \param[in] length the number of values to append
|
|
/// \param[in] valid_bytes an optional sequence of bytes where non-zero
|
|
/// indicates a valid (non-null) value
|
|
/// \return Status
|
|
Status AppendValues(const uint64_t* values, int64_t length,
|
|
const uint8_t* valid_bytes = NULLPTR);
|
|
|
|
Status FinishInternal(std::shared_ptr<ArrayData>* out) override;
|
|
|
|
std::shared_ptr<DataType> type() const override;
|
|
|
|
protected:
|
|
Status CommitPendingData() override;
|
|
Status ExpandIntSize(uint8_t new_int_size);
|
|
|
|
Status AppendValuesInternal(const uint64_t* values, int64_t length,
|
|
const uint8_t* valid_bytes);
|
|
|
|
template <typename new_type>
|
|
Status ExpandIntSizeN();
|
|
};
|
|
|
|
class ARROW_EXPORT AdaptiveIntBuilder : public internal::AdaptiveIntBuilderBase {
|
|
public:
|
|
explicit AdaptiveIntBuilder(uint8_t start_int_size,
|
|
MemoryPool* pool = default_memory_pool());
|
|
|
|
explicit AdaptiveIntBuilder(MemoryPool* pool = default_memory_pool())
|
|
: AdaptiveIntBuilder(sizeof(uint8_t), pool) {}
|
|
|
|
using ArrayBuilder::Advance;
|
|
using internal::AdaptiveIntBuilderBase::Reset;
|
|
|
|
/// Scalar append
|
|
Status Append(const int64_t val) { return AppendInternal(static_cast<uint64_t>(val)); }
|
|
|
|
/// \brief Append a sequence of elements in one shot
|
|
/// \param[in] values a contiguous C array of values
|
|
/// \param[in] length the number of values to append
|
|
/// \param[in] valid_bytes an optional sequence of bytes where non-zero
|
|
/// indicates a valid (non-null) value
|
|
/// \return Status
|
|
Status AppendValues(const int64_t* values, int64_t length,
|
|
const uint8_t* valid_bytes = NULLPTR);
|
|
|
|
Status FinishInternal(std::shared_ptr<ArrayData>* out) override;
|
|
|
|
std::shared_ptr<DataType> type() const override;
|
|
|
|
protected:
|
|
Status CommitPendingData() override;
|
|
Status ExpandIntSize(uint8_t new_int_size);
|
|
|
|
Status AppendValuesInternal(const int64_t* values, int64_t length,
|
|
const uint8_t* valid_bytes);
|
|
|
|
template <typename new_type>
|
|
Status ExpandIntSizeN();
|
|
};
|
|
|
|
/// @}
|
|
|
|
} // namespace arrow
|