* Copyright (C) 2020-2022. Huawei Technologies Co., Ltd. All rights reserved.
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef CPP_TYPE_H
#define CPP_TYPE_H
#include <vector/vector_common.h>
#include "../io/SparkFile.hh"
#include "../io/ColumnWriter.hh"
using namespace spark;
using namespace omniruntime::mem;
static constexpr int32_t kDefaultSplitterBufferSize = 4096;
static constexpr int32_t kDefaultNumSubDirs = 64;
static constexpr double spillThreshold = 0.9;
static int64_t offHeapSize = MemoryManager::GetGlobalMemoryLimit();
struct SplitOptions {
int32_t buffer_size = kDefaultSplitterBufferSize;
int32_t num_sub_dirs = kDefaultNumSubDirs;
CompressionKind compression_type = CompressionKind_NONE;
std::string next_spilled_file_dir = "";
std::string data_file;
int64_t thread_id = -1;
int64_t task_attempt_id = -1;
Allocator *allocator = Allocator::GetAllocator();
uint64_t spill_batch_row_num = 10000;
uint64_t task_spill_mem_threshold = 2L * 1024 * 1024 * 1024;
uint64_t executor_spill_mem_threshold = spillThreshold * offHeapSize;
uint64_t compress_block_size = 64 * 1024;
static SplitOptions Defaults();
};
enum ShuffleTypeId : int {
SHUFFLE_1BYTE = 0,
SHUFFLE_2BYTE = 1,
SHUFFLE_4BYTE = 2,
SHUFFLE_8BYTE = 3,
SHUFFLE_DECIMAL128 = 4,
SHUFFLE_BIT = 5,
SHUFFLE_BINARY = 6,
SHUFFLE_LARGE_BINARY = 7,
SHUFFLE_NULL = 8,
NUM_TYPES = 9,
SHUFFLE_NOT_IMPLEMENTED = 10
};
struct InputDataTypes {
int32_t *inputVecTypeIds = nullptr;
uint32_t *inputDataPrecisions = nullptr;
uint32_t *inputDataScales = nullptr;
};
#endif