/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "shuffle/HashPartitioner.h"

namespace gluten {

// Maps the raw partition key stored at pidArr[i] to a partition id.
//
// The key is reduced with the C++ remainder operator, whose result carries the
// sign of the dividend. A negative remainder is then shifted up by
// numPartitions, so for a positive numPartitions the returned value lies in
// [0, numPartitions).
//
// pidArr         array of raw partition keys; must be readable at index i.
// i              index of the row to look up in pidArr.
// numPartitions  divisor for the remainder; must be non-zero (division by zero
//                is undefined), and the [0, numPartitions) range only holds
//                when it is positive.
//
// Returns the sign-adjusted remainder of pidArr[i] by numPartitions.
int32_t computePid(const int32_t* pidArr, int64_t i, int32_t numPartitions) {
  int32_t pid = pidArr[i] % numPartitions;
#if defined(__x86_64__)
  // Branch-free sign fix-up: tmp = numPartitions + pid; `test` sets the sign
  // flag from pid; `cmovs` replaces pid with tmp only when pid is negative.
  //
  // tmp is written by the asm, so it has to be an output operand. It is marked
  // early-clobber ("=&r") because `lea` writes it before the asm has finished
  // reading pid, which keeps the compiler from sharing its register with
  // another operand. "cc" records that `test` modifies the flags.
  int32_t tmp;
  __asm__(
      "lea (%[num_partitions],%[pid],1),%[tmp]\n"
      "test %[pid],%[pid]\n"
      "cmovs %[tmp],%[pid]\n"
      : [pid] "+r"(pid), [tmp] "=&r"(tmp)
      : [num_partitions] "r"(numPartitions)
      : "cc");
#else
  if (pid < 0) {
    pid += numPartitions;
  }
#endif
  return pid;
}

// Computes the partition id of every row and stores it in row2partition.
//
// row2partition is resized to numRows, and element i receives the result of
// computePid(pidArr, i, numPartitions_) converted to uint32_t.
//
// pidArr         array of raw partition keys; read at indices [0, numRows).
// numRows        number of rows to process.
// row2partition  output vector; any previous contents are overwritten.
//
// Always returns arrow::Status::OK().
arrow::Status
gluten::HashPartitioner::compute(const int32_t* pidArr, const int64_t numRows, std::vector<uint32_t>& row2partition) {
  row2partition.resize(numRows);
  // The index is int64_t to match numRows. An `auto i = 0` counter is a plain
  // int and would overflow (undefined behavior) once numRows exceeds INT32_MAX.
  for (int64_t i = 0; i < numRows; ++i) {
    row2partition[i] = computePid(pidArr, i, numPartitions_);
  }
  return arrow::Status::OK();
}

// Groups the rows of one input vector by partition id.
//
// For each row i, the partition id is computePid(pidArr, i, numPartitions_).
// A 64-bit value holding vectorIndex in the upper 32 bits and the low 32 bits
// of the row index in the lower 32 bits is appended to
// rowVectorIndexMap[pid]. Entries already present in the map are kept; new
// values are appended after them.
//
// pidArr             array of raw partition keys; read at indices [0, numRows).
// numRows            number of rows to process.
// vectorIndex        index placed in the upper 32 bits of every emitted value.
// rowVectorIndexMap  output map from partition id to the packed
//                    (vectorIndex, row) values assigned to that partition.
//
// Always returns arrow::Status::OK().
arrow::Status gluten::HashPartitioner::compute(
    const int32_t* pidArr,
    const int64_t numRows,
    const int32_t vectorIndex,
    std::unordered_map<int32_t, std::vector<int64_t>>& rowVectorIndexMap) {
  const int64_t index = static_cast<int64_t>(vectorIndex) << 32;
  // The index is int64_t to match numRows. An `auto i = 0` counter is a plain
  // int and would overflow (undefined behavior) once numRows exceeds INT32_MAX.
  for (int64_t i = 0; i < numRows; ++i) {
    const auto pid = computePid(pidArr, i, numPartitions_);
    // Only the low 32 bits of the row index fit next to vectorIndex.
    const int64_t combined = index | (i & 0xFFFFFFFFLL);
    rowVectorIndexMap[pid].push_back(combined);
  }

  return arrow::Status::OK();
}

} // namespace gluten