openGauss-server/src/gausskernel/storage/access/hash/hashfunc.cpp-代码预览-openGauss-server:基于关系型数据库技术的企业级数据库管理系统项目 - AtomGit

Lli-judong1、老问题：修复分区剪枝、分区路由未使用正确的collation导致的core问题和剪枝问题
97f9f7d2创建于 2023年7月3日历史提交
/* -------------------------------------------------------------------------
 *
 * hashfunc.cpp
 *	  Support functions for hash access method.
 *
 * Portions Copyright (c) 2020 Huawei Technologies Co.,Ltd.
 * Portions Copyright (c) 1996-2012, PostgreSQL Global Development Group
 * Portions Copyright (c) 1994, Regents of the University of California
 *
 *
 * IDENTIFICATION
 *	  src/gausskernel/storage/access/hash/hashfunc.cpp
 *
 * NOTES
 *	  These functions are stored in pg_amproc.	For each operator class
 *	  defined for hash indexes, they compute the hash value of the argument.
 *
 *	  Additional hash functions appear in /utils/adt/ files for various
 *	  specialized datatypes.
 *
 *	  It is expected that every bit of a hash function's 32-bit result is
 *	  as random as every other; failure to ensure this is likely to lead
 *	  to poor performance of hash joins, for example.  In most cases a hash
 *	  function should use hash_any() or its variant hash_uint32().
 *
 * -------------------------------------------------------------------------
 */
#include "postgres.h"
#include "knl/knl_variable.h"

#include "access/hash.h"
#include "catalog/gs_collation.h"

#ifdef PGXC
#include "catalog/pg_type.h"
#include "utils/builtins.h"
#include "utils/timestamp.h"
#include "utils/date.h"
#include "utils/nabstime.h"
#include "utils/guc.h"
#include "pgxc/groupmgr.h"
#include "pgxc/locator.h"
#include "utils/typcache.h"
#include "vecexecutor/vectorbatch.h"
#include "utils/uuid.h"
#endif

#ifndef ENABLE_MULTIPLE_NODES
#define EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE \
    ereport(ERROR, (errcode(ERRCODE_FEATURE_NOT_SUPPORTED), errmsg("unsupported proc in single node mode.")))
#endif

/* Note: this is used for both "char" and boolean datatypes */
Datum hashchar(PG_FUNCTION_ARGS)
{
    return hash_uint32((int32)PG_GETARG_CHAR(0));
}

Datum hashint1(PG_FUNCTION_ARGS)
{
    return hash_uint32((int32)PG_GETARG_UINT8(0));
}

Datum hashint2(PG_FUNCTION_ARGS)
{
    return hash_uint32((int32)PG_GETARG_INT16(0));
}

Datum hashint4(PG_FUNCTION_ARGS)
{
    return hash_uint32(PG_GETARG_INT32(0));
}

Datum hashint8(PG_FUNCTION_ARGS)
{
    /*
     * The idea here is to produce a hash value compatible with the values
     * produced by hashint4 and hashint2 for logically equal inputs; this is
     * necessary to support cross-type hash joins across these input types.
     * Since all three types are signed, we can xor the high half of the int8
     * value if the sign is positive, or the complement of the high half when
     * the sign is negative.
     */
    int64 val = PG_GETARG_INT64(0);
    uint32 lohalf = (uint32)val;
    uint32 hihalf = (uint32)((uint64)val >> 32);

    lohalf ^= (val >= 0) ? hihalf : ~hihalf;

    return hash_uint32(lohalf);
}

Datum hashoid(PG_FUNCTION_ARGS)
{
    return hash_uint32((uint32)PG_GETARG_OID(0));
}

Datum hashenum(PG_FUNCTION_ARGS)
{
    return hash_uint32((uint32)PG_GETARG_OID(0));
}

Datum hashfloat4(PG_FUNCTION_ARGS)
{
    float4 key = PG_GETARG_FLOAT4(0);
    float8 key8;

    /*
     * On IEEE-float machines, minus zero and zero have different bit patterns
     * but should compare as equal.  We must ensure that they have the same
     * hash value, which is most reliably done this way:
     */
    if (key == (float4)0)
        PG_RETURN_UINT32(0);

    /*
     * To support cross-type hashing of float8 and float4, we want to return
     * the same hash value hashfloat8 would produce for an equal float8 value.
     * So, widen the value to float8 and hash that.  (We must do this rather
     * than have hashfloat8 try to narrow its value to float4; that could fail
     * on overflow.)
     */
    key8 = key;

    return hash_any((unsigned char *)&key8, sizeof(key8));
}

Datum hashfloat8(PG_FUNCTION_ARGS)
{
    float8 key = PG_GETARG_FLOAT8(0);
    /*
     * On IEEE-float machines, minus zero and zero have different bit patterns
     * but should compare as equal.  We must ensure that they have the same
     * hash value, which is most reliably done this way:
     */
    if (key == (float8)0)
        PG_RETURN_UINT32(0);

    return hash_any((unsigned char *)&key, sizeof(key));
}

Datum hashoidvector(PG_FUNCTION_ARGS)
{
    oidvector *key = (oidvector *)PG_GETARG_POINTER(0);

    return hash_any((unsigned char *)key->values, key->dim1 * sizeof(Oid));
}

Datum hashint2vector(PG_FUNCTION_ARGS)
{
    int2vector *key = (int2vector *)PG_GETARG_POINTER(0);

    return hash_any((unsigned char *)key->values, key->dim1 * sizeof(int2));
}

Datum hashname(PG_FUNCTION_ARGS)
{
    char *key = NameStr(*PG_GETARG_NAME(0));
    unsigned keylen = strlen(key);

    return hash_any((unsigned char *)key, keylen);
}

Datum hashtext(PG_FUNCTION_ARGS)
{
    text *key = PG_GETARG_TEXT_PP(0);
    Datum result;
    Oid collid = PG_GET_COLLATION();

    FUNC_CHECK_HUGE_POINTER(false, key, "hashtext()");

    if (is_b_format_collation(collid)) {
        result = hash_text_by_builtin_collations((unsigned char *)VARDATA_ANY(key), VARSIZE_ANY_EXHDR(key), collid);
        PG_FREE_IF_COPY(key, 0);
        return result;
    }

#ifdef PGXC
    if (g_instance.attr.attr_sql.string_hash_compatible) {
        result = hash_any((unsigned char *)VARDATA_ANY(key), bcTruelen(key));
    } else {
#endif
        /*
         * Note: this is currently identical in behavior to hashvarlena, but keep
         * it as a separate function in case we someday want to do something
         * different in non-C locales.	(See also hashbpchar, if so.)
         */
        result = hash_any((unsigned char *)VARDATA_ANY(key), VARSIZE_ANY_EXHDR(key));
#ifdef PGXC
    }
#endif

    /* Avoid leaking memory for toasted inputs */
    PG_FREE_IF_COPY(key, 0);

    return result;
}

/*
 * hashvarlena() can be used for any varlena datatype in which there are
 * no non-significant bits, ie, distinct bitpatterns never compare as equal.
 */
Datum hashvarlena(PG_FUNCTION_ARGS)
{
    struct varlena *key = PG_GETARG_VARLENA_PP(0);
    Datum result;

#ifdef PGXC
    if (g_instance.attr.attr_sql.string_hash_compatible) {
        result = hash_any((unsigned char *)VARDATA_ANY(key), bcTruelen(key));
    } else {
#endif
        result = hash_any((unsigned char *)VARDATA_ANY(key), VARSIZE_ANY_EXHDR(key));
#ifdef PGXC
    }
#endif

    /* Avoid leaking memory for toasted inputs */
    PG_FREE_IF_COPY(key, 0);

    return result;
}

/*
 * This hash function was written by Bob Jenkins
 * (bob_jenkins@burtleburtle.net), and superficially adapted
 * for PostgreSQL by Neil Conway. For more information on this
 * hash function, see http://burtleburtle.net/bob/hash/doobs.html,
 * or Bob's article in Dr. Dobb's Journal, Sept. 1997.
 *
 * In the current code, we have adopted Bob's 2006 update of his hash
 * function to fetch the data a word at a time when it is suitably aligned.
 * This makes for a useful speedup, at the cost of having to maintain
 * four code paths (aligned vs unaligned, and little-endian vs big-endian).
 * It also uses two separate mixing functions mix() and final(), instead
 * of a slower multi-purpose function.
 */
/* Get a bit mask of the bits set in non-uint32 aligned addresses */
#define UINT32_ALIGN_MASK (sizeof(uint32) - 1)

/* Rotate a uint32 value left by k bits - note multiple evaluation! */
#define rot(x, k) (((x) << (k)) | ((x) >> (32 - (k))))

/* ----------
 * mix -- mix 3 32-bit values reversibly.
 *
 * This is reversible, so any information in (a,b,c) before mix() is
 * still in (a,b,c) after mix().
 *
 * If four pairs of (a,b,c) inputs are run through mix(), or through
 * mix() in reverse, there are at least 32 bits of the output that
 * are sometimes the same for one pair and different for another pair.
 * This was tested for:
 * * pairs that differed by one bit, by two bits, in any combination
 *	 of top bits of (a,b,c), or in any combination of bottom bits of (a,b,c).
 * * "differ" is defined as +, -, ^, or ~^.  For + and -, I transformed
 *	 the output delta to a Gray code (a^(a>>1)) so a string of 1's (as
 *	 is commonly produced by subtraction) look like a single 1-bit
 *	 difference.
 * * the base values were pseudorandom, all zero but one bit set, or
 *	 all zero plus a counter that starts at zero.
 *
 * This does not achieve avalanche.  There are input bits of (a,b,c)
 * that fail to affect some output bits of (a,b,c), especially of a.  The
 * most thoroughly mixed value is c, but it doesn't really even achieve
 * avalanche in c.
 *
 * This allows some parallelism.  Read-after-writes are good at doubling
 * the number of bits affected, so the goal of mixing pulls in the opposite
 * direction from the goal of parallelism.	I did what I could.  Rotates
 * seem to cost as much as shifts on every machine I could lay my hands on,
 * and rotates are much kinder to the top and bottom bits, so I used rotates.
 * ----------
 */
#define mix(a, b, c)       \
    {                      \
        a -= (c);          \
        a ^= (rot(c, 4));  \
        c += (b);          \
        b -= (a);          \
        b ^= (rot(a, 6));  \
        a += (c);          \
        c -= (b);          \
        c ^= (rot(b, 8));  \
        b += (a);          \
        a -= (c);          \
        a ^= (rot(c, 16)); \
        c += (b);          \
        b -= (a);          \
        b ^= (rot(a, 19)); \
        a += (c);          \
        c -= (b);          \
        c ^= (rot(b, 4));  \
        b += (a);          \
    }

/* ----------
 * final -- final mixing of 3 32-bit values (a,b,c) into c
 *
 * Pairs of (a,b,c) values differing in only a few bits will usually
 * produce values of c that look totally different.  This was tested for
 * * pairs that differed by one bit, by two bits, in any combination
 *	 of top bits of (a,b,c), or in any combination of bottom bits of (a,b,c).
 * * "differ" is defined as +, -, ^, or ~^.  For + and -, I transformed
 *	 the output delta to a Gray code (a^(a>>1)) so a string of 1's (as
 *	 is commonly produced by subtraction) look like a single 1-bit
 *	 difference.
 * * the base values were pseudorandom, all zero but one bit set, or
 *	 all zero plus a counter that starts at zero.
 *
 * The use of separate functions for mix() and final() allow for a
 * substantial performance increase since final() does not need to
 * do well in reverse, but is does need to affect all output bits.
 * mix(), on the other hand, does not need to affect all output
 * bits (affecting 32 bits is enough).	The original hash function had
 * a single mixing operation that had to satisfy both sets of requirements
 * and was slower as a result.
 * ----------
 */
#define final(a, b, c)     \
    {                      \
        c ^= (b);          \
        c -= (rot(b, 14)); \
        a ^= (c);          \
        a -= (rot(c, 11)); \
        b ^= (a);          \
        b -= (rot(a, 25)); \
        c ^= (b);          \
        c -= (rot(b, 16)); \
        a ^= (c);          \
        a -= (rot(c, 4));  \
        b ^= (a);          \
        b -= (rot(a, 14)); \
        c ^= (b);          \
        c -= (rot(b, 24)); \
    }

/*
 * hash_any() -- hash a variable-length key into a 32-bit value
 *		k		: the key (the unaligned variable-length array of bytes)
 *		len		: the length of the key, counting by bytes
 *
 * Returns a uint32 value.	Every bit of the key affects every bit of
 * the return value.  Every 1-bit and 2-bit delta achieves avalanche.
 * About 6*len+35 instructions. The best hash table sizes are powers
 * of 2.  There is no need to do mod a prime (mod is sooo slow!).
 * If you need less than 32 bits, use a bitmask.
 *
 * Note: we could easily change this function to return a 64-bit hash value
 * by using the final values of both b and c.  b is perhaps a little less
 * well mixed than c, however.
 */
Datum hash_any(register const unsigned char *k, register int keylen)
{
    register uint32 a, b, c, len;

    /* Set up the internal state */
    len = (uint32)keylen;
    a = b = c = 0x9e3779b9 + len + 3923095;

    /* If the source pointer is word-aligned, we use word-wide fetches */
    if (((intptr_t)k & UINT32_ALIGN_MASK) == 0) {
        /* Code path for aligned source data */
        register const uint32 *ka = (const uint32 *)k;

        /* handle most of the key */
        while (len >= 12) {
            a += ka[0];
            b += ka[1];
            c += ka[2];
            mix(a, b, c);
            ka += 3;
            len -= 12;
        }

        /* handle the last 11 bytes */
        k = (const unsigned char *)ka;
#ifdef WORDS_BIGENDIAN
        switch (len) {
            case 11:
                c += ((uint32)k[10] << 8);
            /* fall-through */
            case 10:
                c += ((uint32)k[9] << 16);
            /* fall-through */
            case 9:
                c += ((uint32)k[8] << 24);
            /* the lowest byte of c is reserved for the length */
            /* fall-through */
            case 8:
                b += ka[1];
                a += ka[0];
                break;
            case 7:
                b += ((uint32)k[6] << 8);
            /* fall-through */
            case 6:
                b += ((uint32)k[5] << 16);
            /* fall-through */
            case 5:
                b += ((uint32)k[4] << 24);
            /* fall-through */
            case 4:
                a += ka[0];
                break;
            case 3:
                a += ((uint32)k[2] << 8);
            /* fall-through */
            case 2:
                a += ((uint32)k[1] << 16);
            /* fall-through */
            case 1:
                a += ((uint32)k[0] << 24);
            /* case 0: nothing left to add */
            /* fall-through */
            default:
                break;
        }
#else  /* !WORDS_BIGENDIAN */
        switch (len) {
            case 11:
                c += ((uint32)k[10] << 24);
            /* fall-through */
            case 10:
                c += ((uint32)k[9] << 16);
            /* fall-through */
            case 9:
                c += ((uint32)k[8] << 8);
            /* the lowest byte of c is reserved for the length */
            /* fall-through */
            case 8:
                b += ka[1];
                a += ka[0];
                break;
            case 7:
                b += ((uint32)k[6] << 16);
            /* fall-through */
            case 6:
                b += ((uint32)k[5] << 8);
            /* fall-through */
            case 5:
                b += k[4];
            /* fall-through */
            case 4:
                a += ka[0];
                break;
            case 3:
                a += ((uint32)k[2] << 16);
            /* fall-through */
            case 2:
                a += ((uint32)k[1] << 8);
            /* fall-through */
            case 1:
                a += k[0];
            /* case 0: nothing left to add */
            /* fall-through */
            default:
                break;
        }
#endif /* WORDS_BIGENDIAN */
    } else {
        /* Code path for non-aligned source data */
        while (len >= 12) { /* handle most of the key */
#ifdef WORDS_BIGENDIAN
            a += (k[3] + ((uint32)k[2] << 8) + ((uint32)k[1] << 16) + ((uint32)k[0] << 24));
            b += (k[7] + ((uint32)k[6] << 8) + ((uint32)k[5] << 16) + ((uint32)k[4] << 24));
            c += (k[11] + ((uint32)k[10] << 8) + ((uint32)k[9] << 16) + ((uint32)k[8] << 24));
#else  /* !WORDS_BIGENDIAN */
            a += (k[0] + ((uint32)k[1] << 8) + ((uint32)k[2] << 16) + ((uint32)k[3] << 24));
            b += (k[4] + ((uint32)k[5] << 8) + ((uint32)k[6] << 16) + ((uint32)k[7] << 24));
            c += (k[8] + ((uint32)k[9] << 8) + ((uint32)k[10] << 16) + ((uint32)k[11] << 24));
#endif /* WORDS_BIGENDIAN */
            mix(a, b, c);
            k += 12;
            len -= 12;
        }

        /* handle the last 11 bytes */
#ifdef WORDS_BIGENDIAN
        switch (len) {
            /* all the case statements fall through */
            case 11:
                c += ((uint32)k[10] << 8);
            /* fall-through */
            case 10:
                c += ((uint32)k[9] << 16);
            /* fall-through */
            case 9:
                c += ((uint32)k[8] << 24);
            /* the lowest byte of c is reserved for the length */
            /* fall-through */
            case 8:
                b += k[7];
            /* fall-through */
            case 7:
                b += ((uint32)k[6] << 8);
            /* fall-through */
            case 6:
                b += ((uint32)k[5] << 16);
            /* fall-through */
            case 5:
                b += ((uint32)k[4] << 24);
            /* fall-through */
            case 4:
                a += k[3];
            /* fall-through */
            case 3:
                a += ((uint32)k[2] << 8);
            /* fall-through */
            case 2:
                a += ((uint32)k[1] << 16);
            /* fall-through */
            case 1:
                a += ((uint32)k[0] << 24);
            /* case 0: nothing left to add */
            /* fall-through */
            default:
                break;
        }
#else  /* !WORDS_BIGENDIAN */
        switch (len) {
            /* all the case statements fall through */
            case 11:
                c += ((uint32)k[10] << 24);
            /* fall-through */
            case 10:
                c += ((uint32)k[9] << 16);
            /* fall-through */
            case 9:
                c += ((uint32)k[8] << 8);
            /* the lowest byte of c is reserved for the length */
            /* fall-through */
            case 8:
                b += ((uint32)k[7] << 24);
            /* fall-through */
            case 7:
                b += ((uint32)k[6] << 16);
            /* fall-through */
            case 6:
                b += ((uint32)k[5] << 8);
            /* fall-through */
            case 5:
                b += k[4];
            /* fall-through */
            case 4:
                a += ((uint32)k[3] << 24);
            /* fall-through */
            case 3:
                a += ((uint32)k[2] << 16);
            /* fall-through */
            case 2:
                a += ((uint32)k[1] << 8);
            /* fall-through */
            case 1:
                a += k[0];
            /* case 0: nothing left to add */
            /* fall-through */
            default:
                break;
        }
#endif /* WORDS_BIGENDIAN */
    }

    final(a, b, c);

    /* report the result */
    return UInt32GetDatum(c);
}

/*
 * hash_new_uint32() -- hash a 32-bit value
 * This is a new hash function, which is different from
 * hash_uint32.
 */
Datum hash_new_uint32(uint32 k)
{
    register uint32 a, b, c;

    a = 0xdeadbeef + k;
    b = 0xdeadbeef;
    c = 3923095 + (uint32)sizeof(uint32);

    mix(a, b, c);

    /* report the result */
    return UInt32GetDatum(c);
}

/*
 * hash_uint32() -- hash a 32-bit value
 *
 * This has the same result as: hash_any(&k, sizeof(uint32))
 * but is faster and doesn't force the caller to store k into memory.
 */
Datum hash_uint32(uint32 k)
{
    register uint32 a, b, c;

    a = b = c = 0x9e3779b9 + (uint32)sizeof(uint32) + 3923095;
    a += k;

    final(a, b, c);

    /* report the result */
    return UInt32GetDatum(c);
}

#ifdef PGXC
/*
 * compute_hash() -- Generic hash function for all datatypes
 */
Datum compute_hash(Oid type, Datum value, char locator, Oid collation)
{
    uint8 tmp8;
    int16 tmp16;
    int32 tmp32;
    int64 tmp64;
    Oid tmpoid;
    char tmpch;

    switch (type) {
        case INT8OID:
            /* This gives added advantage that
             *	a = 8446744073709551359
             * and	a = 8446744073709551359::int8 both work */
            tmp64 = DatumGetInt64(value);
            if (locator == LOCATOR_TYPE_HASH)
                return DirectFunctionCall1(hashint8, value);
            return tmp64;
        case INT1OID:
            tmp8 = DatumGetUInt8(value);
            if (locator == LOCATOR_TYPE_HASH)
                return DirectFunctionCall1(hashint1, tmp8);
            return tmp8;
        case INT2OID:
            tmp16 = DatumGetInt16(value);
            if (locator == LOCATOR_TYPE_HASH)
                return DirectFunctionCall1(hashint2, tmp16);
            return tmp16;
        case OIDOID:
            tmpoid = DatumGetObjectId(value);
            if (locator == LOCATOR_TYPE_HASH)
                return DirectFunctionCall1(hashoid, tmpoid);
            return tmpoid;
        case INT4OID:
            tmp32 = DatumGetInt32(value);
            if (locator == LOCATOR_TYPE_HASH)
                return DirectFunctionCall1(hashint4, tmp32);
            return tmp32;
        case BOOLOID:
            tmpch = (char)DatumGetBool(value);
            if (locator == LOCATOR_TYPE_HASH)
                return DirectFunctionCall1(hashchar, tmpch);
            return tmpch;

        case CHAROID:
            return DirectFunctionCall1(hashchar, value);
        case NAMEOID:
            return DirectFunctionCall1(hashname, value);
        case INT2VECTOROID:
            return DirectFunctionCall1(hashint2vector, value);

        case CLOBOID:
        case NVARCHAR2OID:
        case VARCHAROID:
        case TEXTOID:
            return DirectFunctionCall1Coll(hashtext, collation, value);

        case OIDVECTOROID:
            return DirectFunctionCall1(hashoidvector, value);
        case FLOAT4OID:
            return DirectFunctionCall1(hashfloat4, value);
        case FLOAT8OID:
            return DirectFunctionCall1(hashfloat8, value);

        case ABSTIMEOID:
            tmp32 = DatumGetAbsoluteTime(value);
            if (locator == LOCATOR_TYPE_HASH)
                return DirectFunctionCall1(hashint4, tmp32);
            return tmp32;
        case RELTIMEOID:
            tmp32 = DatumGetRelativeTime(value);
            if (locator == LOCATOR_TYPE_HASH)
                return DirectFunctionCall1(hashint4, tmp32);
            return tmp32;
        case CASHOID:
            return DirectFunctionCall1(hashint8, value);

        case BPCHAROID:
            return DirectFunctionCall1Coll(hashbpchar, collation, value);

        case RAWOID:
        case BYTEAOID:
        case BYTEAWITHOUTORDERCOLOID:
        case BYTEAWITHOUTORDERWITHEQUALCOLOID:
            return DirectFunctionCall1(hashvarlena, value);
        case DATEOID:
            tmp32 = DatumGetDateADT(value);
            if (locator == LOCATOR_TYPE_HASH)
                return DirectFunctionCall1(hashint4, tmp32);
            return tmp32;
        case TIMEOID:
            return DirectFunctionCall1(time_hash, value);
        case TIMESTAMPOID:
            return DirectFunctionCall1(timestamp_hash, value);
        case TIMESTAMPTZOID:
            return DirectFunctionCall1(timestamp_hash, value);
        case INTERVALOID:
            return DirectFunctionCall1(interval_hash, value);
        case TIMETZOID:
            return DirectFunctionCall1(timetz_hash, value);
        case SMALLDATETIMEOID:
            return DirectFunctionCall1(timestamp_hash, value);

        case NUMERICOID:
            return DirectFunctionCall1(hash_numeric, value);
        case UUIDOID:
            return DirectFunctionCall1(uuid_hash, value);

        default:
            if (u_sess->hook_cxt.computeHashHook != NULL) {
                return ((computeHashFunc)(u_sess->hook_cxt.computeHashHook))(type, value, locator);
            }
            ereport(ERROR, (errcode(ERRCODE_WRONG_OBJECT_TYPE),
                            errmsg("Unhandled datatype for modulo or hash distribution\n")));
    }
    /* Control should not come here. */
    ereport(ERROR,
            (errcode(ERRCODE_WRONG_OBJECT_TYPE), errmsg("Unhandled datatype for modulo or hash distribution\n")));
    /* Keep compiler silent */
    return (Datum)0;
}

uint32 hashValueCombination(uint32 hashValue, Oid colType, Datum val, bool allIsNull, char locatorType, Oid collation)
{
    if (!allIsNull) {
        hashValue = (hashValue << 1) | ((hashValue & 0x80000000) ? 1 : 0);
        hashValue ^= (uint32)compute_hash(colType, val, locatorType, collation);
    } else {
        hashValue = (uint32)compute_hash(colType, val, locatorType, collation);
    }
    return hashValue;
}

/*
 * get_compute_hash_function
 * Get hash function name depending on the hash type.
 * For some cases of hash or modulo distribution, a function might
 * be required or not.
 */
char *get_compute_hash_function(Oid type, char locator)
{
    switch (type) {
        case INT8OID:
            if (locator == LOCATOR_TYPE_HASH)
                return "hashint8";
            return NULL;
        case INT2OID:
            if (locator == LOCATOR_TYPE_HASH)
                return "hashint2";
            return NULL;
        case OIDOID:
            if (locator == LOCATOR_TYPE_HASH)
                return "hashoid";
            return NULL;
        case DATEOID:
        case INT4OID:
            if (locator == LOCATOR_TYPE_HASH)
                return "hashint4";
            return NULL;
        case BOOLOID:
            if (locator == LOCATOR_TYPE_HASH)
                return "hashchar";
            return NULL;
        case CHAROID:
            return "hashchar";
        case NAMEOID:
            return "hashname";
        case INT2VECTOROID:
            return "hashint2vector";
        case CLOBOID:
        case VARCHAROID:
        case TEXTOID:
            return "hashtext";
        case OIDVECTOROID:
            return "hashoidvector";
        case FLOAT4OID:
            return "hashfloat4";
        case FLOAT8OID:
            return "hashfloat8";
        case RELTIMEOID:
        case ABSTIMEOID:
            if (locator == LOCATOR_TYPE_HASH)
                return "hashint4";
            return NULL;
        case CASHOID:
            return "hashint8";
        case BPCHAROID:
            return "hashbpchar";
        case BYTEAWITHOUTORDERWITHEQUALCOLOID:
        case BYTEAWITHOUTORDERCOLOID:
        case BYTEAOID:
            return "hashvarlena";
        case TIMEOID:
            return "time_hash";
        case TIMESTAMPOID:
        case TIMESTAMPTZOID:
            return "timestamp_hash";
        case INTERVALOID:
            return "interval_hash";
        case TIMETZOID:
            return "timetz_hash";
        case NUMERICOID:
            return "hash_numeric";
        case UUIDOID:
            return "uuid_hash";

        default:
            ereport(ERROR, (errcode(ERRCODE_WRONG_OBJECT_TYPE),
                            errmsg("Unhandled datatype for modulo or hash distribution\n")));
    }

    /* Keep compiler quiet */
    return NULL;
}

Datum bucketint4(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(INT4OID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(INT4OID, value, LOCATOR_TYPE_MODULO);
    }

    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketint2(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(INT2OID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(INT2OID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketint8(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(INT8OID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(INT8OID, value, LOCATOR_TYPE_MODULO);
    }

    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}
Datum bucketint1(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(INT1OID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(INT1OID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketbpchar(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;
    int collation = is_b_format_collation(PG_GET_COLLATION()) ? PG_GET_COLLATION() : InvalidOid;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(BPCHAROID, value, LOCATOR_TYPE_HASH, collation);
    } else {
        hashValue = (long)compute_hash(BPCHAROID, value, LOCATOR_TYPE_MODULO, collation);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}
Datum bucketchar(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(CHAROID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(CHAROID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketvarchar(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;
    int collation = is_b_format_collation(PG_GET_COLLATION()) ? PG_GET_COLLATION() : InvalidOid;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(VARCHAROID, value, LOCATOR_TYPE_HASH, collation);
    } else {
        hashValue = (long)compute_hash(VARCHAROID, value, LOCATOR_TYPE_MODULO, collation);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketnvarchar2(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;
    int collation = is_b_format_collation(PG_GET_COLLATION()) ? PG_GET_COLLATION() : InvalidOid;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(NVARCHAR2OID, value, LOCATOR_TYPE_HASH, collation);
    } else {
        hashValue = (long)compute_hash(NVARCHAR2OID, value, LOCATOR_TYPE_MODULO, collation);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}
Datum bucketdate(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(DATEOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(DATEOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum buckettime(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(TIMEOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(TIMEOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum buckettimestamp(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(TIMESTAMPOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(TIMESTAMPOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum buckettimestamptz(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(TIMESTAMPTZOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(TIMESTAMPTZOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketinterval(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(INTERVALOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(INTERVALOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}
Datum buckettimetz(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(TIMETZOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(TIMETZOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketsmalldatetime(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(SMALLDATETIMEOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(SMALLDATETIMEOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketnumeric(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(NUMERICOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(NUMERICOID, value, LOCATOR_TYPE_MODULO);
    }

    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

/* useful when g_instance.attr.attr_common.support_extended_features is on */
Datum bucketoid(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(OIDOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(OIDOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketabstime(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) /* hash */
        hashValue = (long)compute_hash(ABSTIMEOID, value, LOCATOR_TYPE_HASH);
    else
        hashValue = (long)compute_hash(ABSTIMEOID, value, LOCATOR_TYPE_MODULO);
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketreltime(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(RELTIMEOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(RELTIMEOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketcash(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(CASHOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(CASHOID, value, LOCATOR_TYPE_MODULO);
    }

    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketbytea(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(BYTEAOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(BYTEAOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketraw(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(RAWOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(RAWOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketbool(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(BOOLOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(BOOLOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketname(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(NAMEOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(NAMEOID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketint2vector(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(INT2VECTOROID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(INT2VECTOROID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum buckettext(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;
    int collation = is_b_format_collation(PG_GET_COLLATION()) ? PG_GET_COLLATION() : InvalidOid;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(TEXTOID, value, LOCATOR_TYPE_HASH, collation);
    } else {
        hashValue = (long)compute_hash(TEXTOID, value, LOCATOR_TYPE_MODULO, collation);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketuuid(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(UUIDOID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(UUIDOID, value, LOCATOR_TYPE_MODULO);
    }

    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketoidvector(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(OIDVECTOROID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(OIDVECTOROID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketfloat4(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(FLOAT4OID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(FLOAT4OID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

Datum bucketfloat8(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    int bucket;
    Datum result;
    Datum value = PG_GETARG_DATUM(0);
    int flag = PG_GETARG_INT32(1);
    long hashValue;

    if (flag == 0) { /* hash */
        hashValue = (long)compute_hash(FLOAT8OID, value, LOCATOR_TYPE_HASH);
    } else {
        hashValue = (long)compute_hash(FLOAT8OID, value, LOCATOR_TYPE_MODULO);
    }
    bucket = compute_modulo(abs(hashValue), BUCKETDATALEN);
    result = Int32GetDatum(bucket);
    return result;
#endif
}

#ifdef ENABLE_MULTIPLE_NODES
static Datum getBucketInternal(Datum array, char flag, int bucketcnt, bool *allIsNull)
{
    HeapTupleHeader td;
    Oid tupType;
    int32 tupTypmod;
    TupleDesc tupdesc;
    HeapTupleData tmptup;
    HeapTupleData *tuple = NULL;
    uint32 hashValue = 0;
    Datum result = 0;
    bool isnull = false;
    int i = 0;
    int bucket;

    errno_t rc = memset_s(&tmptup, sizeof(tmptup), 0, sizeof(tmptup));
    securec_check(rc, "", "");

    td = DatumGetHeapTupleHeader(array);

    tupType = HeapTupleHeaderGetTypeId(td);
    tupTypmod = HeapTupleHeaderGetTypMod(td);
    tupdesc = lookup_rowtype_tupdesc(tupType, tupTypmod);

    tmptup.t_len = HeapTupleHeaderGetDatumLength(td);
    tmptup.t_data = td;
    tuple = &tmptup;
    *allIsNull = true;

    for (i = 0; i < tupdesc->natts; i++) {
        Datum val = heap_getattr(tuple, i + 1, tupdesc, &isnull);
        Oid colType = tupdesc->attrs[i].atttypid;
        if (!isnull) {
            hashValue = hashValueCombination(hashValue, colType, val, *allIsNull, flag);
            *allIsNull = false;
        }
    }
    ReleaseTupleDesc(tupdesc);
    if (*allIsNull == false) {
        bucket = compute_modulo(abs((int)hashValue), bucketcnt);
        result = Int32GetDatum(bucket);
        return result;
    } else {
        return (Datum)0;
    }
}
#endif

/* Get bucket from distribute columns with bucketcnt */
Datum getbucketbycnt(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    Datum array = PG_GETARG_DATUM(0);
    char flag = PG_GETARG_CHAR(1);
    int bucketcnt = PG_GETARG_INT32(2);
    bool allIsNull = false;
    Datum ret = getBucketInternal(array, flag, bucketcnt, &allIsNull);

    if (allIsNull) {
        PG_RETURN_NULL();
    } else {
        return ret;
    }
#endif
}

/* Get bucket from distribute columns */
Datum getbucket(PG_FUNCTION_ARGS)
{
#ifndef ENABLE_MULTIPLE_NODES
    EREPORT_UNSUPPORTED_FEATURE_IN_SINGLE_MODE;

    PG_RETURN_NULL();
#else
    Datum array = PG_GETARG_DATUM(0);
    char flag = PG_GETARG_CHAR(1);
    bool allIsNull = false;
    Datum ret = getBucketInternal(array, flag, BUCKETDATALEN, &allIsNull);

    if (allIsNull) {
        PG_RETURN_NULL();
    } else {
        return ret;
    }

#endif
}

uint32 hash_multikey(MultiHashKey *mkeys)
{
    uint32 hashValue = 0;
    bool allIsNull = true;
    char locatorType = mkeys->locatorType;

    for (uint32 i = 0; i < mkeys->keyNum; i++) {
        if (!mkeys->isNulls[i]) {
            hashValue = hashValueCombination(hashValue, mkeys->keyTypes[i], mkeys->keyValues[i], allIsNull,
                                             locatorType);
            allIsNull = false;
        }
    }

    return hashValue;
}

ScalarVector *vgetbucket(PG_FUNCTION_ARGS)
{
    VectorBatch *batch = (VectorBatch *)PG_GETARG_DATUM(0);
    ScalarVector *vecflag = PG_GETARG_VECTOR(1);
    char flag = (char)vecflag->m_vals[0];
    ScalarVector *presultVector = PG_GETARG_VECTOR(3);

    int32 nvalues = PG_GETARG_INT32(2);
    ScalarValue *presult = PG_GETARG_VECVAL(3);
    uint8 *pflagsRes = (uint8 *)(PG_GETARG_VECTOR(3)->m_flag);
    bool *pselection = PG_GETARG_SELECTION(4);

    uint32 hashValue[BatchMaxSize] = {0};
    bool allIsNull[BatchMaxSize];
    ScalarVector *pDistributeVec = NULL;
    Datum val = 0;
    errno_t rc;

    rc = memset_s(allIsNull, BatchMaxSize, 1, BatchMaxSize);
    securec_check(rc, "", "");

    if (pselection == NULL) {
        for (int j = 0; j < batch->m_cols; j++) {
            pDistributeVec = &batch->m_arr[j];
            Oid colType = pDistributeVec->m_desc.typeId;

            for (int i = 0; i < nvalues; i++) {
                val = pDistributeVec->m_vals[i];

                if (!pDistributeVec->IsNull(i)) {
                    /* For vector data, the data types (INTERVALOID and TIMETZOID)
                     * adds a byte to store the length of the data
                     */
                    if (colType == INTERVALOID || colType == TIMETZOID) {
                        val = PointerGetDatum((char *)val + VARHDRSZ_SHORT);
                    }
                    hashValue[i] = hashValueCombination(hashValue[i], colType, val, allIsNull[i], flag);
                    allIsNull[i] = false;
                }
            }
        }

        for (int i = 0; i < nvalues; i++) {
            if (!allIsNull[i]) {
                int bucket = compute_modulo(abs((int)hashValue[i]), BUCKETDATALEN);
                presult[i] = Int32GetDatum(bucket);
                SET_NOTNULL(pflagsRes[i]);
            } else {
                SET_NULL(pflagsRes[i]);
            }
        }
    } else {
        for (int j = 0; j < batch->m_cols; j++) {
            pDistributeVec = &batch->m_arr[j];
            Oid colType = pDistributeVec->m_desc.typeId;

            for (int i = 0; i < nvalues; i++) {
                if (pselection[i]) {
                    val = pDistributeVec->m_vals[i];
                    if (!pDistributeVec->IsNull(i)) {
                        /* For vector data, the data types (INTERVALOID and TIMETZOID)
                         * adds a byte to store the length of the data
                         */
                        if (colType == INTERVALOID || colType == TIMETZOID) {
                            val = PointerGetDatum((char *)val + VARHDRSZ_SHORT);
                        }
                        hashValue[i] = hashValueCombination(hashValue[i], colType, val, allIsNull[i], flag);
                        allIsNull[i] = false;
                    }
                }
            }
        }

        for (int i = 0; i < nvalues; i++) {
            if (pselection[i]) {
                if (!allIsNull[i]) {
                    int bucket = compute_modulo(abs((int)hashValue[i]), BUCKETDATALEN);
                    presult[i] = Int32GetDatum(bucket);
                    SET_NOTNULL(pflagsRes[i]);
                } else {
                    SET_NULL(pflagsRes[i]);
                }
            }
        }
    }

    presultVector->m_rows = nvalues;

    return presultVector;
}
#endif