mirror of https://github.com/citusdata/citus.git
Merge pull request #1353 from citusdata/fix_copy_crasher
Refactor COPY to not directly use cache entry
cr: @marcocitus
pull/1361/head
commit
905ca98a9b
|
@ -1753,12 +1753,6 @@ CitusCopyDestReceiverStartup(DestReceiver *dest, int operation,
|
||||||
/* keep the table metadata to avoid looking it up for every tuple */
|
/* keep the table metadata to avoid looking it up for every tuple */
|
||||||
copyDest->tableMetadata = cacheEntry;
|
copyDest->tableMetadata = cacheEntry;
|
||||||
|
|
||||||
/* determine whether to use binary search */
|
|
||||||
if (partitionMethod != DISTRIBUTE_BY_HASH || !cacheEntry->hasUniformHashDistribution)
|
|
||||||
{
|
|
||||||
copyDest->useBinarySearch = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (cacheEntry->replicationModel == REPLICATION_MODEL_2PC)
|
if (cacheEntry->replicationModel == REPLICATION_MODEL_2PC)
|
||||||
{
|
{
|
||||||
CoordinatedTransactionUse2PC();
|
CoordinatedTransactionUse2PC();
|
||||||
|
@ -1835,19 +1829,10 @@ CitusCopyDestReceiverReceive(TupleTableSlot *slot, DestReceiver *dest)
|
||||||
{
|
{
|
||||||
CitusCopyDestReceiver *copyDest = (CitusCopyDestReceiver *) dest;
|
CitusCopyDestReceiver *copyDest = (CitusCopyDestReceiver *) dest;
|
||||||
|
|
||||||
DistTableCacheEntry *tableMetadata = copyDest->tableMetadata;
|
|
||||||
char partitionMethod = tableMetadata->partitionMethod;
|
|
||||||
int partitionColumnIndex = copyDest->partitionColumnIndex;
|
int partitionColumnIndex = copyDest->partitionColumnIndex;
|
||||||
TupleDesc tupleDescriptor = copyDest->tupleDescriptor;
|
TupleDesc tupleDescriptor = copyDest->tupleDescriptor;
|
||||||
CopyStmt *copyStatement = copyDest->copyStatement;
|
CopyStmt *copyStatement = copyDest->copyStatement;
|
||||||
|
|
||||||
int shardCount = tableMetadata->shardIntervalArrayLength;
|
|
||||||
ShardInterval **shardIntervalCache = tableMetadata->sortedShardIntervalArray;
|
|
||||||
|
|
||||||
bool useBinarySearch = copyDest->useBinarySearch;
|
|
||||||
FmgrInfo *hashFunction = tableMetadata->hashFunction;
|
|
||||||
FmgrInfo *compareFunction = tableMetadata->shardIntervalCompareFunction;
|
|
||||||
|
|
||||||
HTAB *shardConnectionHash = copyDest->shardConnectionHash;
|
HTAB *shardConnectionHash = copyDest->shardConnectionHash;
|
||||||
CopyOutState copyOutState = copyDest->copyOutState;
|
CopyOutState copyOutState = copyDest->copyOutState;
|
||||||
FmgrInfo *columnOutputFunctions = copyDest->columnOutputFunctions;
|
FmgrInfo *columnOutputFunctions = copyDest->columnOutputFunctions;
|
||||||
|
@ -1907,10 +1892,7 @@ CitusCopyDestReceiverReceive(TupleTableSlot *slot, DestReceiver *dest)
|
||||||
* For reference table, this function blindly returns the tables single
|
* For reference table, this function blindly returns the tables single
|
||||||
* shard.
|
* shard.
|
||||||
*/
|
*/
|
||||||
shardInterval = FindShardInterval(partitionColumnValue, shardIntervalCache,
|
shardInterval = FindShardInterval(partitionColumnValue, copyDest->tableMetadata);
|
||||||
shardCount, partitionMethod,
|
|
||||||
compareFunction, hashFunction,
|
|
||||||
useBinarySearch);
|
|
||||||
if (shardInterval == NULL)
|
if (shardInterval == NULL)
|
||||||
{
|
{
|
||||||
ereport(ERROR, (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
|
ereport(ERROR, (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
|
||||||
|
|
|
@ -1974,8 +1974,9 @@ FindShardForInsert(Query *query, DeferredErrorMessage **planningError)
|
||||||
if (partitionMethod == DISTRIBUTE_BY_HASH || partitionMethod == DISTRIBUTE_BY_RANGE)
|
if (partitionMethod == DISTRIBUTE_BY_HASH || partitionMethod == DISTRIBUTE_BY_RANGE)
|
||||||
{
|
{
|
||||||
Datum partitionValue = partitionValueConst->constvalue;
|
Datum partitionValue = partitionValueConst->constvalue;
|
||||||
ShardInterval *shardInterval = FastShardPruning(distributedTableId,
|
DistTableCacheEntry *cacheEntry = DistributedTableCacheEntry(distributedTableId);
|
||||||
partitionValue);
|
ShardInterval *shardInterval = FindShardInterval(partitionValue, cacheEntry);
|
||||||
|
|
||||||
if (shardInterval != NULL)
|
if (shardInterval != NULL)
|
||||||
{
|
{
|
||||||
prunedShardList = list_make1(shardInterval);
|
prunedShardList = list_make1(shardInterval);
|
||||||
|
@ -2047,50 +2048,6 @@ FindShardForInsert(Query *query, DeferredErrorMessage **planningError)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
/*
|
|
||||||
* FastShardPruning is a higher level API for FindShardInterval function. Given the
|
|
||||||
* relationId of the distributed table and partitionValue, FastShardPruning function finds
|
|
||||||
* the corresponding shard interval that the partitionValue should be in. FastShardPruning
|
|
||||||
* returns NULL if no ShardIntervals exist for the given partitionValue.
|
|
||||||
*/
|
|
||||||
ShardInterval *
|
|
||||||
FastShardPruning(Oid distributedTableId, Datum partitionValue)
|
|
||||||
{
|
|
||||||
DistTableCacheEntry *cacheEntry = DistributedTableCacheEntry(distributedTableId);
|
|
||||||
int shardCount = cacheEntry->shardIntervalArrayLength;
|
|
||||||
ShardInterval **sortedShardIntervalArray = cacheEntry->sortedShardIntervalArray;
|
|
||||||
bool useBinarySearch = false;
|
|
||||||
char partitionMethod = cacheEntry->partitionMethod;
|
|
||||||
FmgrInfo *shardIntervalCompareFunction = cacheEntry->shardIntervalCompareFunction;
|
|
||||||
bool hasUniformHashDistribution = cacheEntry->hasUniformHashDistribution;
|
|
||||||
FmgrInfo *hashFunction = NULL;
|
|
||||||
ShardInterval *shardInterval = NULL;
|
|
||||||
|
|
||||||
/* determine whether to use binary search */
|
|
||||||
if (partitionMethod != DISTRIBUTE_BY_HASH || !hasUniformHashDistribution)
|
|
||||||
{
|
|
||||||
useBinarySearch = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* we only need hash functions for hash distributed tables */
|
|
||||||
if (partitionMethod == DISTRIBUTE_BY_HASH)
|
|
||||||
{
|
|
||||||
hashFunction = cacheEntry->hashFunction;
|
|
||||||
}
|
|
||||||
|
|
||||||
/*
|
|
||||||
* Call FindShardInterval to find the corresponding shard interval for the
|
|
||||||
* given partition value.
|
|
||||||
*/
|
|
||||||
shardInterval = FindShardInterval(partitionValue, sortedShardIntervalArray,
|
|
||||||
shardCount, partitionMethod,
|
|
||||||
shardIntervalCompareFunction, hashFunction,
|
|
||||||
useBinarySearch);
|
|
||||||
|
|
||||||
return shardInterval;
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* FindShardForUpdateOrDelete finds the shard interval in which an UPDATE or
|
* FindShardForUpdateOrDelete finds the shard interval in which an UPDATE or
|
||||||
* DELETE command should be applied, or sets planningError when the query
|
* DELETE command should be applied, or sets planningError when the query
|
||||||
|
|
|
@ -332,6 +332,7 @@ get_shard_id_for_distribution_column(PG_FUNCTION_ARGS)
|
||||||
char *distributionValueString = NULL;
|
char *distributionValueString = NULL;
|
||||||
Datum inputDatum = 0;
|
Datum inputDatum = 0;
|
||||||
Datum distributionValueDatum = 0;
|
Datum distributionValueDatum = 0;
|
||||||
|
DistTableCacheEntry *cacheEntry = DistributedTableCacheEntry(relationId);
|
||||||
|
|
||||||
/* if given table is not reference table, distributionValue cannot be NULL */
|
/* if given table is not reference table, distributionValue cannot be NULL */
|
||||||
if (PG_ARGISNULL(1))
|
if (PG_ARGISNULL(1))
|
||||||
|
@ -351,7 +352,7 @@ get_shard_id_for_distribution_column(PG_FUNCTION_ARGS)
|
||||||
distributionValueDatum = StringToDatum(distributionValueString,
|
distributionValueDatum = StringToDatum(distributionValueString,
|
||||||
distributionDataType);
|
distributionDataType);
|
||||||
|
|
||||||
shardInterval = FastShardPruning(relationId, distributionValueDatum);
|
shardInterval = FindShardInterval(distributionValueDatum, cacheEntry);
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
|
|
|
@ -23,9 +23,7 @@
|
||||||
#include "utils/memutils.h"
|
#include "utils/memutils.h"
|
||||||
|
|
||||||
|
|
||||||
static int FindShardIntervalIndex(Datum searchedValue, ShardInterval **shardIntervalCache,
|
static int FindShardIntervalIndex(Datum searchedValue, DistTableCacheEntry *cacheEntry);
|
||||||
int shardCount, char partitionMethod,
|
|
||||||
FmgrInfo *compareFunction, bool useBinarySearch);
|
|
||||||
static int SearchCachedShardInterval(Datum partitionColumnValue,
|
static int SearchCachedShardInterval(Datum partitionColumnValue,
|
||||||
ShardInterval **shardIntervalCache,
|
ShardInterval **shardIntervalCache,
|
||||||
int shardCount, FmgrInfo *compareFunction);
|
int shardCount, FmgrInfo *compareFunction);
|
||||||
|
@ -188,12 +186,7 @@ ShardIndex(ShardInterval *shardInterval)
|
||||||
Datum shardMinValue = shardInterval->minValue;
|
Datum shardMinValue = shardInterval->minValue;
|
||||||
|
|
||||||
DistTableCacheEntry *cacheEntry = DistributedTableCacheEntry(distributedTableId);
|
DistTableCacheEntry *cacheEntry = DistributedTableCacheEntry(distributedTableId);
|
||||||
ShardInterval **shardIntervalCache = cacheEntry->sortedShardIntervalArray;
|
|
||||||
int shardCount = cacheEntry->shardIntervalArrayLength;
|
|
||||||
char partitionMethod = cacheEntry->partitionMethod;
|
char partitionMethod = cacheEntry->partitionMethod;
|
||||||
FmgrInfo *compareFunction = cacheEntry->shardIntervalCompareFunction;
|
|
||||||
bool hasUniformHashDistribution = cacheEntry->hasUniformHashDistribution;
|
|
||||||
bool useBinarySearch = false;
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Note that, we can also support append and range distributed tables, but
|
* Note that, we can also support append and range distributed tables, but
|
||||||
|
@ -215,15 +208,7 @@ ShardIndex(ShardInterval *shardInterval)
|
||||||
return shardIndex;
|
return shardIndex;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* determine whether to use binary search */
|
shardIndex = FindShardIntervalIndex(shardMinValue, cacheEntry);
|
||||||
if (partitionMethod != DISTRIBUTE_BY_HASH || !hasUniformHashDistribution)
|
|
||||||
{
|
|
||||||
useBinarySearch = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
shardIndex = FindShardIntervalIndex(shardMinValue, shardIntervalCache,
|
|
||||||
shardCount, partitionMethod,
|
|
||||||
compareFunction, useBinarySearch);
|
|
||||||
|
|
||||||
return shardIndex;
|
return shardIndex;
|
||||||
}
|
}
|
||||||
|
@ -236,28 +221,24 @@ ShardIndex(ShardInterval *shardInterval)
|
||||||
* as NULL for them.
|
* as NULL for them.
|
||||||
*/
|
*/
|
||||||
ShardInterval *
|
ShardInterval *
|
||||||
FindShardInterval(Datum partitionColumnValue, ShardInterval **shardIntervalCache,
|
FindShardInterval(Datum partitionColumnValue, DistTableCacheEntry *cacheEntry)
|
||||||
int shardCount, char partitionMethod, FmgrInfo *compareFunction,
|
|
||||||
FmgrInfo *hashFunction, bool useBinarySearch)
|
|
||||||
{
|
{
|
||||||
Datum searchedValue = partitionColumnValue;
|
Datum searchedValue = partitionColumnValue;
|
||||||
int shardIndex = INVALID_SHARD_INDEX;
|
int shardIndex = INVALID_SHARD_INDEX;
|
||||||
|
|
||||||
if (partitionMethod == DISTRIBUTE_BY_HASH)
|
if (cacheEntry->partitionMethod == DISTRIBUTE_BY_HASH)
|
||||||
{
|
{
|
||||||
searchedValue = FunctionCall1(hashFunction, partitionColumnValue);
|
searchedValue = FunctionCall1(cacheEntry->hashFunction, partitionColumnValue);
|
||||||
}
|
}
|
||||||
|
|
||||||
shardIndex = FindShardIntervalIndex(searchedValue, shardIntervalCache,
|
shardIndex = FindShardIntervalIndex(searchedValue, cacheEntry);
|
||||||
shardCount, partitionMethod,
|
|
||||||
compareFunction, useBinarySearch);
|
|
||||||
|
|
||||||
if (shardIndex == INVALID_SHARD_INDEX)
|
if (shardIndex == INVALID_SHARD_INDEX)
|
||||||
{
|
{
|
||||||
return NULL;
|
return NULL;
|
||||||
}
|
}
|
||||||
|
|
||||||
return shardIntervalCache[shardIndex];
|
return cacheEntry->sortedShardIntervalArray[shardIndex];
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
@ -273,10 +254,14 @@ FindShardInterval(Datum partitionColumnValue, ShardInterval **shardIntervalCache
|
||||||
* fire this.
|
* fire this.
|
||||||
*/
|
*/
|
||||||
static int
|
static int
|
||||||
FindShardIntervalIndex(Datum searchedValue, ShardInterval **shardIntervalCache,
|
FindShardIntervalIndex(Datum searchedValue, DistTableCacheEntry *cacheEntry)
|
||||||
int shardCount, char partitionMethod, FmgrInfo *compareFunction,
|
|
||||||
bool useBinarySearch)
|
|
||||||
{
|
{
|
||||||
|
ShardInterval **shardIntervalCache = cacheEntry->sortedShardIntervalArray;
|
||||||
|
int shardCount = cacheEntry->shardIntervalArrayLength;
|
||||||
|
char partitionMethod = cacheEntry->partitionMethod;
|
||||||
|
FmgrInfo *compareFunction = cacheEntry->shardIntervalCompareFunction;
|
||||||
|
bool useBinarySearch = (partitionMethod != DISTRIBUTE_BY_HASH ||
|
||||||
|
!cacheEntry->hasUniformHashDistribution);
|
||||||
int shardIndex = INVALID_SHARD_INDEX;
|
int shardIndex = INVALID_SHARD_INDEX;
|
||||||
|
|
||||||
if (partitionMethod == DISTRIBUTE_BY_HASH)
|
if (partitionMethod == DISTRIBUTE_BY_HASH)
|
||||||
|
|
|
@ -61,7 +61,6 @@ typedef struct CitusCopyDestReceiver
|
||||||
|
|
||||||
/* distributed table metadata */
|
/* distributed table metadata */
|
||||||
DistTableCacheEntry *tableMetadata;
|
DistTableCacheEntry *tableMetadata;
|
||||||
bool useBinarySearch;
|
|
||||||
|
|
||||||
/* open relation handle */
|
/* open relation handle */
|
||||||
Relation distributedRelation;
|
Relation distributedRelation;
|
||||||
|
|
|
@ -44,7 +44,6 @@ extern void AddShardIntervalRestrictionToSelect(Query *subqery,
|
||||||
ShardInterval *shardInterval);
|
ShardInterval *shardInterval);
|
||||||
extern ShardInterval * FindShardForInsert(Query *query,
|
extern ShardInterval * FindShardForInsert(Query *query,
|
||||||
DeferredErrorMessage **planningError);
|
DeferredErrorMessage **planningError);
|
||||||
extern ShardInterval * FastShardPruning(Oid distributedTableId, Datum partitionValue);
|
|
||||||
|
|
||||||
|
|
||||||
#endif /* MULTI_ROUTER_PLANNER_H */
|
#endif /* MULTI_ROUTER_PLANNER_H */
|
||||||
|
|
|
@ -13,6 +13,7 @@
|
||||||
#define SHARDINTERVAL_UTILS_H_
|
#define SHARDINTERVAL_UTILS_H_
|
||||||
|
|
||||||
#include "distributed/master_metadata_utility.h"
|
#include "distributed/master_metadata_utility.h"
|
||||||
|
#include "distributed/metadata_cache.h"
|
||||||
#include "nodes/primnodes.h"
|
#include "nodes/primnodes.h"
|
||||||
|
|
||||||
#define INVALID_SHARD_INDEX -1
|
#define INVALID_SHARD_INDEX -1
|
||||||
|
@ -33,10 +34,7 @@ extern int CompareRelationShards(const void *leftElement,
|
||||||
const void *rightElement);
|
const void *rightElement);
|
||||||
extern int ShardIndex(ShardInterval *shardInterval);
|
extern int ShardIndex(ShardInterval *shardInterval);
|
||||||
extern ShardInterval * FindShardInterval(Datum partitionColumnValue,
|
extern ShardInterval * FindShardInterval(Datum partitionColumnValue,
|
||||||
ShardInterval **shardIntervalCache,
|
DistTableCacheEntry *cacheEntry);
|
||||||
int shardCount, char partitionMethod,
|
|
||||||
FmgrInfo *compareFunction,
|
|
||||||
FmgrInfo *hashFunction, bool useBinarySearch);
|
|
||||||
extern bool SingleReplicatedTable(Oid relationId);
|
extern bool SingleReplicatedTable(Oid relationId);
|
||||||
|
|
||||||
#endif /* SHARDINTERVAL_UTILS_H_ */
|
#endif /* SHARDINTERVAL_UTILS_H_ */
|
||||||
|
|
Loading…
Reference in New Issue