mirror of https://github.com/citusdata/citus.git
214 lines
6.2 KiB
C
214 lines
6.2 KiB
C
/*-------------------------------------------------------------------------
|
|
*
|
|
* distribution_column.c
|
|
*
|
|
* This file contains functions for translating distribution columns in
|
|
* metadata tables.
|
|
*
|
|
* Copyright (c) Citus Data, Inc.
|
|
*
|
|
*-------------------------------------------------------------------------
|
|
*/
|
|
|
|
#include "postgres.h"
|
|
|
|
|
|
#include "access/attnum.h"
|
|
#include "access/heapam.h"
|
|
#include "access/htup_details.h"
|
|
#include "distributed/distribution_column.h"
|
|
#include "distributed/metadata_cache.h"
|
|
#include "distributed/multi_partitioning_utils.h"
|
|
#include "distributed/version_compat.h"
|
|
#include "nodes/makefuncs.h"
|
|
#include "nodes/nodes.h"
|
|
#include "nodes/primnodes.h"
|
|
#include "parser/scansup.h"
|
|
#include "utils/builtins.h"
|
|
#include "utils/elog.h"
|
|
#include "utils/errcodes.h"
|
|
#include "utils/lsyscache.h"
|
|
#include "utils/rel.h"
|
|
#include "utils/relcache.h"
|
|
#include "utils/syscache.h"
|
|
|
|
|
|
/*
 * Declare the SQL-callable functions implemented in this file through
 * PG_FUNCTION_INFO_V1, one declaration per function.
 */
|
|
PG_FUNCTION_INFO_V1(column_name_to_column);
|
|
PG_FUNCTION_INFO_V1(column_name_to_column_id);
|
|
PG_FUNCTION_INFO_V1(column_to_column_name);
|
|
|
|
|
|
/*
|
|
* column_name_to_column is an internal UDF to obtain a textual representation
|
|
* of a particular column node (Var), given a relation identifier and column
|
|
* name. There is no requirement that the table be distributed; this function
|
|
* simply returns the textual representation of a Var representing a column.
|
|
* This function will raise an ERROR if no such column can be found or if the
|
|
* provided name refers to a system column.
|
|
*/
|
|
Datum
|
|
column_name_to_column(PG_FUNCTION_ARGS)
|
|
{
|
|
CheckCitusVersion(ERROR);
|
|
|
|
Oid relationId = PG_GETARG_OID(0);
|
|
text *columnText = PG_GETARG_TEXT_P(1);
|
|
char *columnName = text_to_cstring(columnText);
|
|
|
|
Var *column = BuildDistributionKeyFromColumnName(relationId, columnName,
|
|
AccessShareLock);
|
|
Assert(column != NULL);
|
|
char *columnNodeString = nodeToString(column);
|
|
text *columnNodeText = cstring_to_text(columnNodeString);
|
|
|
|
PG_RETURN_TEXT_P(columnNodeText);
|
|
}
|
|
|
|
|
|
/*
|
|
* column_name_to_column_id takes a relation identifier and a name of a column
|
|
* in that relation and returns the index of that column in the relation. If
|
|
* the provided name is a system column or no column at all, this function will
|
|
* throw an error instead.
|
|
*/
|
|
Datum
|
|
column_name_to_column_id(PG_FUNCTION_ARGS)
|
|
{
|
|
Oid distributedTableId = PG_GETARG_OID(0);
|
|
char *columnName = PG_GETARG_CSTRING(1);
|
|
|
|
Var *column = BuildDistributionKeyFromColumnName(distributedTableId, columnName,
|
|
AccessExclusiveLock);
|
|
Assert(column != NULL);
|
|
|
|
PG_RETURN_INT16((int16) column->varattno);
|
|
}
|
|
|
|
|
|
/*
|
|
* column_to_column_name is an internal UDF to obtain the human-readable name
|
|
* of a column given a relation identifier and the column's internal textual
|
|
* (Var) representation. This function will raise an ERROR if no such column
|
|
* can be found or if the provided Var refers to a system column.
|
|
*/
|
|
Datum
|
|
column_to_column_name(PG_FUNCTION_ARGS)
|
|
{
|
|
CheckCitusVersion(ERROR);
|
|
|
|
Oid relationId = PG_GETARG_OID(0);
|
|
text *columnNodeText = PG_GETARG_TEXT_P(1);
|
|
|
|
char *columnNodeString = text_to_cstring(columnNodeText);
|
|
Node *columnNode = stringToNode(columnNodeString);
|
|
|
|
char *columnName = ColumnToColumnName(relationId, columnNode);
|
|
|
|
text *columnText = cstring_to_text(columnName);
|
|
|
|
PG_RETURN_TEXT_P(columnText);
|
|
}
|
|
|
|
|
|
/*
|
|
* BuildDistributionKeyFromColumnName builds a simple distribution key consisting
|
|
* only out of a reference to the column of name columnName. Errors out if the
|
|
* specified column does not exist or is not suitable to be used as a
|
|
* distribution column.
|
|
*
|
|
* The function returns NULL if the passed column name is NULL. That case only
|
|
* corresponds to reference tables.
|
|
*/
|
|
Var *
|
|
BuildDistributionKeyFromColumnName(Oid relationId, char *columnName, LOCKMODE lockMode)
|
|
{
|
|
Relation relation = try_relation_open(relationId, ExclusiveLock);
|
|
|
|
if (relation == NULL)
|
|
{
|
|
ereport(ERROR, (errmsg("relation does not exist")));
|
|
}
|
|
|
|
relation_close(relation, NoLock);
|
|
|
|
char *tableName = get_rel_name(relationId);
|
|
|
|
/* short circuit for reference tables */
|
|
if (columnName == NULL)
|
|
{
|
|
return NULL;
|
|
}
|
|
|
|
/* it'd probably better to downcase identifiers consistent with SQL case folding */
|
|
truncate_identifier(columnName, strlen(columnName), true);
|
|
|
|
/* lookup column definition */
|
|
HeapTuple columnTuple = SearchSysCacheAttName(relationId, columnName);
|
|
if (!HeapTupleIsValid(columnTuple))
|
|
{
|
|
ereport(ERROR, (errcode(ERRCODE_UNDEFINED_COLUMN),
|
|
errmsg("column \"%s\" of relation \"%s\" does not exist",
|
|
columnName, tableName)));
|
|
}
|
|
|
|
Form_pg_attribute columnForm = (Form_pg_attribute) GETSTRUCT(columnTuple);
|
|
|
|
/* check if the column may be referenced in the distribution key */
|
|
if (columnForm->attnum <= 0)
|
|
{
|
|
ereport(ERROR, (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
|
|
errmsg("cannot reference system column \"%s\" in relation \"%s\"",
|
|
columnName, tableName)));
|
|
}
|
|
|
|
/* build Var referencing only the chosen distribution column */
|
|
Var *distributionColumn = makeVar(1, columnForm->attnum, columnForm->atttypid,
|
|
columnForm->atttypmod, columnForm->attcollation, 0);
|
|
|
|
ReleaseSysCache(columnTuple);
|
|
|
|
return distributionColumn;
|
|
}
|
|
|
|
|
|
/*
|
|
* ColumnToColumnName returns the human-readable name of a column given a
|
|
* relation identifier and the column's internal (Var) representation.
|
|
* This function will raise an ERROR if no such column can be found or if the
|
|
* provided Var refers to a system column.
|
|
*/
|
|
char *
|
|
ColumnToColumnName(Oid relationId, Node *columnNode)
|
|
{
|
|
if (columnNode == NULL || !IsA(columnNode, Var))
|
|
{
|
|
ereport(ERROR, (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
|
|
errmsg("not a valid column")));
|
|
}
|
|
|
|
Var *column = (Var *) columnNode;
|
|
|
|
AttrNumber columnNumber = column->varattno;
|
|
if (!AttrNumberIsForUserDefinedAttr(columnNumber))
|
|
{
|
|
char *relationName = get_rel_name(relationId);
|
|
|
|
ereport(ERROR, (errcode(ERRCODE_INVALID_COLUMN_REFERENCE),
|
|
errmsg("attribute %d of relation \"%s\" is a system column",
|
|
columnNumber, relationName)));
|
|
}
|
|
|
|
char *columnName = get_attname(relationId, column->varattno, false);
|
|
if (columnName == NULL)
|
|
{
|
|
char *relationName = get_rel_name(relationId);
|
|
|
|
ereport(ERROR, (errcode(ERRCODE_UNDEFINED_COLUMN),
|
|
errmsg("attribute %d of relation \"%s\" does not exist",
|
|
columnNumber, relationName)));
|
|
}
|
|
|
|
return columnName;
|
|
}
|