citus/src/backend/distributed/utils/distribution_column.c

214 lines
6.2 KiB
C

/*-------------------------------------------------------------------------
*
* distribution_column.c
*
* This file contains functions for translating distribution columns in
* metadata tables.
*
* Copyright (c) Citus Data, Inc.
*
*-------------------------------------------------------------------------
*/
#include "postgres.h"
#include "access/attnum.h"
#include "access/heapam.h"
#include "access/htup_details.h"
#include "distributed/distribution_column.h"
#include "distributed/metadata_cache.h"
#include "distributed/multi_partitioning_utils.h"
#include "distributed/version_compat.h"
#include "nodes/makefuncs.h"
#include "nodes/nodes.h"
#include "nodes/primnodes.h"
#include "parser/scansup.h"
#include "utils/builtins.h"
#include "utils/elog.h"
#include "utils/errcodes.h"
#include "utils/lsyscache.h"
#include "utils/rel.h"
#include "utils/relcache.h"
#include "utils/syscache.h"
/*
 * exports for SQL callable functions; each function named here is defined
 * further down in this file
 */
PG_FUNCTION_INFO_V1(column_name_to_column);
PG_FUNCTION_INFO_V1(column_name_to_column_id);
PG_FUNCTION_INFO_V1(column_to_column_name);
/*
 * column_name_to_column is an internal UDF that serializes the Var node of a
 * column to text. It takes a relation identifier (argument 0) and a column
 * name (argument 1). The relation does not need to be distributed; the
 * function only resolves the column and returns the textual form of the
 * resulting Var.
 *
 * The lookup is delegated to BuildDistributionKeyFromColumnName, which raises
 * an ERROR when the column does not exist or when the name refers to a system
 * column.
 */
Datum
column_name_to_column(PG_FUNCTION_ARGS)
{
	CheckCitusVersion(ERROR);

	Oid tableOid = PG_GETARG_OID(0);
	char *requestedName = text_to_cstring(PG_GETARG_TEXT_P(1));

	/* this is a read-only lookup, so only AccessShareLock is requested */
	Var *columnVar = BuildDistributionKeyFromColumnName(tableOid, requestedName,
														AccessShareLock);
	Assert(columnVar != NULL);

	/* serialize the Var node and hand it back as a text datum */
	PG_RETURN_TEXT_P(cstring_to_text(nodeToString(columnVar)));
}
/*
* column_name_to_column_id takes a relation identifier and a name of a column
* in that relation and returns the index of that column in the relation. If
* the provided name is a system column or no column at all, this function will
* throw an error instead.
*/
Datum
column_name_to_column_id(PG_FUNCTION_ARGS)
{
Oid distributedTableId = PG_GETARG_OID(0);
char *columnName = PG_GETARG_CSTRING(1);
Var *column = BuildDistributionKeyFromColumnName(distributedTableId, columnName,
AccessExclusiveLock);
Assert(column != NULL);
PG_RETURN_INT16((int16) column->varattno);
}
/*
 * column_to_column_name is an internal UDF that maps the internal textual
 * (Var) representation of a column back to its human-readable name. It takes
 * a relation identifier (argument 0) and the serialized node (argument 1).
 *
 * Validation happens in ColumnToColumnName, which raises an ERROR when the
 * parsed node is not a Var, when it refers to a system column, or when no
 * such column can be found.
 */
Datum
column_to_column_name(PG_FUNCTION_ARGS)
{
	CheckCitusVersion(ERROR);

	Oid tableOid = PG_GETARG_OID(0);
	char *serializedNode = text_to_cstring(PG_GETARG_TEXT_P(1));

	/* parse the text back into a node tree and resolve the column name */
	Node *parsedNode = stringToNode(serializedNode);
	char *attributeName = ColumnToColumnName(tableOid, parsedNode);

	PG_RETURN_TEXT_P(cstring_to_text(attributeName));
}
/*
 * BuildDistributionKeyFromColumnName builds a simple distribution key consisting
 * only out of a reference to the column of name columnName. Errors out if the
 * relation cannot be opened, if the specified column does not exist, or if the
 * column is a system column and hence not suitable as a distribution column.
 *
 * The relation is locked with the caller-supplied lockMode. Only the relation
 * descriptor is closed before returning; the lock is not released here.
 *
 * columnName is passed to truncate_identifier, so the caller's buffer may be
 * modified in place when the name is too long for an identifier.
 *
 * The function returns NULL if the passed column name is NULL. That case only
 * corresponds to reference tables.
 */
Var *
BuildDistributionKeyFromColumnName(Oid relationId, char *columnName, LOCKMODE lockMode)
{
	/* honor the lock level requested by the caller instead of a fixed one */
	Relation relation = try_relation_open(relationId, lockMode);
	if (relation == NULL)
	{
		ereport(ERROR, (errmsg("relation does not exist")));
	}

	/* drop the relation reference but keep the lock */
	relation_close(relation, NoLock);

	char *tableName = get_rel_name(relationId);

	/* short circuit for reference tables */
	if (columnName == NULL)
	{
		return NULL;
	}

	/*
	 * It would probably be better to downcase identifiers consistent with SQL
	 * case folding; for now the name is only truncated.
	 */
	truncate_identifier(columnName, strlen(columnName), true);

	/* lookup column definition */
	HeapTuple columnTuple = SearchSysCacheAttName(relationId, columnName);
	if (!HeapTupleIsValid(columnTuple))
	{
		ereport(ERROR, (errcode(ERRCODE_UNDEFINED_COLUMN),
						errmsg("column \"%s\" of relation \"%s\" does not exist",
							   columnName, tableName)));
	}

	Form_pg_attribute columnForm = (Form_pg_attribute) GETSTRUCT(columnTuple);

	/* check if the column may be referenced in the distribution key */
	if (columnForm->attnum <= 0)
	{
		ereport(ERROR, (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
						errmsg("cannot reference system column \"%s\" in relation \"%s\"",
							   columnName, tableName)));
	}

	/* build Var referencing only the chosen distribution column */
	Var *distributionColumn = makeVar(1, columnForm->attnum, columnForm->atttypid,
									  columnForm->atttypmod, columnForm->attcollation, 0);

	/* the Var holds copies of the fields we need, so the tuple can be released */
	ReleaseSysCache(columnTuple);

	return distributionColumn;
}
/*
 * ColumnToColumnName returns the human-readable name of a column given a
 * relation identifier and the column's internal (Var) representation.
 *
 * This function will raise an ERROR if columnNode is NULL or not a Var, if
 * the Var refers to a system column, or if no attribute with the Var's
 * attribute number can be found in the relation.
 */
char *
ColumnToColumnName(Oid relationId, Node *columnNode)
{
	if (columnNode == NULL || !IsA(columnNode, Var))
	{
		ereport(ERROR, (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
						errmsg("not a valid column")));
	}

	Var *column = (Var *) columnNode;
	AttrNumber columnNumber = column->varattno;
	if (!AttrNumberIsForUserDefinedAttr(columnNumber))
	{
		char *relationName = get_rel_name(relationId);

		ereport(ERROR, (errcode(ERRCODE_INVALID_COLUMN_REFERENCE),
						errmsg("attribute %d of relation \"%s\" is a system column",
							   columnNumber, relationName)));
	}

	/*
	 * Ask get_attname to return NULL for a missing attribute (missing_ok is
	 * true) so that the descriptive error below is raised. With missing_ok
	 * set to false get_attname raises its own internal error and the NULL
	 * check can never fire.
	 */
	char *columnName = get_attname(relationId, columnNumber, true);
	if (columnName == NULL)
	{
		char *relationName = get_rel_name(relationId);

		ereport(ERROR, (errcode(ERRCODE_UNDEFINED_COLUMN),
						errmsg("attribute %d of relation \"%s\" does not exist",
							   columnNumber, relationName)));
	}

	return columnName;
}