/*------------------------------------------------------------------------- * * database.c * Commands to interact with the database object in a distributed * environment. * * Copyright (c) Citus Data, Inc. * *------------------------------------------------------------------------- */ #include "postgres.h" #include "miscadmin.h" #include "miscadmin.h" #include "access/heapam.h" #include "access/heapam.h" #include "access/htup_details.h" #include "access/xact.h" #include "catalog/objectaddress.h" #include "catalog/pg_collation.h" #include "catalog/pg_collation.h" #include "catalog/pg_database.h" #include "catalog/pg_database_d.h" #include "catalog/pg_tablespace.h" #include "catalog/pg_database_d.h" #include "catalog/pg_tablespace.h" #include "commands/dbcommands.h" #include "commands/defrem.h" #include "commands/defrem.h" #include "nodes/parsenodes.h" #include "utils/builtins.h" #include "utils/lsyscache.h" #include "utils/rel.h" #include "utils/relcache.h" #include "utils/builtins.h" #include "utils/lsyscache.h" #include "utils/rel.h" #include "utils/relcache.h" #include "utils/syscache.h" #include "distributed/adaptive_executor.h" #include "distributed/adaptive_executor.h" #include "distributed/commands.h" #include "distributed/commands/utility_hook.h" #include "distributed/deparse_shard_query.h" #include "distributed/deparse_shard_query.h" #include "distributed/deparser.h" #include "distributed/listutils.h" #include "distributed/metadata/distobject.h" #include "distributed/listutils.h" #include "distributed/metadata/distobject.h" #include "distributed/metadata_sync.h" #include "distributed/metadata_utility.h" #include "distributed/multi_executor.h" #include "distributed/relation_access_tracking.h" #include "distributed/worker_protocol.h" #include "distributed/worker_protocol.h" #include "distributed/worker_transaction.h" /* * DatabaseCollationInfo is used to store collation related information of a database */ typedef struct DatabaseCollationInfo { char *datcollate; char *datctype; #if PG_VERSION_NUM >= PG_VERSION_15 char *daticulocale; char *datcollversion; #endif #if PG_VERSION_NUM >= PG_VERSION_16 char *daticurules; #endif } DatabaseCollationInfo; static void EnsureSupportedCreateDatabaseCommand(CreatedbStmt *stmt); static char * GenerateCreateDatabaseStatementFromPgDatabase(Form_pg_database databaseForm); static DatabaseCollationInfo GetDatabaseCollation(Oid dbOid); static AlterOwnerStmt * RecreateAlterDatabaseOwnerStmt(Oid databaseOid); #if PG_VERSION_NUM >= PG_VERSION_15 static char * GetLocaleProviderString(char datlocprovider); #endif static char * GetTablespaceName(Oid tablespaceOid); static ObjectAddress * GetDatabaseAddressFromDatabaseName(char *databaseName, bool missingOk); static Oid get_database_owner(Oid db_oid); /* controlled via GUC */ bool EnableCreateDatabasePropagation = false; bool EnableAlterDatabaseOwner = true; /* * AlterDatabaseOwnerObjectAddress returns the ObjectAddress of the database that is the * object of the AlterOwnerStmt. Errors if missing_ok is false. */ List * AlterDatabaseOwnerObjectAddress(Node *node, bool missing_ok, bool isPostprocess) { AlterOwnerStmt *stmt = castNode(AlterOwnerStmt, node); Assert(stmt->objectType == OBJECT_DATABASE); Oid databaseOid = get_database_oid(strVal((String *) stmt->object), missing_ok); ObjectAddress *address = palloc0(sizeof(ObjectAddress)); ObjectAddressSet(*address, DatabaseRelationId, databaseOid); return list_make1(address); } /* * DatabaseOwnerDDLCommands returns a list of sql statements to idempotently apply a * change of the database owner on the workers so that the database is owned by the same * user on all nodes in the cluster. */ List * DatabaseOwnerDDLCommands(const ObjectAddress *address) { Node *stmt = (Node *) RecreateAlterDatabaseOwnerStmt(address->objectId); return list_make1(DeparseTreeNode(stmt)); } /* * RecreateAlterDatabaseOwnerStmt creates an AlterOwnerStmt that represents the operation * of changing the owner of the database to its current owner. */ static AlterOwnerStmt * RecreateAlterDatabaseOwnerStmt(Oid databaseOid) { AlterOwnerStmt *stmt = makeNode(AlterOwnerStmt); stmt->objectType = OBJECT_DATABASE; stmt->object = (Node *) makeString(get_database_name(databaseOid)); Oid ownerOid = get_database_owner(databaseOid); stmt->newowner = makeNode(RoleSpec); stmt->newowner->roletype = ROLESPEC_CSTRING; stmt->newowner->rolename = GetUserNameFromId(ownerOid, false); return stmt; } /* * get_database_owner returns the Oid of the role owning the database */ static Oid get_database_owner(Oid dbId) { HeapTuple tuple = SearchSysCache1(DATABASEOID, ObjectIdGetDatum(dbId)); if (!HeapTupleIsValid(tuple)) { ereport(ERROR, (errcode(ERRCODE_UNDEFINED_DATABASE), errmsg("database with OID %u does not exist", dbId))); } Oid dba = ((Form_pg_database) GETSTRUCT(tuple))->datdba; ReleaseSysCache(tuple); return dba; } /* * PreprocessGrantOnDatabaseStmt is executed before the statement is applied to the local * postgres instance. * * In this stage we can prepare the commands that need to be run on all workers to grant * on databases. */ List * PreprocessGrantOnDatabaseStmt(Node *node, const char *queryString, ProcessUtilityContext processUtilityContext) { if (!ShouldPropagate()) { return NIL; } GrantStmt *stmt = castNode(GrantStmt, node); Assert(stmt->objtype == OBJECT_DATABASE); List *databaseList = stmt->objects; if (list_length(databaseList) == 0) { return NIL; } EnsureCoordinator(); char *sql = DeparseTreeNode((Node *) stmt); List *commands = list_make3(DISABLE_DDL_PROPAGATION, (void *) sql, ENABLE_DDL_PROPAGATION); return NodeDDLTaskList(NON_COORDINATOR_NODES, commands); } static bool isSetTablespaceStatement(AlterDatabaseStmt *stmt) { ListCell *lc = NULL; foreach(lc, stmt->options) { DefElem *def = (DefElem *) lfirst(lc); if (strcmp(def->defname, "tablespace") == 0) { return true; } } return false; } /* * PreprocessAlterDatabaseStmt is executed before the statement is applied to the local * postgres instance. * * In this stage we can prepare the commands that need to be run on all workers to grant * on databases. */ List * PreprocessAlterDatabaseStmt(Node *node, const char *queryString, ProcessUtilityContext processUtilityContext) { if (!ShouldPropagate()) { return NIL; } EnsureCoordinator(); AlterDatabaseStmt *stmt = castNode(AlterDatabaseStmt, node); char *sql = DeparseTreeNode((Node *) stmt); List *commands = list_make3(DISABLE_DDL_PROPAGATION, sql, ENABLE_DDL_PROPAGATION); if (isSetTablespaceStatement(stmt)) { /* * Set tablespace does not work inside a transaction.Therefore, we need to use * NontransactionalNodeDDLTask to run the command on the workers outside * the transaction block. */ return NontransactionalNodeDDLTaskList(NON_COORDINATOR_NODES, commands); } else { return NodeDDLTaskList(NON_COORDINATOR_NODES, commands); } } #if PG_VERSION_NUM >= PG_VERSION_15 /* * PreprocessAlterDatabaseSetStmt is executed before the statement is applied to the local * postgres instance. * * In this stage we can prepare the commands that need to be run on all workers to grant * on databases. */ List * PreprocessAlterDatabaseRefreshCollStmt(Node *node, const char *queryString, ProcessUtilityContext processUtilityContext) { if (!ShouldPropagate()) { return NIL; } AlterDatabaseRefreshCollStmt *stmt = castNode(AlterDatabaseRefreshCollStmt, node); EnsureCoordinator(); char *sql = DeparseTreeNode((Node *) stmt); List *commands = list_make3(DISABLE_DDL_PROPAGATION, (void *) sql, ENABLE_DDL_PROPAGATION); return NodeDDLTaskList(NON_COORDINATOR_NODES, commands); } #endif /* * PreprocessAlterDatabaseRenameStmt is executed before the statement is applied to the local * postgres instance. In this stage we prepare ALTER DATABASE RENAME statement to be run on * all workers. */ List * PreprocessAlterDatabaseRenameStmt(Node *node, const char *queryString, ProcessUtilityContext processUtilityContext) { if (!ShouldPropagate()) { return NIL; } EnsureCoordinator(); RenameStmt *stmt = castNode(RenameStmt, node); char *sql = DeparseTreeNode((Node *) stmt); List *commands = list_make3(DISABLE_DDL_PROPAGATION, (void *) sql, ENABLE_DDL_PROPAGATION); return NodeDDLTaskList(NON_COORDINATOR_NODES, commands); } /* * PreprocessAlterDatabaseSetStmt is executed before the statement is applied to the local * postgres instance. * * In this stage we can prepare the commands that need to be run on all workers to grant * on databases. */ List * PreprocessAlterDatabaseSetStmt(Node *node, const char *queryString, ProcessUtilityContext processUtilityContext) { if (!ShouldPropagate()) { return NIL; } AlterDatabaseSetStmt *stmt = castNode(AlterDatabaseSetStmt, node); EnsureCoordinator(); char *sql = DeparseTreeNode((Node *) stmt); List *commands = list_make3(DISABLE_DDL_PROPAGATION, (void *) sql, ENABLE_DDL_PROPAGATION); return NodeDDLTaskList(NON_COORDINATOR_NODES, commands); } /* * PostprocessAlterDatabaseStmt is executed before the statement is applied to the local * Postgres instance. * * In this stage, we perform validations that we want to ensure before delegating to * previous utility hooks because it might not be convenient to throw an error in an * implicit transaction that creates a database. */ List * PreprocessCreateDatabaseStmt(Node *node, const char *queryString, ProcessUtilityContext processUtilityContext) { if (!EnableCreateDatabasePropagation || !ShouldPropagate()) { return NIL; } EnsureCoordinator(); CreatedbStmt *stmt = castNode(CreatedbStmt, node); EnsureSupportedCreateDatabaseCommand(stmt); return NIL; } /* * PostprocessCreateDatabaseStmt is executed after the statement is applied to the local * postgres instance. In this stage we prepare the commands that need to be run on * all workers to create the database. Since the CREATE DATABASE statement gives error * in a transaction block, we need to use NontransactionalNodeDDLTaskList to send the * CREATE DATABASE statement to the workers. * */ List * PostprocessCreateDatabaseStmt(Node *node, const char *queryString) { if (!EnableCreateDatabasePropagation || !ShouldPropagate()) { return NIL; } EnsureCoordinator(); /* * Given that CREATE DATABASE doesn't support "IF NOT EXISTS" and we're * in the post-process, database must exist, hence missingOk = false. */ bool missingOk = false; bool isPostProcess = true; List *addresses = GetObjectAddressListFromParseTree(node, missingOk, isPostProcess); EnsureAllObjectDependenciesExistOnAllNodes(addresses); char *createDatabaseCommand = DeparseTreeNode(node); List *commands = list_make3(DISABLE_DDL_PROPAGATION, (void *) createDatabaseCommand, ENABLE_DDL_PROPAGATION); return NontransactionalNodeDDLTaskList(NON_COORDINATOR_NODES, commands); } /* * PreprocessDropDatabaseStmt is executed after the statement is applied to the local * postgres instance. In this stage we can prepare the commands that need to be run on * all workers to drop the database. Since the DROP DATABASE statement gives error in * transaction context, we need to use NontransactionalNodeDDLTaskList to send the * DROP DATABASE statement to the workers. */ List * PreprocessDropDatabaseStmt(Node *node, const char *queryString, ProcessUtilityContext processUtilityContext) { if (!EnableCreateDatabasePropagation || !ShouldPropagate()) { return NIL; } EnsureCoordinator(); DropdbStmt *stmt = (DropdbStmt *) node; bool isPostProcess = false; List *addresses = GetObjectAddressListFromParseTree(node, stmt->missing_ok, isPostProcess); if (list_length(addresses) != 1) { ereport(ERROR, (errmsg("unexpected number of objects found when " "executing DROP DATABASE command"))); } ObjectAddress *address = (ObjectAddress *) linitial(addresses); if (address->objectId == InvalidOid || !IsAnyObjectDistributed(list_make1(address))) { return NIL; } char *dropDatabaseCommand = DeparseTreeNode(node); List *commands = list_make3(DISABLE_DDL_PROPAGATION, (void *) dropDatabaseCommand, ENABLE_DDL_PROPAGATION); return NontransactionalNodeDDLTaskList(NON_COORDINATOR_NODES, commands); } /* * DropDatabaseStmtObjectAddress gets the ObjectAddress of the database that is the * object of the DropdbStmt. */ List * DropDatabaseStmtObjectAddress(Node *node, bool missingOk, bool isPostprocess) { DropdbStmt *stmt = castNode(DropdbStmt, node); ObjectAddress *dbAddress = GetDatabaseAddressFromDatabaseName(stmt->dbname, missingOk); return list_make1(dbAddress); } /* * CreateDatabaseStmtObjectAddress gets the ObjectAddress of the database that is the * object of the CreatedbStmt. */ List * CreateDatabaseStmtObjectAddress(Node *node, bool missingOk, bool isPostprocess) { CreatedbStmt *stmt = castNode(CreatedbStmt, node); ObjectAddress *dbAddress = GetDatabaseAddressFromDatabaseName(stmt->dbname, missingOk); return list_make1(dbAddress); } /* * EnsureSupportedCreateDatabaseCommand validates the options provided for the CREATE * DATABASE command. * * Parameters: * stmt: A CreatedbStmt struct representing a CREATE DATABASE command. * The options field is a list of DefElem structs, each representing an option. * * Currently, this function checks for the following: * - The "oid" option is not supported. * - The "template" option is only supported with the value "template1". * - The "strategy" option is only supported with the value "wal_log". */ void EnsureSupportedCreateDatabaseCommand(CreatedbStmt *stmt) { DefElem *option = NULL; foreach_ptr(option, stmt->options) { if (strcmp(option->defname, "oid") == 0) { ereport(ERROR, errmsg("CREATE DATABASE option \"%s\" is not supported", option->defname)); } char *optionValue = defGetString(option); if (strcmp(option->defname, "template") == 0 && strcmp(optionValue, "template1") != 0) { ereport(ERROR, errmsg("Only template1 is supported as template " "parameter for CREATE DATABASE")); } if (strcmp(option->defname, "strategy") == 0 && strcmp(optionValue, "wal_log") != 0) { ereport(ERROR, errmsg("Only wal_log is supported as strategy " "parameter for CREATE DATABASE")); } } } /* * GetDatabaseAddressFromDatabaseName gets the database name and returns the ObjectAddress * of the database. */ static ObjectAddress * GetDatabaseAddressFromDatabaseName(char *databaseName, bool missingOk) { Oid databaseOid = get_database_oid(databaseName, missingOk); ObjectAddress *dbObjectAddress = palloc0(sizeof(ObjectAddress)); ObjectAddressSet(*dbObjectAddress, DatabaseRelationId, databaseOid); return dbObjectAddress; } /* * GetTablespaceName gets the tablespace oid and returns the tablespace name. */ static char * GetTablespaceName(Oid tablespaceOid) { HeapTuple tuple = SearchSysCache1(TABLESPACEOID, ObjectIdGetDatum(tablespaceOid)); if (!HeapTupleIsValid(tuple)) { return NULL; } Form_pg_tablespace tablespaceForm = (Form_pg_tablespace) GETSTRUCT(tuple); char *tablespaceName = pstrdup(NameStr(tablespaceForm->spcname)); ReleaseSysCache(tuple); return tablespaceName; } /* * GetDatabaseCollation gets oid of a database and returns all the collation related information * We need this method since collation related info in Form_pg_database is not accessible. */ static DatabaseCollationInfo GetDatabaseCollation(Oid dbOid) { DatabaseCollationInfo info; memset(&info, 0, sizeof(DatabaseCollationInfo)); Relation rel = table_open(DatabaseRelationId, AccessShareLock); HeapTuple tup = get_catalog_object_by_oid(rel, Anum_pg_database_oid, dbOid); if (!HeapTupleIsValid(tup)) { elog(ERROR, "cache lookup failed for database %u", dbOid); } bool isNull = false; TupleDesc tupdesc = RelationGetDescr(rel); Datum collationDatum = heap_getattr(tup, Anum_pg_database_datcollate, tupdesc, &isNull); info.datcollate = TextDatumGetCString(collationDatum); Datum ctypeDatum = heap_getattr(tup, Anum_pg_database_datctype, tupdesc, &isNull); info.datctype = TextDatumGetCString(ctypeDatum); #if PG_VERSION_NUM >= PG_VERSION_15 Datum icuLocaleDatum = heap_getattr(tup, Anum_pg_database_daticulocale, tupdesc, &isNull); if (!isNull) { info.daticulocale = TextDatumGetCString(icuLocaleDatum); } Datum collverDatum = heap_getattr(tup, Anum_pg_database_datcollversion, tupdesc, &isNull); if (!isNull) { info.datcollversion = TextDatumGetCString(collverDatum); } #endif #if PG_VERSION_NUM >= PG_VERSION_16 Datum icurulesDatum = heap_getattr(tup, Anum_pg_database_daticurules, tupdesc, &isNull); if (!isNull) { info.daticurules = TextDatumGetCString(icurulesDatum); } #endif table_close(rel, AccessShareLock); heap_freetuple(tup); return info; } #if PG_VERSION_NUM >= PG_VERSION_15 /* * GetLocaleProviderString gets the datlocprovider stored in pg_database * and returns the string representation of the datlocprovider */ static char * GetLocaleProviderString(char datlocprovider) { switch (datlocprovider) { case 'c': { return "libc"; } case 'i': { return "icu"; } default: { ereport(ERROR, (errmsg("unexpected datlocprovider value: %c", datlocprovider))); } } } #endif /* * GenerateCreateDatabaseStatementFromPgDatabase gets the pg_database tuple and returns the * CREATE DATABASE statement that can be used to create given database. * * Note that this doesn't deparse OID of the database and this is not a * problem as we anyway don't allow specifying custom OIDs for databases * when creating them. */ static char * GenerateCreateDatabaseStatementFromPgDatabase(Form_pg_database databaseForm) { DatabaseCollationInfo collInfo = GetDatabaseCollation(databaseForm->oid); StringInfoData str; initStringInfo(&str); appendStringInfo(&str, "CREATE DATABASE %s", quote_identifier(NameStr(databaseForm->datname))); appendStringInfo(&str, " CONNECTION LIMIT %d", databaseForm->datconnlimit); appendStringInfo(&str, " ALLOW_CONNECTIONS = %s", quote_literal_cstr(databaseForm->datallowconn ? "true" : "false")); appendStringInfo(&str, " IS_TEMPLATE = %s", quote_literal_cstr(databaseForm->datistemplate ? "true" : "false")); appendStringInfo(&str, " LC_COLLATE = %s", quote_literal_cstr(collInfo.datcollate)); appendStringInfo(&str, " LC_CTYPE = %s", quote_literal_cstr(collInfo.datctype)); appendStringInfo(&str, " OWNER = %s", quote_identifier(GetUserNameFromId(databaseForm->datdba, false))); appendStringInfo(&str, " TABLESPACE = %s", quote_identifier(GetTablespaceName(databaseForm->dattablespace))); appendStringInfo(&str, " ENCODING = %s", quote_literal_cstr(pg_encoding_to_char(databaseForm->encoding))); #if PG_VERSION_NUM >= PG_VERSION_15 if (collInfo.datcollversion != NULL) { appendStringInfo(&str, " COLLATION_VERSION = %s", quote_identifier(collInfo.datcollversion)); } if (collInfo.daticulocale != NULL) { appendStringInfo(&str, " ICU_LOCALE = %s", quote_identifier( collInfo.daticulocale)); } appendStringInfo(&str, " LOCALE_PROVIDER = %s", quote_identifier(GetLocaleProviderString( databaseForm->datlocprovider))); #endif #if PG_VERSION_NUM >= PG_VERSION_16 if (collInfo.daticurules != NULL) { appendStringInfo(&str, " ICU_RULES = %s", quote_identifier( collInfo.daticurules)); } #endif return str.data; } /* * CreateDatabaseDDLCommand returns a CREATE DATABASE command to create given * database * * Command is wrapped by citus_internal_database_command() UDF * to avoid from transaction block restrictions that apply to database commands. */ char * CreateDatabaseDDLCommand(Oid dbId) { HeapTuple tuple = SearchSysCache1(DATABASEOID, ObjectIdGetDatum(dbId)); if (!HeapTupleIsValid(tuple)) { ereport(ERROR, (errcode(ERRCODE_UNDEFINED_DATABASE), errmsg("database with OID %u does not exist", dbId))); } Form_pg_database databaseForm = (Form_pg_database) GETSTRUCT(tuple); char *createStmt = GenerateCreateDatabaseStatementFromPgDatabase(databaseForm); StringInfo outerDbStmt = makeStringInfo(); /* Generate the CREATE DATABASE statement */ appendStringInfo(outerDbStmt, "SELECT pg_catalog.citus_internal_database_command(%s)", quote_literal_cstr(createStmt)); ReleaseSysCache(tuple); return outerDbStmt->data; }