UNPKG

@clickup/ent-framework

Version:

A PostgreSQL graph-database-alike library with microsharding and row-level security

656 lines (596 loc) 22.4 kB
import defaults from "lodash/defaults"; import type pg from "pg"; import type { ClientConnectionIssue, ClientOptions, ClientPingInput, ClientRole, } from "../abstract/Client"; import { Client } from "../abstract/Client"; import type { ClientErrorPostAction } from "../abstract/ClientError"; import { ClientError } from "../abstract/ClientError"; import { OP_PING, OP_SHARD_NOS, OP_TIMELINE_POS_REFRESH, } from "../abstract/internal/misc"; import type { ClientQueryLoggerProps } from "../abstract/Loggers"; import type { QueryAnnotation } from "../abstract/QueryAnnotation"; import { ShardError } from "../abstract/ShardError"; import { TimelineManager } from "../abstract/TimelineManager"; import type { MaybeCallable, MaybeError, PickPartial } from "../internal/misc"; import { addSentenceSuffixes, maybeCall, sanitizeIDForDebugPrinting, } from "../internal/misc"; import { Ref } from "../internal/Ref"; import type { Hints, Literal } from "../types"; import { escapeLiteral } from "./helpers/escapeLiteral"; import { buildHintQueries } from "./internal/buildHintQueries"; import { CLIENT_ERROR_PREDICATES } from "./internal/misc"; import { parseCompositeRow } from "./internal/parseCompositeRow"; import { parseLsn } from "./internal/parseLsn"; import { PgError } from "./PgError"; /** * Options for PgClient constructor. */ export interface PgClientOptions extends ClientOptions { /** Info on how to discover the shards. */ shards?: { /** Name of a PG shard schema (e.g. "sh%04d"). */ nameFormat: string; /** A SQL query which should return the names of shard schemas served by * this Client. */ discoverQuery: MaybeCallable<string>; } | null; /** PG "SET key=value" hints to run before each query. Often times we use it * to pass statement_timeout option since e.g. PGBouncer doesn't support * per-connection statement timeout in transaction pooling mode: it throws * "unsupported startup parameter" error. I.e. we may want to emit "SET * statement_timeout TO ..." before each query in multi-query mode. */ hints?: MaybeCallable<Hints> | null; /** After how many milliseconds we give up waiting for the replica to catch up * with the master. When role="replica", then this option is the only way to * "unlatch" the reads from the master node after a write. */ maxReplicationLagMs?: MaybeCallable<number>; /** Sometimes, the role of this Client is known statically, e.g. when pointing * to AWS Aurora writer and reader endpoints. If "master" or "replica" are * provided, then no attempt is made to use functions like * pg_current_wal_insert_lsn() etc. (they are barely supported in e.g. AWS * Aurora). Instead, for "replica" role, it is treated as "always lagging up * until maxReplicationLagMs after the last write". If role="unknown", then * auto-detection and automatic lag tracking is performed using * pg_current_wal_insert_lsn() and other built-in PostgreSQL functions. */ role?: ClientRole; /** Up to how often we call TimelineManager#triggerRefresh(). */ replicaTimelinePosRefreshMs?: MaybeCallable<number>; } /** * An opened low-level PostgreSQL connection. */ export interface PgClientConn extends pg.PoolClient { /** Undocumented property of node-postgres, see: * https://github.com/brianc/node-postgres/issues/2665 */ processID?: number | null; /** An additional property to the vanilla client: auto-incrementing ID of the * connection for logging purposes. */ id?: number; /** An additional property to the vanilla client: number of queries sent * within this connection. */ queriesSent?: number; /** An additional property to the vanilla client: when do we want to * hard-close that connection. */ closeAt?: number; } /** * An abstract PostgreSQL Client which doesn't know how to acquire an actual * connection and send queries; these things are up to the derived classes to * implement. * * The idea is that in each particular project, people may have they own classes * derived from PgClient, in case the codebase already has some existing * connection pooling solution. They don't have to use PgClientPool. * * Since the class is cloneable internally (using the prototype substitution * technique), the contract of this class is that ALL its derived classes may * only have readonly immediate properties. */ export abstract class PgClient extends Client { /** Default values for the constructor options. */ static override readonly DEFAULT_OPTIONS: Required< PickPartial<PgClientOptions> > = { ...super.DEFAULT_OPTIONS, shards: null, hints: null, role: "unknown", maxReplicationLagMs: 60000, replicaTimelinePosRefreshMs: 1000, }; /** Number of decimal digits in an ID allocated for shard number. Calculated * dynamically based on shards.nameFormat (e.g. for "sh%04d", it will be 4 * since it expands to "sh0012"). */ private readonly shardNoPadLen: number = 0; /** This value is set after each request to reflect the actual role of the * client. The idea is that master/replica role may change online, without * reconnecting the Client, so we need to refresh it after each request and be * ready for a fallback. The expectation is that the initial value is * populated during the very first shardNos() call. */ private readonly reportedRoleAfterLastQuery: Ref<ClientRole>; /** This value is non-null if there was an unsuccessful connection attempt * (i.e. the PG is down), and there were no successful queries since then. */ private readonly reportedConnectionIssue = new Ref<ClientConnectionIssue | null>(null); /** PgClient configuration options. */ override readonly options: Required<PgClientOptions>; /** Name of the shard associated to this Client. */ readonly shardName: string = "public"; /** An active TimelineManager for this particular Client. */ readonly timelineManager: TimelineManager; /** * Returns statistics about the connection pool. */ abstract poolStats(): ClientQueryLoggerProps["poolStats"]; /** * Called when the Client needs a connection to run a query against. Implies * than the caller MUST call release() method on the returned object. */ abstract acquireConn(): Promise<PgClientConn>; /** * Initializes an instance of PgClient. */ constructor(options: PgClientOptions) { super(options); this.options = defaults( {}, options, (this as Client).options, { maxReplicationLagMs: options.role === "master" || options.role === "replica" ? 2000 // e.g. AWS Aurora, assuming it always "catches up" fast : undefined, }, PgClient.DEFAULT_OPTIONS, ); this.reportedRoleAfterLastQuery = new Ref(this.options.role); this.timelineManager = new TimelineManager( this.options.maxReplicationLagMs, this.options.replicaTimelinePosRefreshMs, async () => { const startTime = performance.now(); try { await this.query({ query: [`SELECT '${OP_TIMELINE_POS_REFRESH}'`], isWrite: false, annotations: [], op: OP_TIMELINE_POS_REFRESH, table: "pg_catalog", }); } catch (error: unknown) { this.logSwallowedError({ where: OP_TIMELINE_POS_REFRESH, error, elapsed: Math.round(performance.now() - startTime), importance: "normal", }); } }, ); if (this.options.shards) { this.shardNoPadLen = this.buildShardName(0).match(/(\d+)/) ? RegExp.$1.length : 0; if (!this.shardNoPadLen) { throw Error("Invalid shards.nameFormat value"); } } } /** * Sends a query (internally, a multi-query). After the query finishes, we * should expect that role() returns the actual master/replica role. */ async query<TRow>({ query: queryLiteral, hints, isWrite, annotations, op, table, batchFactor, }: { query: Literal; hints?: Hints; isWrite: boolean; annotations: QueryAnnotation[]; op: string; table: string; batchFactor?: number; }): Promise<TRow[]> { const { rawPrepend, queries, queriesRollback, debugQueryWithHints, resultPos, } = this.buildMultiQuery( hints, queryLiteral, this.options.role === "unknown" ? // For master, we read its WAL LSN (pg_current_wal_insert_lsn) after // each query (notice that, when run on a replica, // pg_current_wal_insert_lsn() throws, so we call it only if // pg_is_in_recovery() returns false). For replica, we read its WAL // LSN (pg_last_wal_replay_lsn). "SELECT CASE WHEN pg_is_in_recovery() THEN NULL ELSE pg_current_wal_insert_lsn() END AS pg_current_wal_insert_lsn, pg_last_wal_replay_lsn()" : undefined, isWrite, ); const startTime = performance.now(); let queryTime: number | undefined = undefined; let conn: PgClientConn | undefined = undefined; let res: TRow[] | undefined = undefined; let e: MaybeError<{ severity?: unknown }> = undefined; let postAction: ClientErrorPostAction = "fail"; try { if (this.isEnded()) { throw new ClientError( Error(`Cannot use ${this.constructor.name} since it's ended`), this.options.name, "choose-another-client", "data-on-server-is-unchanged", "client_is_ended", ); } conn = await this.acquireConn(); conn.id ??= connNo++; conn.queriesSent = (conn.queriesSent ?? 0) + 1; queryTime = Math.round(performance.now() - startTime); const resMulti = await this.sendMultiQuery( conn, rawPrepend, queries, queriesRollback, ); this.reportedConnectionIssue.current = null; res = resMulti[resultPos].rows; if (this.options.role === "unknown") { const lsns = resMulti[resMulti.length - 1].rows[0] as { pg_current_wal_insert_lsn: string | null; pg_last_wal_replay_lsn: string | null; }; if (lsns.pg_current_wal_insert_lsn !== null) { this.reportedRoleAfterLastQuery.current = "master"; this.timelineManager.setCurrentPos( parseLsn(lsns.pg_current_wal_insert_lsn)!, ); } else if (lsns.pg_last_wal_replay_lsn !== null) { this.reportedRoleAfterLastQuery.current = "replica"; this.timelineManager.setCurrentPos( parseLsn(lsns.pg_last_wal_replay_lsn), ); } else { throw Error( "BUG: both pg_current_wal_insert_lsn() and pg_last_wal_replay_lsn() returned null", ); } } else if (this.options.role === "master") { this.reportedRoleAfterLastQuery.current = "master"; // In this mode, master pos is always =1 constant. this.timelineManager.setCurrentPos(BigInt(1), true); } else { this.reportedRoleAfterLastQuery.current = "replica"; // In this mode, replica pos is always =0 constant (i.e. always behind // the master), and we solely rely on maxReplicationLagMs timeline data // expiration in Timeline object. this.timelineManager.setCurrentPos(BigInt(0), true); } return res; } catch (cause: unknown) { e = cause as MaybeError<{ severity?: unknown }>; if (e instanceof ClientError) { throw e; } // Infer ClientError which affects Client choosing logic. for (const predicate of CLIENT_ERROR_PREDICATES) { const res = predicate({ code: "" + e?.code, message: "" + e?.message, }); if (res) { if (!isWrite) { // For read queries, we know for sure that the data wasn't changed. res.kind = "data-on-server-is-unchanged"; } postAction = this.role() === "master" ? res.postAction.ifMaster : res.postAction.ifReplica; if (res.postAction.reportConnectionIssue) { // Mark the current Client as non-healthy, so the retry logic will // likely choose another one if available. this.reportedConnectionIssue.current = { timestamp: new Date(), cause, postAction, kind: res.kind, comment: res.comment, }; } throw new ClientError( e, this.options.name, postAction, res.kind, res.abbreviation, res.comment + (res.kind === "unknown-server-state" ? " The write might have been committed on the PG server though." : ""), ); } } // Only wrap the errors which PG sent to us explicitly. Those errors mean // that there was some aborted transaction, so it's safe to retry. if (e?.severity) { throw new PgError(e, this.options.name, debugQueryWithHints); } // Some other error which should not trigger query retries or // Shards/Islands rediscovery. throw e; } finally { conn?.release(); const now = performance.now(); this.options.loggers?.clientQueryLogger?.({ annotations, op, shard: this.shardName, table, batchFactor: batchFactor ?? 1, msg: debugQueryWithHints, output: res ? res : undefined, elapsed: { total: Math.round(now - startTime), acquire: queryTime !== undefined ? queryTime : Math.round(now - startTime), }, connStats: { id: conn ? "" + (conn.id ?? 0) : "?", queriesSent: conn?.queriesSent ?? 0, }, poolStats: this.poolStats(), error: e === undefined ? undefined : addSentenceSuffixes( `${e}`, e?.code ? ` (${e.code})` : undefined, ` [${postAction}]`, ), role: this.role(), backend: this.options.name, address: this.address(), }); } } async shardNos(): Promise<readonly number[]> { // An installation without sharding enabled. if (!this.options.shards) { return [0]; } // e.g. sh0000, sh0123 and not e.g. sh1 or sh12345678 const rows = await this.query<Partial<Record<string, string>>>({ query: [maybeCall(this.options.shards.discoverQuery)], isWrite: false, annotations: [], op: OP_SHARD_NOS, table: "pg_catalog", }); return rows .map((row) => Object.values(row)[0]) .map((name) => { const no = name?.match(/(\d+)/) ? parseInt(RegExp.$1) : null; return no !== null && name === this.buildShardName(no) ? no : null; }) .filter((no): no is number => no !== null) .sort((a, b) => a - b); } async ping({ execTimeMs, isWrite, annotation, }: ClientPingInput): Promise<void> { await this.query<Partial<Record<string, string>>>({ query: [ "DO $$ BEGIN PERFORM pg_sleep(?); IF pg_is_in_recovery() AND ? THEN RAISE read_only_sql_transaction; END IF; END $$", execTimeMs / 1000, isWrite, ], isWrite, annotations: [annotation], op: OP_PING, table: "pg_catalog", }); } shardNoByID(id: string): number { // An installation without sharding enabled. if (!this.options.shards) { return 0; } // Just a historical exception for id="1". if (id === "1") { return 1; } // Composite ID: `(100008888888,1023499999999)` - try extracting non-zero // Shard from parts (left to right) first, and if there is none, allow shard // zero too. if (typeof id === "string" && id.startsWith("(") && id.endsWith(")")) { let no = NaN; for (const subID of parseCompositeRow(id)) { const tryNo = subID && subID.length >= this.shardNoPadLen + 1 ? parseInt(subID.substring(1, this.shardNoPadLen + 1)) : NaN; if (!isNaN(tryNo)) { if (tryNo > 0) { return tryNo; } else if (isNaN(no)) { no = tryNo; } } } if (isNaN(no)) { const idSafe = sanitizeIDForDebugPrinting(id); throw Error( `Cannot extract shard number from the composite ID ${idSafe}`, ); } return no; } // Plain ID. const no = typeof id === "string" && id.length >= this.shardNoPadLen + 1 ? parseInt(id.substring(1, this.shardNoPadLen + 1)) : NaN; if (isNaN(no)) { const idSafe = sanitizeIDForDebugPrinting(id); throw new ShardError( `Cannot parse ID ${idSafe} to detect shard number`, this.options.name, ); } return no; } withShard(no: number): this { return Object.assign(Object.create(this.constructor.prototype), { ...this, shardName: this.buildShardName(no), // Notice that we can ONLY have readonly properties in this and all // derived classes to make it work. If we need some mutable props shared // across all of the clones, we need to wrap them in a Ref (and make the // Ref object itself readonly). That's a pretty fragile contract though. }); } role(): ClientRole { return this.reportedRoleAfterLastQuery.current; } connectionIssue(): ClientConnectionIssue | null { return this.reportedConnectionIssue.current; } /** * Prepares a PG Client multi-query from the query literal and hints. */ private buildMultiQuery( hints: Hints | undefined, literal: Literal, epilogue: string | undefined, isWrite: boolean, ): { rawPrepend: string; queries: string[]; queriesRollback: string[]; debugQueryWithHints: string; resultPos: number; } { const query = escapeLiteral(literal).trimEnd(); if (query === "") { throw Error("Empty query passed to query()"); } const queriesPrologue: string[] = []; const queriesEpilogue: string[] = []; const queriesRollback: string[] = []; const [rawPrepend, hintQueriesDefault, hintQueries] = buildHintQueries( this.options.hints ? maybeCall(this.options.hints) : undefined, hints, ); // Prepend per-query hints to the prologue (if any); they will be logged. queriesPrologue.unshift(...hintQueries); // The query which is logged to the logging infra. For more brief messages, // we don't log internal hints (this.hints) and search_path; see below. const debugQueryWithHints = `${rawPrepend}/*${this.shardName}*/` + [...queriesPrologue, query].join("; ").trim(); // Prepend internal per-Client hints to the prologue. queriesPrologue.unshift(...hintQueriesDefault); // We must always have "public" in search_path, because extensions are by // default installed in "public" schema. Some extensions may expose // operators (e.g. "citext" exposes comparison operators) which must be // available in all Shards by default, so they should live in "public". // (There is a way to install an extension to a particular schema, but a) // there can be only one such schema, and b) there are problems running // pg_dump when migrating this Shard to another machine since pg_dump // doesn't emit CREATE EXTENSION statement when filtering by schema name). queriesPrologue.unshift( `SET LOCAL search_path TO ${this.shardName}, public`, ); if (epilogue) { queriesEpilogue.push(epilogue); } // Why wrapping with BEGIN...COMMIT for write queries? See here: // https://www.postgresql.org/message-id/20220803.163217.1789690807623885906.horikyota.ntt%40gmail.com if (isWrite && queriesEpilogue.length > 0) { queriesPrologue.unshift("BEGIN"); queriesRollback.unshift("ROLLBACK"); queriesEpilogue.unshift("COMMIT"); } return { rawPrepend, queries: [...queriesPrologue, query, ...queriesEpilogue], queriesRollback, debugQueryWithHints, resultPos: queriesPrologue.length, }; } /** * Sends a multi-query to PG Client. * * A good and simple explanation of the protocol is here: * https://www.postgresql.org/docs/13/protocol-flow.html. In short, we can't * use prepared-statement-based operations even theoretically, because this * mode doesn't support multi-queries. Also notice that TS typing is doomed * for multi-queries: * https://github.com/DefinitelyTyped/DefinitelyTyped/pull/33297 */ private async sendMultiQuery( conn: PgClientConn, rawPrepend: string, queries: string[], queriesRollback: string[], ): Promise<pg.QueryResult[]> { const queriesStr = `${rawPrepend}/*${this.shardName}*/${queries.join("; ")}`; // For multi-query, query() actually returns an array of pg.QueryResult, but // it's not reflected in its TS typing, so patching this. const resMulti = (await conn.query(queriesStr).catch(async (e) => { // We must run a ROLLBACK if we used BEGIN in the queries, because // otherwise the connection is released to the pool in "aborted // transaction" state (see the protocol link above). queriesRollback.length > 0 && (await conn.query(queriesRollback.join("; ")).catch(() => {})); throw e; })) as unknown as Array<pg.QueryResult<{}>>; if (resMulti.length !== queries.length) { throw Error( `Multi-query (with semicolons) is not allowed as an input to query(); got ${queriesStr}`, ); } return resMulti; } /** * Builds the schema name (aka "Shard name") by Shard number using * `options#shards#nameFormat`. * * E.g. nameFormat="sh%04d" generates names like "sh0042". */ private buildShardName(no: number | string): string { // return this.options.shards ? this.options.shards.nameFormat.replace( /%(0?)(\d+)[sd]/, (_, zero: string, d: string) => no.toString().padStart(zero ? parseInt(d) : 0, "0"), ) : this.shardName; } } let connNo = 1;