UNPKG

fib-flow

Version:

A robust workflow management system for fibjs with task orchestration, state management, and distributed execution capabilities

247 lines (214 loc) 10.9 kB
/**
 * PostgreSQL-specific database adapter implementation
 * Extends BaseDBAdapter with PostgreSQL-specific schema and optimizations
 */

const BaseDBAdapter = require('./base');
const createLogger = require('../logger');

// Create logger for PostgreSQL adapter operations
const logger = createLogger('fib-flow');

/**
 * Build a representation of the adapter config that is safe to write to logs.
 *
 * - URL-style strings (`scheme://user:password@host/...`) get the password
 *   segment replaced with `***`.
 * - Plain objects that own a `password` property are shallow-copied with that
 *   property replaced with `***`.
 * - Anything else is returned untouched.
 *
 * The value handed to the base class is never modified; this only affects
 * what is logged.
 *
 * @param {*} config - Connection config as received by the constructor
 * @returns {*} Value suitable for logging
 */
function redactConfig(config) {
    if (typeof config === 'string') {
        // The password runs from the first ':' after the user name up to the
        // last '@' that precedes the first '/', so '@' inside a password is
        // covered while '@' in the path or query string is left alone.
        return config.replace(/^([a-z][a-z0-9+.-]*:\/\/[^:@/]*):[^/]*@/i, '$1:***@');
    }

    const isPlainObject = config !== null
        && typeof config === 'object'
        && Object.getPrototypeOf(config) === Object.prototype;

    if (isPlainObject && Object.prototype.hasOwnProperty.call(config, 'password')) {
        return Object.assign({}, config, { password: '***' });
    }

    return config;
}

/**
 * PostgreSQL adapter for task persistence
 * Uses native PostgreSQL features and includes indexes for optimal query performance
 */
class PSQLAdapter extends BaseDBAdapter {
    /**
     * @param {*} config - Connection config, forwarded unchanged to BaseDBAdapter
     * @param {number} [poolSize=5] - Pool size, forwarded unchanged to BaseDBAdapter
     */
    constructor(config, poolSize = 5) {
        // Log a redacted view only: the raw config may embed the database password.
        logger.info(`[PSQLAdapter] Initializing with config:`, redactConfig(config));
        super(config, poolSize);
    }

    /**
     * Initialize PostgreSQL-specific schema
     * Creates the tables and indexes below if they do not exist yet. All
     * statements are sent in a single execute() call on a pooled connection.
     *
     * Table fib_flow_tasks:
     * - Task identification and basic info:
     *   - id: BIGSERIAL primary key
     *   - name: Task type name, used to match with registered handlers
     *   - type: Task type (async: one-time, cron: recurring)
     *   - priority: Task priority for execution ordering (-20 to 20, higher runs first)
     *   - payload: JSON encoded task parameters and data
     *   - created_at: Task creation timestamp (Unix seconds)
     *   - tag: Task tag for categorization
     *
     * - Task execution status and results:
     *   - status: Current task state
     *   - next_run_time: Next scheduled execution time (Unix seconds)
     *   - last_active_time: Last time task reported activity (Unix seconds)
     *   - last_event_time, last_event_type: BIGINT / VARCHAR(100); presumably the
     *     time and type of the task's most recent event - confirm against the
     *     base adapter
     *   - result: JSON encoded task execution result
     *   - error: Error message if task failed
     *   - current_stage_name, progress_text, progress_percent, stage: stage and
     *     progress fields (VARCHAR(255), TEXT, DOUBLE PRECISION, INTEGER DEFAULT 0);
     *     semantics are defined by the code that writes them
     *
     * - Task execution settings:
     *   - timeout: Task execution timeout in seconds
     *   - retry_count: Number of retry attempts made
     *   - max_retries: Maximum number of retry attempts allowed
     *   - retry_interval: Delay between retry attempts in seconds
     *   - cron_expr: Cron expression for recurring tasks
     *
     * - Workflow relationships:
     *   - root_id: ID of the root task in workflow
     *   - parent_id: ID of the parent task
     *   - total_children: Total number of child tasks
     *   - completed_children: Number of completed child tasks
     *
     * - Worker information:
     *   - worker_id: ID of the worker that executed the task
     *   - start_time: Timestamp when task started execution (Unix seconds)
     *   - context: BYTEA column; contents are defined by the code that writes it
     *
     * Additional tables:
     * - fib_flow_task_events: one row per task event (task_id, root_id, parent_id,
     *   event_type, from_status, to_status, stage, worker_id, attempt,
     *   event_time, message, metadata)
     * - fib_flow_task_attempts: one row per execution attempt (task_id, attempt,
     *   worker_id, started_at, ended_at, outcome, error, timeout_flag)
     * - fib_flow_workers: worker registry keyed by worker_id (pod_id, status,
     *   registered_at, last_seen_at, expires_at, superseded_at, dead_at, meta)
     *
     * Indexes on fib_flow_tasks:
     * - idx_task_scheduling: (status, next_run_time, priority DESC), pending tasks only
     * - idx_task_timeout: (last_active_time), running tasks only
     * - idx_task_workflow: (parent_id, status) INCLUDE (completed_children,
     *   total_children), rows with a parent only
     * - idx_task_stats: (tag, name, status)
     * - idx_task_last_event: (last_event_time, last_event_type)
     * - idx_task_root_created: (root_id, created_at), rows with a root only
     *
     * Indexes on fib_flow_task_events: idx_task_events_{task,root,parent,type,
     * worker,stage,attempt}_time - each pairs the named column with event_time.
     *
     * Indexes on fib_flow_task_attempts: idx_task_attempts_task_attempt,
     * idx_task_attempts_task_open, idx_task_attempts_worker_started,
     * idx_task_attempts_outcome_started.
     *
     * Indexes on fib_flow_workers: idx_task_workers_pod_id,
     * idx_task_workers_status_expires, idx_task_workers_pod_status.
     */
    setup() {
        logger.notice(`[PSQLAdapter] Setting up database schema`);
        this.pool(conn => {
            logger.notice(`[PSQLAdapter] Creating tasks table if not exists`);

            // NOTE: the statement text contains `--` line comments, so its line
            // breaks are significant. Collapsing it onto one line would comment
            // out every statement that follows the first `--`.
            conn.execute(`
                CREATE TABLE IF NOT EXISTS fib_flow_tasks (
                    id BIGSERIAL PRIMARY KEY,
                    name VARCHAR(255) NOT NULL,
                    type VARCHAR(10) NOT NULL,
                    priority INTEGER DEFAULT 0,
                    payload TEXT,
                    created_at BIGINT,
                    tag VARCHAR(255),
                    status VARCHAR(20) NOT NULL,
                    next_run_time BIGINT NOT NULL,
                    last_active_time BIGINT,
                    last_event_time BIGINT,
                    last_event_type VARCHAR(100),
                    result TEXT,
                    error TEXT,
                    current_stage_name VARCHAR(255),
                    progress_text TEXT,
                    progress_percent DOUBLE PRECISION,
                    stage INTEGER DEFAULT 0,
                    timeout INTEGER DEFAULT 60,
                    retry_count INTEGER DEFAULT 0,
                    max_retries INTEGER DEFAULT 3,
                    retry_interval INTEGER DEFAULT 0,
                    cron_expr VARCHAR(100),
                    root_id BIGINT,
                    parent_id BIGINT,
                    total_children INTEGER DEFAULT 0,
                    completed_children INTEGER DEFAULT 0,
                    worker_id VARCHAR(255),
                    start_time BIGINT,
                    context BYTEA
                );

                CREATE TABLE IF NOT EXISTS fib_flow_task_events (
                    id BIGSERIAL PRIMARY KEY,
                    task_id BIGINT NOT NULL,
                    root_id BIGINT,
                    parent_id BIGINT,
                    event_type VARCHAR(100) NOT NULL,
                    from_status VARCHAR(32),
                    to_status VARCHAR(32),
                    stage INTEGER,
                    worker_id VARCHAR(255),
                    attempt INTEGER,
                    event_time BIGINT NOT NULL,
                    message TEXT,
                    metadata TEXT
                );

                CREATE TABLE IF NOT EXISTS fib_flow_task_attempts (
                    id BIGSERIAL PRIMARY KEY,
                    task_id BIGINT NOT NULL,
                    attempt INTEGER NOT NULL,
                    worker_id VARCHAR(255),
                    started_at BIGINT NOT NULL,
                    ended_at BIGINT,
                    outcome VARCHAR(32),
                    error TEXT,
                    timeout_flag BOOLEAN DEFAULT FALSE
                );

                CREATE TABLE IF NOT EXISTS fib_flow_workers (
                    worker_id VARCHAR(255) PRIMARY KEY,
                    pod_id VARCHAR(255) NOT NULL,
                    status VARCHAR(32) NOT NULL,
                    registered_at BIGINT NOT NULL,
                    last_seen_at BIGINT NOT NULL,
                    expires_at BIGINT NOT NULL,
                    superseded_at BIGINT,
                    dead_at BIGINT,
                    meta TEXT
                );

                -- Task scheduling index: Optimizes high-frequency task claiming queries
                -- Uses partial index to improve query performance
                CREATE INDEX IF NOT EXISTS idx_task_scheduling
                    ON fib_flow_tasks(status, next_run_time, priority DESC)
                    WHERE status = 'pending';

                -- Timeout detection index: Only indexes running tasks
                CREATE INDEX IF NOT EXISTS idx_task_timeout
                    ON fib_flow_tasks(last_active_time)
                    WHERE status = 'running';

                -- Workflow index: Supports parent-child relationship queries
                -- Uses INCLUDE to add commonly accessed fields to reduce table lookups
                CREATE INDEX IF NOT EXISTS idx_task_workflow
                    ON fib_flow_tasks(parent_id, status)
                    INCLUDE (completed_children, total_children)
                    WHERE parent_id IS NOT NULL;

                -- Task statistics index: Optimizes tag-based queries
                -- Uses B-tree index for exact matches and range scans
                CREATE INDEX IF NOT EXISTS idx_task_stats
                    ON fib_flow_tasks(tag, name, status);

                CREATE INDEX IF NOT EXISTS idx_task_last_event
                    ON fib_flow_tasks(last_event_time, last_event_type);

                CREATE INDEX IF NOT EXISTS idx_task_root_created
                    ON fib_flow_tasks(root_id, created_at)
                    WHERE root_id IS NOT NULL;

                CREATE INDEX IF NOT EXISTS idx_task_events_task_time
                    ON fib_flow_task_events(task_id, event_time);

                CREATE INDEX IF NOT EXISTS idx_task_events_root_time
                    ON fib_flow_task_events(root_id, event_time);

                CREATE INDEX IF NOT EXISTS idx_task_events_parent_time
                    ON fib_flow_task_events(parent_id, event_time)
                    WHERE parent_id IS NOT NULL;

                CREATE INDEX IF NOT EXISTS idx_task_events_type_time
                    ON fib_flow_task_events(event_type, event_time);

                CREATE INDEX IF NOT EXISTS idx_task_events_worker_time
                    ON fib_flow_task_events(worker_id, event_time)
                    WHERE worker_id IS NOT NULL;

                CREATE INDEX IF NOT EXISTS idx_task_events_stage_time
                    ON fib_flow_task_events(stage, event_time)
                    WHERE stage IS NOT NULL;

                CREATE INDEX IF NOT EXISTS idx_task_events_attempt_time
                    ON fib_flow_task_events(attempt, event_time)
                    WHERE attempt IS NOT NULL;

                CREATE INDEX IF NOT EXISTS idx_task_attempts_task_attempt
                    ON fib_flow_task_attempts(task_id, attempt);

                CREATE INDEX IF NOT EXISTS idx_task_attempts_task_open
                    ON fib_flow_task_attempts(task_id, attempt DESC)
                    WHERE ended_at IS NULL;

                CREATE INDEX IF NOT EXISTS idx_task_attempts_worker_started
                    ON fib_flow_task_attempts(worker_id, started_at)
                    WHERE worker_id IS NOT NULL;

                CREATE INDEX IF NOT EXISTS idx_task_attempts_outcome_started
                    ON fib_flow_task_attempts(outcome, started_at)
                    WHERE outcome IS NOT NULL;

                CREATE INDEX IF NOT EXISTS idx_task_workers_pod_id
                    ON fib_flow_workers(pod_id);

                CREATE INDEX IF NOT EXISTS idx_task_workers_status_expires
                    ON fib_flow_workers(status, expires_at);

                CREATE INDEX IF NOT EXISTS idx_task_workers_pod_status
                    ON fib_flow_workers(pod_id, status);
            `);

            logger.info(`[PSQLAdapter] Database schema setup completed successfully`);
        });
    }

    /**
     * Get the ID of the last inserted row in PostgreSQL
     * Uses PostgreSQL's lastval() function to retrieve the last value from a sequence
     *
     * @protected
     * @param {Object} conn - Database connection object; must be the connection
     *   that performed the insert, since lastval() is scoped to the session
     * @param {Object} rs - Result set from the previous insert operation (not
     *   consulted by this implementation)
     * @returns {number} The ID of the last inserted row
     * @throws {Error} If lastval() fails or no sequence has been used in the current session
     */
    _getLastInsertedId(conn, rs) {
        const rows = conn.execute('SELECT lastval()');
        return rows[0].lastval;
    }
}

module.exports = PSQLAdapter;