PostgreSQL Source Code git master
task.c
Go to the documentation of this file.
1/*
2 * task.c
3 * framework for parallelizing pg_upgrade's once-in-each-database tasks
4 *
5 * This framework provides an efficient way of running the various
6 * once-in-each-database tasks required by pg_upgrade. Specifically, it
7 * parallelizes these tasks by managing a set of slots that follow a simple
8 * state machine and by using libpq's asynchronous APIs to establish the
9 * connections and run the queries. Callers simply need to create a callback
10 * function and build/execute an UpgradeTask. A simple example follows:
11 *
12 * static void
13 * my_process_cb(DbInfo *dbinfo, PGresult *res, void *arg)
14 * {
15 * for (int i = 0; i < PQntuples(res); i++)
16 * {
17 * ... process results ...
18 * }
19 * }
20 *
21 * void
22 * my_task(ClusterInfo *cluster)
23 * {
24 * UpgradeTask *task = upgrade_task_create();
25 *
26 * upgrade_task_add_step(task,
27 * "... query text ...",
28 * my_process_cb,
29 * true, // let the task free the PGresult
30 * NULL); // "arg" pointer for callback
31 * upgrade_task_run(task, cluster);
32 * upgrade_task_free(task);
33 * }
34 *
35 * Note that multiple steps can be added to a given task. When there are
36 * multiple steps, the task will run all of the steps consecutively in the same
37 * database connection before freeing the connection and moving on. In other
38 * words, it only ever initiates one connection to each database in the
39 * cluster for a given run.
40 *
41 * Copyright (c) 2024-2025, PostgreSQL Global Development Group
42 * src/bin/pg_upgrade/task.c
43 */
44
45#include "postgres_fe.h"
46
47#include "common/connect.h"
49#include "pg_upgrade.h"
50
51/*
52 * dbs_complete stores the number of databases that we have completed
53 * processing. When this value equals the number of databases in the cluster,
54 * the task is finished.
55 */
56static int dbs_complete;
57
58/*
59 * dbs_processing stores the index of the next database in the cluster's array
60 * of databases that will be picked up for processing. It will always be
61 * greater than or equal to dbs_complete.
62 */
63static int dbs_processing;
64
65/*
66 * This struct stores the information for a single step of a task. Note that
67 * the query string is stored in the "queries" PQExpBuffer for the UpgradeTask.
68 * All steps in a task are run in a single connection before moving on to the
69 * next database (which requires a new connection).
70 */
71typedef struct UpgradeTaskStep
72{
73 UpgradeTaskProcessCB process_cb; /* processes the results of the query */
74 bool free_result; /* should we free the result? */
75 void *arg; /* pointer passed to process_cb */
77
78/*
79 * This struct is a thin wrapper around an array of steps, i.e.,
80 * UpgradeTaskStep, plus a PQExpBuffer for all the query strings.
81 */
83{
87};
88
89/*
90 * The different states for a parallel slot.
91 */
93{
94 FREE, /* slot available for use in a new database */
95 CONNECTING, /* waiting for connection to be established */
96 RUNNING_QUERIES, /* running/processing queries in the task */
98
99/*
100 * We maintain an array of user_opts.jobs slots to execute the task.
101 */
102typedef struct UpgradeTaskSlot
103{
104 UpgradeTaskSlotState state; /* state of the slot */
105 int db_idx; /* index of the database assigned to slot */
106 int step_idx; /* index of the current step of task */
107 PGconn *conn; /* current connection managed by slot */
108 bool ready; /* slot is ready for processing */
109 bool select_mode; /* select() mode: true->read, false->write */
110 int sock; /* file descriptor for connection's socket */
112
113/*
114 * Initializes an UpgradeTask.
115 */
118{
119 UpgradeTask *task = pg_malloc0(sizeof(UpgradeTask));
120
121 task->queries = createPQExpBuffer();
122
123 /* All tasks must first set a secure search_path. */
125
126 return task;
127}
128
129/*
130 * Frees all storage associated with an UpgradeTask.
131 */
132void
134{
136 pg_free(task->steps);
137 pg_free(task);
138}
139
140/*
141 * Adds a step to an UpgradeTask. The steps will be executed in each database
142 * in the order in which they are added.
143 *
144 * task: task object that must have been initialized via upgrade_task_create()
145 * query: the query text
146 * process_cb: function that processes the results of the query
147 * free_result: should we free the PGresult, or leave it to the caller?
148 * arg: pointer to task-specific data that is passed to each callback
149 */
150void
151upgrade_task_add_step(UpgradeTask *task, const char *query,
152 UpgradeTaskProcessCB process_cb, bool free_result,
153 void *arg)
154{
155 UpgradeTaskStep *new_step;
156
157 task->steps = pg_realloc(task->steps,
158 ++task->num_steps * sizeof(UpgradeTaskStep));
159
160 new_step = &task->steps[task->num_steps - 1];
161 new_step->process_cb = process_cb;
162 new_step->free_result = free_result;
163 new_step->arg = arg;
164
165 appendPQExpBuffer(task->queries, "%s;", query);
166}
167
168/*
169 * Build a connection string for the slot's current database and asynchronously
170 * start a new connection, but do not wait for the connection to be
171 * established.
172 */
173static void
175{
176 PQExpBufferData conn_opts;
177 DbInfo *dbinfo = &cluster->dbarr.dbs[slot->db_idx];
178
179 /* Build connection string with proper quoting */
180 initPQExpBuffer(&conn_opts);
181 appendPQExpBufferStr(&conn_opts, "dbname=");
182 appendConnStrVal(&conn_opts, dbinfo->db_name);
183 appendPQExpBufferStr(&conn_opts, " user=");
184 appendConnStrVal(&conn_opts, os_info.user);
185 appendPQExpBuffer(&conn_opts, " port=%d", cluster->port);
186 if (cluster->sockdir)
187 {
188 appendPQExpBufferStr(&conn_opts, " host=");
189 appendConnStrVal(&conn_opts, cluster->sockdir);
190 }
191
192 slot->conn = PQconnectStart(conn_opts.data);
193
194 if (!slot->conn)
195 pg_fatal("out of memory");
196
197 termPQExpBuffer(&conn_opts);
198}
199
200/*
201 * Run the process_cb callback function to process the result of a query, and
202 * free the result if the caller indicated we should do so.
203 */
204static void
206 const UpgradeTask *task)
207{
208 UpgradeTaskStep *steps = &task->steps[slot->step_idx];
209 UpgradeTaskProcessCB process_cb = steps->process_cb;
210 DbInfo *dbinfo = &cluster->dbarr.dbs[slot->db_idx];
211 PGresult *res = PQgetResult(slot->conn);
212
213 if (PQstatus(slot->conn) == CONNECTION_BAD ||
216 pg_fatal("connection failure: %s", PQerrorMessage(slot->conn));
217
218 /*
219 * We assume that a NULL process_cb callback function means there's
220 * nothing to process. This is primarily intended for the initial step in
221 * every task that sets a safe search_path.
222 */
223 if (process_cb)
224 (*process_cb) (dbinfo, res, steps->arg);
225
226 if (steps->free_result)
227 PQclear(res);
228}
229
230/*
231 * Advances the state machine for a given slot as necessary.
232 */
233static void
235{
237
238 if (!slot->ready)
239 return;
240
241 switch (slot->state)
242 {
243 case FREE:
244
245 /*
246 * If all of the databases in the cluster have been processed or
247 * are currently being processed by other slots, we are done.
248 */
249 if (dbs_processing >= cluster->dbarr.ndbs)
250 return;
251
252 /*
253 * Claim the next database in the cluster's array and initiate a
254 * new connection.
255 */
256 slot->db_idx = dbs_processing++;
257 slot->state = CONNECTING;
258 start_conn(cluster, slot);
259
260 return;
261
262 case CONNECTING:
263
264 /* Check for connection failure. */
265 status = PQconnectPoll(slot->conn);
266 if (status == PGRES_POLLING_FAILED)
267 pg_fatal("connection failure: %s", PQerrorMessage(slot->conn));
268
269 /* Check whether the connection is still establishing. */
270 if (status != PGRES_POLLING_OK)
271 {
272 slot->select_mode = (status == PGRES_POLLING_READING);
273 return;
274 }
275
276 /*
277 * Move on to running/processing the queries in the task.
278 */
279 slot->state = RUNNING_QUERIES;
280 slot->select_mode = true; /* wait until ready for reading */
281 if (!PQsendQuery(slot->conn, task->queries->data))
282 pg_fatal("connection failure: %s", PQerrorMessage(slot->conn));
283
284 return;
285
286 case RUNNING_QUERIES:
287
288 /*
289 * Consume any available data and clear the read-ready indicator
290 * for the connection.
291 */
292 if (!PQconsumeInput(slot->conn))
293 pg_fatal("connection failure: %s", PQerrorMessage(slot->conn));
294
295 /*
296 * Process any results that are ready so that we can free up this
297 * slot for another database as soon as possible.
298 */
299 for (; slot->step_idx < task->num_steps; slot->step_idx++)
300 {
301 /* If no more results are available yet, move on. */
302 if (PQisBusy(slot->conn))
303 return;
304
305 process_query_result(cluster, slot, task);
306 }
307
308 /*
309 * If we just finished processing the result of the last step in
310 * the task, free the slot. We recursively call this function on
311 * the newly-freed slot so that we can start initiating the next
312 * connection immediately instead of waiting for the next loop
313 * through the slots.
314 */
315 dbs_complete++;
316 PQfinish(slot->conn);
317 memset(slot, 0, sizeof(UpgradeTaskSlot));
318 slot->ready = true;
319
320 process_slot(cluster, slot, task);
321
322 return;
323 }
324}
325
326/*
327 * Returns -1 on error, else the number of ready descriptors.
328 */
329static int
330select_loop(int maxFd, fd_set *input, fd_set *output)
331{
332 fd_set save_input = *input;
333 fd_set save_output = *output;
334
335 if (maxFd == 0)
336 return 0;
337
338 for (;;)
339 {
340 int i;
341
342 *input = save_input;
343 *output = save_output;
344
345 i = select(maxFd + 1, input, output, NULL, NULL);
346
347#ifndef WIN32
348 if (i < 0 && errno == EINTR)
349 continue;
350#else
351 if (i == SOCKET_ERROR && WSAGetLastError() == WSAEINTR)
352 continue;
353#endif
354 return i;
355 }
356}
357
358/*
359 * Wait on the slots to either finish connecting or to receive query results if
360 * possible. This avoids a tight loop in upgrade_task_run().
361 */
362static void
363wait_on_slots(UpgradeTaskSlot *slots, int numslots)
364{
365 fd_set input;
366 fd_set output;
367 int maxFd = 0;
368
369 FD_ZERO(&input);
370 FD_ZERO(&output);
371
372 for (int i = 0; i < numslots; i++)
373 {
374 /*
375 * We assume the previous call to process_slot() handled everything
376 * that was marked ready in the previous call to wait_on_slots(), if
377 * any.
378 */
379 slots[i].ready = false;
380
381 /*
382 * This function should only ever see free slots as we are finishing
383 * processing the last few databases, at which point we don't have any
384 * databases left for them to process. We'll never use these slots
385 * again, so we can safely ignore them.
386 */
387 if (slots[i].state == FREE)
388 continue;
389
390 /*
391 * Add the socket to the set.
392 */
393 slots[i].sock = PQsocket(slots[i].conn);
394 if (slots[i].sock < 0)
395 pg_fatal("invalid socket");
396 FD_SET(slots[i].sock, slots[i].select_mode ? &input : &output);
397 maxFd = Max(maxFd, slots[i].sock);
398 }
399
400 /*
401 * If we found socket(s) to wait on, wait.
402 */
403 if (select_loop(maxFd, &input, &output) == -1)
404 pg_fatal("%s() failed: %m", "select");
405
406 /*
407 * Mark which sockets appear to be ready.
408 */
409 for (int i = 0; i < numslots; i++)
410 slots[i].ready |= (FD_ISSET(slots[i].sock, &input) ||
411 FD_ISSET(slots[i].sock, &output));
412}
413
414/*
415 * Runs all the steps of the task in every database in the cluster using
416 * user_opts.jobs parallel slots.
417 */
418void
420{
421 int jobs = Max(1, user_opts.jobs);
422 UpgradeTaskSlot *slots = pg_malloc0(sizeof(UpgradeTaskSlot) * jobs);
423
424 dbs_complete = 0;
425 dbs_processing = 0;
426
427 /*
428 * Process every slot the first time round.
429 */
430 for (int i = 0; i < jobs; i++)
431 slots[i].ready = true;
432
433 while (dbs_complete < cluster->dbarr.ndbs)
434 {
435 for (int i = 0; i < jobs; i++)
436 process_slot(cluster, &slots[i], task);
437
438 wait_on_slots(slots, jobs);
439 }
440
441 pg_free(slots);
442}
#define Max(x, y)
Definition: c.h:1002
void cluster(ParseState *pstate, ClusterStmt *stmt, bool isTopLevel)
Definition: cluster.c:107
#define ALWAYS_SECURE_SEARCH_PATH_SQL
Definition: connect.h:25
PostgresPollingStatusType PQconnectPoll(PGconn *conn)
Definition: fe-connect.c:2922
ConnStatusType PQstatus(const PGconn *conn)
Definition: fe-connect.c:7641
PGconn * PQconnectStart(const char *conninfo)
Definition: fe-connect.c:953
void PQfinish(PGconn *conn)
Definition: fe-connect.c:5316
char * PQerrorMessage(const PGconn *conn)
Definition: fe-connect.c:7704
int PQsocket(const PGconn *conn)
Definition: fe-connect.c:7730
int PQconsumeInput(PGconn *conn)
Definition: fe-exec.c:2000
int PQsendQuery(PGconn *conn, const char *query)
Definition: fe-exec.c:1432
int PQisBusy(PGconn *conn)
Definition: fe-exec.c:2047
void * pg_malloc0(size_t size)
Definition: fe_memutils.c:53
void pg_free(void *ptr)
Definition: fe_memutils.c:105
void * pg_realloc(void *ptr, size_t size)
Definition: fe_memutils.c:65
FILE * input
FILE * output
int i
Definition: isn.c:77
#define PQgetResult
Definition: libpq-be-fe.h:246
#define PQclear
Definition: libpq-be-fe.h:245
#define PQresultStatus
Definition: libpq-be-fe.h:247
@ CONNECTION_BAD
Definition: libpq-fe.h:85
@ PGRES_COMMAND_OK
Definition: libpq-fe.h:125
@ PGRES_TUPLES_OK
Definition: libpq-fe.h:128
PostgresPollingStatusType
Definition: libpq-fe.h:114
@ PGRES_POLLING_OK
Definition: libpq-fe.h:118
@ PGRES_POLLING_READING
Definition: libpq-fe.h:116
@ PGRES_POLLING_FAILED
Definition: libpq-fe.h:115
void * arg
#define pg_fatal(...)
OSInfo os_info
Definition: pg_upgrade.c:74
void(* UpgradeTaskProcessCB)(DbInfo *dbinfo, PGresult *res, void *arg)
Definition: pg_upgrade.h:512
PQExpBuffer createPQExpBuffer(void)
Definition: pqexpbuffer.c:72
void initPQExpBuffer(PQExpBuffer str)
Definition: pqexpbuffer.c:90
void appendPQExpBuffer(PQExpBuffer str, const char *fmt,...)
Definition: pqexpbuffer.c:265
void destroyPQExpBuffer(PQExpBuffer str)
Definition: pqexpbuffer.c:114
void appendPQExpBufferStr(PQExpBuffer str, const char *data)
Definition: pqexpbuffer.c:367
void termPQExpBuffer(PQExpBuffer str)
Definition: pqexpbuffer.c:129
UserOpts user_opts
Definition: option.c:30
PGconn * conn
Definition: streamutil.c:52
void appendConnStrVal(PQExpBuffer buf, const char *str)
Definition: string_utils.c:698
char * db_name
Definition: pg_upgrade.h:199
char * user
Definition: pg_upgrade.h:359
int step_idx
Definition: task.c:106
int db_idx
Definition: task.c:105
PGconn * conn
Definition: task.c:107
bool select_mode
Definition: task.c:109
UpgradeTaskSlotState state
Definition: task.c:104
bool ready
Definition: task.c:108
bool free_result
Definition: task.c:74
UpgradeTaskProcessCB process_cb
Definition: task.c:73
void * arg
Definition: task.c:75
PQExpBuffer queries
Definition: task.c:86
UpgradeTaskStep * steps
Definition: task.c:84
int num_steps
Definition: task.c:85
int jobs
Definition: pg_upgrade.h:338
Definition: regguts.h:323
static int dbs_processing
Definition: task.c:63
UpgradeTask * upgrade_task_create(void)
Definition: task.c:117
static void wait_on_slots(UpgradeTaskSlot *slots, int numslots)
Definition: task.c:363
static int dbs_complete
Definition: task.c:56
struct UpgradeTaskSlot UpgradeTaskSlot
struct UpgradeTaskStep UpgradeTaskStep
UpgradeTaskSlotState
Definition: task.c:93
@ CONNECTING
Definition: task.c:95
@ RUNNING_QUERIES
Definition: task.c:96
@ FREE
Definition: task.c:94
void upgrade_task_run(const UpgradeTask *task, const ClusterInfo *cluster)
Definition: task.c:419
static void process_slot(const ClusterInfo *cluster, UpgradeTaskSlot *slot, const UpgradeTask *task)
Definition: task.c:234
static void start_conn(const ClusterInfo *cluster, UpgradeTaskSlot *slot)
Definition: task.c:174
static int select_loop(int maxFd, fd_set *input, fd_set *output)
Definition: task.c:330
void upgrade_task_free(UpgradeTask *task)
Definition: task.c:133
static void process_query_result(const ClusterInfo *cluster, UpgradeTaskSlot *slot, const UpgradeTask *task)
Definition: task.c:205
void upgrade_task_add_step(UpgradeTask *task, const char *query, UpgradeTaskProcessCB process_cb, bool free_result, void *arg)
Definition: task.c:151
#define EINTR
Definition: win32_port.h:364
#define select(n, r, w, e, timeout)
Definition: win32_port.h:503