Line data Source code
1 : /*
2 : * server.c
3 : *
4 : * database server functions
5 : *
6 : * Copyright (c) 2010-2023, PostgreSQL Global Development Group
7 : * src/bin/pg_upgrade/server.c
8 : */
9 :
10 : #include "postgres_fe.h"
11 :
12 : #include "common/connect.h"
13 : #include "fe_utils/string_utils.h"
14 : #include "libpq/pqcomm.h"
15 : #include "pg_upgrade.h"
16 :
17 : static PGconn *get_db_conn(ClusterInfo *cluster, const char *db_name);
18 :
19 :
20 : /*
21 : * connectToServer()
22 : *
23 : * Connects to the desired database on the designated server.
24 : * If the connection attempt fails, this function logs an error
25 : * message and calls exit() to kill the program.
26 : */
27 : PGconn *
28 392 : connectToServer(ClusterInfo *cluster, const char *db_name)
29 : {
30 392 : PGconn *conn = get_db_conn(cluster, db_name);
31 :
32 392 : if (conn == NULL || PQstatus(conn) != CONNECTION_OK)
33 : {
34 2 : pg_log(PG_REPORT, "%s", PQerrorMessage(conn));
35 :
36 2 : if (conn)
37 2 : PQfinish(conn);
38 :
39 2 : printf(_("Failure, exiting\n"));
40 2 : exit(1);
41 : }
42 :
43 390 : PQclear(executeQueryOrDie(conn, ALWAYS_SECURE_SEARCH_PATH_SQL));
44 :
45 390 : return conn;
46 : }
47 :
48 :
49 : /*
50 : * get_db_conn()
51 : *
52 : * get database connection, using named database + standard params for cluster
53 : *
54 : * Caller must check for connection failure!
55 : */
56 : static PGconn *
57 422 : get_db_conn(ClusterInfo *cluster, const char *db_name)
58 : {
59 : PQExpBufferData conn_opts;
60 : PGconn *conn;
61 :
62 : /* Build connection string with proper quoting */
63 422 : initPQExpBuffer(&conn_opts);
64 422 : appendPQExpBufferStr(&conn_opts, "dbname=");
65 422 : appendConnStrVal(&conn_opts, db_name);
66 422 : appendPQExpBufferStr(&conn_opts, " user=");
67 422 : appendConnStrVal(&conn_opts, os_info.user);
68 422 : appendPQExpBuffer(&conn_opts, " port=%d", cluster->port);
69 422 : if (cluster->sockdir)
70 : {
71 422 : appendPQExpBufferStr(&conn_opts, " host=");
72 422 : appendConnStrVal(&conn_opts, cluster->sockdir);
73 : }
74 :
75 422 : conn = PQconnectdb(conn_opts.data);
76 422 : termPQExpBuffer(&conn_opts);
77 422 : return conn;
78 : }
79 :
80 :
81 : /*
82 : * cluster_conn_opts()
83 : *
84 : * Return standard command-line options for connecting to this cluster when
85 : * using psql, pg_dump, etc. Ideally this would match what get_db_conn()
86 : * sets, but the utilities we need aren't very consistent about the treatment
87 : * of database name options, so we leave that out.
88 : *
89 : * Result is valid until the next call to this function.
90 : */
91 : char *
92 54 : cluster_conn_opts(ClusterInfo *cluster)
93 : {
94 : static PQExpBuffer buf;
95 :
96 54 : if (buf == NULL)
97 6 : buf = createPQExpBuffer();
98 : else
99 48 : resetPQExpBuffer(buf);
100 :
101 54 : if (cluster->sockdir)
102 : {
103 54 : appendPQExpBufferStr(buf, "--host ");
104 54 : appendShellString(buf, cluster->sockdir);
105 54 : appendPQExpBufferChar(buf, ' ');
106 : }
107 54 : appendPQExpBuffer(buf, "--port %d --username ", cluster->port);
108 54 : appendShellString(buf, os_info.user);
109 :
110 54 : return buf->data;
111 : }
112 :
113 :
114 : /*
115 : * executeQueryOrDie()
116 : *
117 : * Formats a query string from the given arguments and executes the
118 : * resulting query. If the query fails, this function logs an error
119 : * message and calls exit() to kill the program.
120 : */
121 : PGresult *
122 822 : executeQueryOrDie(PGconn *conn, const char *fmt,...)
123 : {
124 : static char query[QUERY_ALLOC];
125 : va_list args;
126 : PGresult *result;
127 : ExecStatusType status;
128 :
129 822 : va_start(args, fmt);
130 822 : vsnprintf(query, sizeof(query), fmt, args);
131 822 : va_end(args);
132 :
133 822 : pg_log(PG_VERBOSE, "executing: %s", query);
134 822 : result = PQexec(conn, query);
135 822 : status = PQresultStatus(result);
136 :
137 822 : if ((status != PGRES_TUPLES_OK) && (status != PGRES_COMMAND_OK))
138 : {
139 0 : pg_log(PG_REPORT, "SQL command failed\n%s\n%s", query,
140 : PQerrorMessage(conn));
141 0 : PQclear(result);
142 0 : PQfinish(conn);
143 0 : printf(_("Failure, exiting\n"));
144 0 : exit(1);
145 : }
146 : else
147 822 : return result;
148 : }
149 :
150 :
151 : /*
152 : * get_major_server_version()
153 : *
154 : * gets the version (in unsigned int form) for the given datadir. Assumes
155 : * that datadir is an absolute path to a valid pgdata directory. The version
156 : * is retrieved by reading the PG_VERSION file.
157 : */
158 : uint32
159 24 : get_major_server_version(ClusterInfo *cluster)
160 : {
161 : FILE *version_fd;
162 : char ver_filename[MAXPGPATH];
163 24 : int v1 = 0,
164 24 : v2 = 0;
165 :
166 24 : snprintf(ver_filename, sizeof(ver_filename), "%s/PG_VERSION",
167 : cluster->pgdata);
168 24 : if ((version_fd = fopen(ver_filename, "r")) == NULL)
169 0 : pg_fatal("could not open version file \"%s\": %m", ver_filename);
170 :
171 24 : if (fscanf(version_fd, "%63s", cluster->major_version_str) == 0 ||
172 24 : sscanf(cluster->major_version_str, "%d.%d", &v1, &v2) < 1)
173 0 : pg_fatal("could not parse version file \"%s\"", ver_filename);
174 :
175 24 : fclose(version_fd);
176 :
177 24 : if (v1 < 10)
178 : {
179 : /* old style, e.g. 9.6.1 */
180 0 : return v1 * 10000 + v2 * 100;
181 : }
182 : else
183 : {
184 : /* new style, e.g. 10.1 */
185 24 : return v1 * 10000;
186 : }
187 : }
188 :
189 :
190 : static void
191 12 : stop_postmaster_atexit(void)
192 : {
193 12 : stop_postmaster(true);
194 12 : }
195 :
196 :
197 : bool
198 30 : start_postmaster(ClusterInfo *cluster, bool report_and_exit_on_error)
199 : {
200 : char cmd[MAXPGPATH * 4 + 1000];
201 : PGconn *conn;
202 30 : bool pg_ctl_return = false;
203 : char socket_string[MAXPGPATH + 200];
204 : PQExpBufferData pgoptions;
205 :
206 : static bool exit_hook_registered = false;
207 :
208 30 : if (!exit_hook_registered)
209 : {
210 12 : atexit(stop_postmaster_atexit);
211 12 : exit_hook_registered = true;
212 : }
213 :
214 30 : socket_string[0] = '\0';
215 :
216 : #if !defined(WIN32)
217 : /* prevent TCP/IP connections, restrict socket access */
218 30 : strcat(socket_string,
219 : " -c listen_addresses='' -c unix_socket_permissions=0700");
220 :
221 : /* Have a sockdir? Tell the postmaster. */
222 30 : if (cluster->sockdir)
223 30 : snprintf(socket_string + strlen(socket_string),
224 30 : sizeof(socket_string) - strlen(socket_string),
225 : " -c %s='%s'",
226 30 : (GET_MAJOR_VERSION(cluster->major_version) <= 902) ?
227 : "unix_socket_directory" : "unix_socket_directories",
228 : cluster->sockdir);
229 : #endif
230 :
231 30 : initPQExpBuffer(&pgoptions);
232 :
233 : /*
234 : * Construct a parameter string which is passed to the server process.
235 : *
236 : * Turn off durability requirements to improve object creation speed, and
237 : * we only modify the new cluster, so only use it there. If there is a
238 : * crash, the new cluster has to be recreated anyway. fsync=off is a big
239 : * win on ext4.
240 : */
241 30 : if (cluster == &new_cluster)
242 18 : appendPQExpBufferStr(&pgoptions, " -c synchronous_commit=off -c fsync=off -c full_page_writes=off");
243 :
244 : /*
245 : * Use max_slot_wal_keep_size as -1 to prevent the WAL removal by the
246 : * checkpointer process. If WALs required by logical replication slots
247 : * are removed, the slots are unusable. This setting prevents the
248 : * invalidation of slots during the upgrade. We set this option when
249 : * cluster is PG17 or later because logical replication slots can only be
250 : * migrated since then. Besides, max_slot_wal_keep_size is added in PG13.
251 : *
252 : * Use max_logical_replication_workers as 0 to prevent a startup of the
253 : * logical replication launcher while upgrading because it may start apply
254 : * workers that could start receiving changes from the publisher before
255 : * the physical files are put in place, causing corruption on the new
256 : * cluster upgrading to. Like the previous parameter, this is set only
257 : * when a cluster is PG17 or later as logical slots can only be migrated
258 : * since this version.
259 : */
260 30 : if (GET_MAJOR_VERSION(cluster->major_version) >= 1700)
261 30 : appendPQExpBufferStr(&pgoptions, " -c max_slot_wal_keep_size=-1 -c max_logical_replication_workers=0");
262 :
263 : /* Use -b to disable autovacuum. */
264 30 : snprintf(cmd, sizeof(cmd),
265 : "\"%s/pg_ctl\" -w -l \"%s/%s\" -D \"%s\" -o \"-p %d -b%s %s%s\" start",
266 : cluster->bindir,
267 : log_opts.logdir,
268 30 : SERVER_LOG_FILE, cluster->pgconfig, cluster->port,
269 : pgoptions.data,
270 30 : cluster->pgopts ? cluster->pgopts : "", socket_string);
271 :
272 30 : termPQExpBuffer(&pgoptions);
273 :
274 : /*
275 : * Don't throw an error right away, let connecting throw the error because
276 : * it might supply a reason for the failure.
277 : */
278 30 : pg_ctl_return = exec_prog(SERVER_START_LOG_FILE,
279 : /* pass both file names if they differ */
280 : (strcmp(SERVER_LOG_FILE,
281 : SERVER_START_LOG_FILE) != 0) ?
282 : SERVER_LOG_FILE : NULL,
283 : report_and_exit_on_error, false,
284 : "%s", cmd);
285 :
286 : /* Did it fail and we are just testing if the server could be started? */
287 30 : if (!pg_ctl_return && !report_and_exit_on_error)
288 0 : return false;
289 :
290 : /*
291 : * We set this here to make sure atexit() shuts down the server, but only
292 : * if we started the server successfully. We do it before checking for
293 : * connectivity in case the server started but there is a connectivity
294 : * failure. If pg_ctl did not return success, we will exit below.
295 : *
296 : * Pre-9.1 servers do not have PQping(), so we could be leaving the server
297 : * running if authentication was misconfigured, so someday we might went
298 : * to be more aggressive about doing server shutdowns even if pg_ctl
299 : * fails, but now (2013-08-14) it seems prudent to be cautious. We don't
300 : * want to shutdown a server that might have been accidentally started
301 : * during the upgrade.
302 : */
303 30 : if (pg_ctl_return)
304 30 : os_info.running_cluster = cluster;
305 :
306 : /*
307 : * pg_ctl -w might have failed because the server couldn't be started, or
308 : * there might have been a connection problem in _checking_ if the server
309 : * has started. Therefore, even if pg_ctl failed, we continue and test
310 : * for connectivity in case we get a connection reason for the failure.
311 : */
312 60 : if ((conn = get_db_conn(cluster, "template1")) == NULL ||
313 30 : PQstatus(conn) != CONNECTION_OK)
314 : {
315 0 : pg_log(PG_REPORT, "\n%s", PQerrorMessage(conn));
316 0 : if (conn)
317 0 : PQfinish(conn);
318 0 : if (cluster == &old_cluster)
319 0 : pg_fatal("could not connect to source postmaster started with the command:\n"
320 : "%s",
321 : cmd);
322 : else
323 0 : pg_fatal("could not connect to target postmaster started with the command:\n"
324 : "%s",
325 : cmd);
326 : }
327 30 : PQfinish(conn);
328 :
329 : /*
330 : * If pg_ctl failed, and the connection didn't fail, and
331 : * report_and_exit_on_error is enabled, fail now. This could happen if
332 : * the server was already running.
333 : */
334 30 : if (!pg_ctl_return)
335 : {
336 0 : if (cluster == &old_cluster)
337 0 : pg_fatal("pg_ctl failed to start the source server, or connection failed");
338 : else
339 0 : pg_fatal("pg_ctl failed to start the target server, or connection failed");
340 : }
341 :
342 30 : return true;
343 : }
344 :
345 :
346 : void
347 36 : stop_postmaster(bool in_atexit)
348 : {
349 : ClusterInfo *cluster;
350 :
351 36 : if (os_info.running_cluster == &old_cluster)
352 12 : cluster = &old_cluster;
353 24 : else if (os_info.running_cluster == &new_cluster)
354 18 : cluster = &new_cluster;
355 : else
356 6 : return; /* no cluster running */
357 :
358 60 : exec_prog(SERVER_STOP_LOG_FILE, NULL, !in_atexit, !in_atexit,
359 : "\"%s/pg_ctl\" -w -D \"%s\" -o \"%s\" %s stop",
360 : cluster->bindir, cluster->pgconfig,
361 30 : cluster->pgopts ? cluster->pgopts : "",
362 30 : in_atexit ? "-m fast" : "-m smart");
363 :
364 30 : os_info.running_cluster = NULL;
365 : }
366 :
367 :
368 : /*
369 : * check_pghost_envvar()
370 : *
371 : * Tests that PGHOST does not point to a non-local server
372 : */
373 : void
374 14 : check_pghost_envvar(void)
375 : {
376 : PQconninfoOption *option;
377 : PQconninfoOption *start;
378 :
379 : /* Get valid libpq env vars from the PQconndefaults function */
380 :
381 14 : start = PQconndefaults();
382 :
383 14 : if (!start)
384 0 : pg_fatal("out of memory");
385 :
386 574 : for (option = start; option->keyword != NULL; option++)
387 : {
388 560 : if (option->envvar && (strcmp(option->envvar, "PGHOST") == 0 ||
389 434 : strcmp(option->envvar, "PGHOSTADDR") == 0))
390 : {
391 28 : const char *value = getenv(option->envvar);
392 :
393 28 : if (value && strlen(value) > 0 &&
394 : /* check for 'local' host values */
395 14 : (strcmp(value, "localhost") != 0 && strcmp(value, "127.0.0.1") != 0 &&
396 14 : strcmp(value, "::1") != 0 && !is_unixsock_path(value)))
397 0 : pg_fatal("libpq environment variable %s has a non-local server value: %s",
398 : option->envvar, value);
399 : }
400 : }
401 :
402 : /* Free the memory that libpq allocated on our behalf */
403 14 : PQconninfoFree(start);
404 14 : }
|