Line data Source code
1 : /*
2 : * pgbench.c
3 : *
4 : * A simple benchmark program for PostgreSQL
5 : * Originally written by Tatsuo Ishii and enhanced by many contributors.
6 : *
7 : * src/bin/pgbench/pgbench.c
8 : * Copyright (c) 2000-2025, PostgreSQL Global Development Group
9 : * ALL RIGHTS RESERVED;
10 : *
11 : * Permission to use, copy, modify, and distribute this software and its
12 : * documentation for any purpose, without fee, and without a written agreement
13 : * is hereby granted, provided that the above copyright notice and this
14 : * paragraph and the following two paragraphs appear in all copies.
15 : *
16 : * IN NO EVENT SHALL THE AUTHOR OR DISTRIBUTORS BE LIABLE TO ANY PARTY FOR
17 : * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES, INCLUDING
18 : * LOST PROFITS, ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS
19 : * DOCUMENTATION, EVEN IF THE AUTHOR OR DISTRIBUTORS HAVE BEEN ADVISED OF THE
20 : * POSSIBILITY OF SUCH DAMAGE.
21 : *
22 : * THE AUTHOR AND DISTRIBUTORS SPECIFICALLY DISCLAIMS ANY WARRANTIES,
23 : * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY
24 : * AND FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
25 : * ON AN "AS IS" BASIS, AND THE AUTHOR AND DISTRIBUTORS HAS NO OBLIGATIONS TO
26 : * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
27 : *
28 : */
29 :
30 : #if defined(WIN32) && FD_SETSIZE < 1024
31 : #error FD_SETSIZE needs to have been increased
32 : #endif
33 :
34 : #include "postgres_fe.h"
35 :
36 : #include <ctype.h>
37 : #include <float.h>
38 : #include <limits.h>
39 : #include <math.h>
40 : #include <signal.h>
41 : #include <time.h>
42 : #include <sys/time.h>
43 : #include <sys/resource.h> /* for getrlimit */
44 :
45 : /* For testing, PGBENCH_USE_SELECT can be defined to force use of that code */
46 : #if defined(HAVE_PPOLL) && !defined(PGBENCH_USE_SELECT)
47 : #define POLL_USING_PPOLL
48 : #ifdef HAVE_POLL_H
49 : #include <poll.h>
50 : #endif
51 : #else /* no ppoll(), so use select() */
52 : #define POLL_USING_SELECT
53 : #include <sys/select.h>
54 : #endif
55 :
56 : #include "catalog/pg_class_d.h"
57 : #include "common/int.h"
58 : #include "common/logging.h"
59 : #include "common/pg_prng.h"
60 : #include "common/string.h"
61 : #include "common/username.h"
62 : #include "fe_utils/cancel.h"
63 : #include "fe_utils/conditional.h"
64 : #include "fe_utils/option_utils.h"
65 : #include "fe_utils/string_utils.h"
66 : #include "getopt_long.h"
67 : #include "libpq-fe.h"
68 : #include "pgbench.h"
69 : #include "port/pg_bitutils.h"
70 : #include "portability/instr_time.h"
71 :
72 : /* X/Open (XSI) requires <math.h> to provide M_PI, but core POSIX does not */
73 : #ifndef M_PI
74 : #define M_PI 3.14159265358979323846
75 : #endif
76 :
77 : #define ERRCODE_T_R_SERIALIZATION_FAILURE "40001"
78 : #define ERRCODE_T_R_DEADLOCK_DETECTED "40P01"
79 : #define ERRCODE_UNDEFINED_TABLE "42P01"
80 :
81 : /*
82 : * Hashing constants
83 : */
84 : #define FNV_PRIME UINT64CONST(0x100000001b3)
85 : #define FNV_OFFSET_BASIS UINT64CONST(0xcbf29ce484222325)
86 : #define MM2_MUL UINT64CONST(0xc6a4a7935bd1e995)
87 : #define MM2_MUL_TIMES_8 UINT64CONST(0x35253c9ade8f4ca8)
88 : #define MM2_ROT 47
89 :
90 : /*
91 : * Multi-platform socket set implementations
92 : */
93 :
94 : #ifdef POLL_USING_PPOLL
95 : #define SOCKET_WAIT_METHOD "ppoll"
96 :
97 : typedef struct socket_set
98 : {
99 : int maxfds; /* allocated length of pollfds[] array */
100 : int curfds; /* number currently in use */
101 : struct pollfd pollfds[FLEXIBLE_ARRAY_MEMBER];
102 : } socket_set;
103 :
104 : #endif /* POLL_USING_PPOLL */
105 :
106 : #ifdef POLL_USING_SELECT
107 : #define SOCKET_WAIT_METHOD "select"
108 :
109 : typedef struct socket_set
110 : {
111 : int maxfd; /* largest FD currently set in fds */
112 : fd_set fds;
113 : } socket_set;
114 :
115 : #endif /* POLL_USING_SELECT */
116 :
117 : /*
118 : * Multi-platform thread implementations
119 : */
120 :
121 : #ifdef WIN32
122 : /* Use Windows threads */
123 : #include <windows.h>
124 : #define GETERRNO() (_dosmaperr(GetLastError()), errno)
125 : #define THREAD_T HANDLE
126 : #define THREAD_FUNC_RETURN_TYPE unsigned
127 : #define THREAD_FUNC_RETURN return 0
128 : #define THREAD_FUNC_CC __stdcall
129 : #define THREAD_CREATE(handle, function, arg) \
130 : ((*(handle) = (HANDLE) _beginthreadex(NULL, 0, (function), (arg), 0, NULL)) == 0 ? errno : 0)
131 : #define THREAD_JOIN(handle) \
132 : (WaitForSingleObject(handle, INFINITE) != WAIT_OBJECT_0 ? \
133 : GETERRNO() : CloseHandle(handle) ? 0 : GETERRNO())
134 : #define THREAD_BARRIER_T SYNCHRONIZATION_BARRIER
135 : #define THREAD_BARRIER_INIT(barrier, n) \
136 : (InitializeSynchronizationBarrier((barrier), (n), 0) ? 0 : GETERRNO())
137 : #define THREAD_BARRIER_WAIT(barrier) \
138 : EnterSynchronizationBarrier((barrier), \
139 : SYNCHRONIZATION_BARRIER_FLAGS_BLOCK_ONLY)
140 : #define THREAD_BARRIER_DESTROY(barrier)
141 : #else
142 : /* Use POSIX threads */
143 : #include "port/pg_pthread.h"
144 : #define THREAD_T pthread_t
145 : #define THREAD_FUNC_RETURN_TYPE void *
146 : #define THREAD_FUNC_RETURN return NULL
147 : #define THREAD_FUNC_CC
148 : #define THREAD_CREATE(handle, function, arg) \
149 : pthread_create((handle), NULL, (function), (arg))
150 : #define THREAD_JOIN(handle) \
151 : pthread_join((handle), NULL)
152 : #define THREAD_BARRIER_T pthread_barrier_t
153 : #define THREAD_BARRIER_INIT(barrier, n) \
154 : pthread_barrier_init((barrier), NULL, (n))
155 : #define THREAD_BARRIER_WAIT(barrier) pthread_barrier_wait((barrier))
156 : #define THREAD_BARRIER_DESTROY(barrier) pthread_barrier_destroy((barrier))
157 : #endif
158 :
159 :
160 : /********************************************************************
161 : * some configurable parameters */
162 :
163 : #define DEFAULT_INIT_STEPS "dtgvp" /* default -I setting */
164 : #define ALL_INIT_STEPS "dtgGvpf" /* all possible steps */
165 :
166 : #define LOG_STEP_SECONDS 5 /* seconds between log messages */
167 : #define DEFAULT_NXACTS 10 /* default nxacts */
168 :
169 : #define MIN_GAUSSIAN_PARAM 2.0 /* minimum parameter for gauss */
170 :
171 : #define MIN_ZIPFIAN_PARAM 1.001 /* minimum parameter for zipfian */
172 : #define MAX_ZIPFIAN_PARAM 1000.0 /* maximum parameter for zipfian */
173 :
174 : static int nxacts = 0; /* number of transactions per client */
175 : static int duration = 0; /* duration in seconds */
176 : static int64 end_time = 0; /* when to stop in micro seconds, under -T */
177 :
178 : /*
179 : * scaling factor. for example, scale = 10 will make 1000000 tuples in
180 : * pgbench_accounts table.
181 : */
182 : static int scale = 1;
183 :
184 : /*
185 : * fillfactor. for example, fillfactor = 90 will use only 90 percent
186 : * space during inserts and leave 10 percent free.
187 : */
188 : static int fillfactor = 100;
189 :
190 : /*
191 : * use unlogged tables?
192 : */
193 : static bool unlogged_tables = false;
194 :
195 : /*
196 : * log sampling rate (1.0 = log everything, 0.0 = option not given)
197 : */
198 : static double sample_rate = 0.0;
199 :
200 : /*
201 : * When threads are throttled to a given rate limit, this is the target delay
202 : * to reach that rate in usec. 0 is the default and means no throttling.
203 : */
204 : static double throttle_delay = 0;
205 :
206 : /*
207 : * Transactions which take longer than this limit (in usec) are counted as
208 : * late, and reported as such, although they are completed anyway. When
209 : * throttling is enabled, execution time slots that are more than this late
210 : * are skipped altogether, and counted separately.
211 : */
212 : static int64 latency_limit = 0;
213 :
214 : /*
215 : * tablespace selection
216 : */
217 : static char *tablespace = NULL;
218 : static char *index_tablespace = NULL;
219 :
220 : /*
221 : * Number of "pgbench_accounts" partitions. 0 is the default and means no
222 : * partitioning.
223 : */
224 : static int partitions = 0;
225 :
226 : /* partitioning strategy for "pgbench_accounts" */
227 : typedef enum
228 : {
229 : PART_NONE, /* no partitioning */
230 : PART_RANGE, /* range partitioning */
231 : PART_HASH, /* hash partitioning */
232 : } partition_method_t;
233 :
234 : static partition_method_t partition_method = PART_NONE;
235 : static const char *const PARTITION_METHOD[] = {"none", "range", "hash"};
236 :
237 : /* random seed used to initialize base_random_sequence */
238 : static int64 random_seed = -1;
239 :
240 : /*
241 : * end of configurable parameters
242 : *********************************************************************/
243 :
244 : #define nbranches 1 /* Makes little sense to change this. Change
245 : * -s instead */
246 : #define ntellers 10
247 : #define naccounts 100000
248 :
249 : /*
250 : * The scale factor at/beyond which 32-bit integers can no longer hold the
251 : * largest account ID (naccounts * scale).
252 : *
253 : * Although the actual threshold is 21474, we use 20000 because it is easier to
254 : * document and remember, and isn't that far away from the real threshold.
255 : */
256 : #define SCALE_32BIT_THRESHOLD 20000
257 :
258 : static bool use_log; /* log transaction latencies to a file */
259 : static bool use_quiet; /* quiet logging onto stderr */
260 : static int agg_interval; /* log aggregates instead of individual
261 : * transactions */
262 : static bool per_script_stats = false; /* whether to collect stats per script */
263 : static int progress = 0; /* thread progress report every this seconds */
264 : static bool progress_timestamp = false; /* progress report with Unix time */
265 : static int nclients = 1; /* number of clients */
266 : static int nthreads = 1; /* number of threads */
267 : static bool is_connect; /* establish connection for each transaction */
268 : static bool report_per_command = false; /* report per-command latencies,
269 : * retries after errors and failures
270 : * (errors without retrying) */
271 : static int main_pid; /* main process id used in log filename */
272 :
273 : /*
274 : * There are different types of restrictions for deciding that the current
275 : * transaction with a serialization/deadlock error can no longer be retried and
276 : * should be reported as failed:
277 : * - max_tries (--max-tries) can be used to limit the number of tries;
278 : * - latency_limit (-L) can be used to limit the total time of tries;
279 : * - duration (-T) can be used to limit the total benchmark time.
280 : *
281 : * They can be combined together, and you need to use at least one of them to
282 : * retry the transactions with serialization/deadlock errors. If none of them is
283 : * used, the default value of max_tries is 1 and such transactions will not be
284 : * retried.
285 : */
286 :
287 : /*
288 : * We cannot retry a transaction after the serialization/deadlock error if its
289 : * number of tries reaches this maximum; if its value is zero, it is not used.
290 : */
291 : static uint32 max_tries = 1;
292 :
293 : static bool failures_detailed = false; /* whether to group failures in
294 : * reports or logs by basic types */
295 :
296 : static const char *pghost = NULL;
297 : static const char *pgport = NULL;
298 : static const char *username = NULL;
299 : static const char *dbName = NULL;
300 : static char *logfile_prefix = NULL;
301 : static const char *progname;
302 :
303 : #define WSEP '@' /* weight separator */
304 :
305 : static volatile sig_atomic_t timer_exceeded = false; /* flag from signal
306 : * handler */
307 :
308 : /*
309 : * We don't want to allocate variables one by one; for efficiency, add a
310 : * constant margin each time it overflows.
311 : */
312 : #define VARIABLES_ALLOC_MARGIN 8
313 :
314 : /*
315 : * Variable definitions.
316 : *
317 : * If a variable only has a string value, "svalue" is that value, and value is
318 : * "not set". If the value is known, "value" contains the value (in any
319 : * variant).
320 : *
321 : * In this case "svalue" contains the string equivalent of the value, if we've
322 : * had occasion to compute that, or NULL if we haven't.
323 : */
324 : typedef struct
325 : {
326 : char *name; /* variable's name */
327 : char *svalue; /* its value in string form, if known */
328 : PgBenchValue value; /* actual variable's value */
329 : } Variable;
330 :
331 : /*
332 : * Data structure for client variables.
333 : */
334 : typedef struct
335 : {
336 : Variable *vars; /* array of variable definitions */
337 : int nvars; /* number of variables */
338 :
339 : /*
340 : * The maximum number of variables that we can currently store in 'vars'
341 : * without having to reallocate more space. We must always have max_vars
342 : * >= nvars.
343 : */
344 : int max_vars;
345 :
346 : bool vars_sorted; /* are variables sorted by name? */
347 : } Variables;
348 :
349 : #define MAX_SCRIPTS 128 /* max number of SQL scripts allowed */
350 : #define SHELL_COMMAND_SIZE 256 /* maximum size allowed for shell command */
351 :
352 : /*
353 : * Simple data structure to keep stats about something.
354 : *
355 : * XXX probably the first value should be kept and used as an offset for
356 : * better numerical stability...
357 : */
358 : typedef struct SimpleStats
359 : {
360 : int64 count; /* how many values were encountered */
361 : double min; /* the minimum seen */
362 : double max; /* the maximum seen */
363 : double sum; /* sum of values */
364 : double sum2; /* sum of squared values */
365 : } SimpleStats;
366 :
367 : /*
368 : * The instr_time type is expensive when dealing with time arithmetic. Define
369 : * a type to hold microseconds instead. A signed 64-bit count of microseconds
370 : * can represent about 292000 years in either direction.
371 : */
372 : typedef int64 pg_time_usec_t;
373 :
374 : /*
375 : * Data structure to hold various statistics: per-thread and per-script stats
376 : * are maintained and merged together.
377 : */
378 : typedef struct StatsData
379 : {
380 : pg_time_usec_t start_time; /* interval start time, for aggregates */
381 :
382 : /*----------
383 : * Transactions are counted depending on their execution and outcome.
384 : * First a transaction may have started or not: skipped transactions occur
385 : * under --rate and --latency-limit when the client is too late to execute
386 : * them. Secondly, a started transaction may ultimately succeed or fail,
387 : * possibly after some retries when --max-tries is not one. Thus
388 : *
389 : * the number of all transactions =
390 : * 'skipped' (it was too late to execute them) +
391 : * 'cnt' (the number of successful transactions) +
392 : * 'failed' (the number of failed transactions).
393 : *
394 : * A successful transaction can have several unsuccessful tries before a
395 : * successful run. Thus
396 : *
397 : * 'cnt' (the number of successful transactions) =
398 : * successfully retried transactions (they got a serialization or a
399 : * deadlock error(s), but were
400 : * successfully retried from the very
401 : * beginning) +
402 : * directly successful transactions (they were successfully completed on
403 : * the first try).
404 : *
405 : * A failed transaction is defined as unsuccessfully retried transactions.
406 : * It can be one of two types:
407 : *
408 : * failed (the number of failed transactions) =
409 : * 'serialization_failures' (they got a serialization error and were not
410 : * successfully retried) +
411 : * 'deadlock_failures' (they got a deadlock error and were not
412 : * successfully retried).
413 : *
414 : * If the transaction was retried after a serialization or a deadlock
415 : * error this does not guarantee that this retry was successful. Thus
416 : *
417 : * 'retries' (number of retries) =
418 : * number of retries in all retried transactions =
419 : * number of retries in (successfully retried transactions +
420 : * failed transactions);
421 : *
422 : * 'retried' (number of all retried transactions) =
423 : * successfully retried transactions +
424 : * failed transactions.
425 : *----------
426 : */
427 : int64 cnt; /* number of successful transactions, not
428 : * including 'skipped' */
429 : int64 skipped; /* number of transactions skipped under --rate
430 : * and --latency-limit */
431 : int64 retries; /* number of retries after a serialization or
432 : * a deadlock error in all the transactions */
433 : int64 retried; /* number of all transactions that were
434 : * retried after a serialization or a deadlock
435 : * error (perhaps the last try was
436 : * unsuccessful) */
437 : int64 serialization_failures; /* number of transactions that were
438 : * not successfully retried after a
439 : * serialization error */
440 : int64 deadlock_failures; /* number of transactions that were not
441 : * successfully retried after a deadlock
442 : * error */
443 : SimpleStats latency;
444 : SimpleStats lag;
445 : } StatsData;
446 :
447 : /*
448 : * For displaying Unix epoch timestamps, as some time functions may have
449 : * another reference.
450 : */
451 : static pg_time_usec_t epoch_shift;
452 :
453 : /*
454 : * Error status for errors during script execution.
455 : */
456 : typedef enum EStatus
457 : {
458 : ESTATUS_NO_ERROR = 0,
459 : ESTATUS_META_COMMAND_ERROR,
460 :
461 : /* SQL errors */
462 : ESTATUS_SERIALIZATION_ERROR,
463 : ESTATUS_DEADLOCK_ERROR,
464 : ESTATUS_OTHER_SQL_ERROR,
465 : } EStatus;
466 :
467 : /*
468 : * Transaction status at the end of a command.
469 : */
470 : typedef enum TStatus
471 : {
472 : TSTATUS_IDLE,
473 : TSTATUS_IN_BLOCK,
474 : TSTATUS_CONN_ERROR,
475 : TSTATUS_OTHER_ERROR,
476 : } TStatus;
477 :
478 : /* Various random sequences are initialized from this one. */
479 : static pg_prng_state base_random_sequence;
480 :
481 : /* Synchronization barrier for start and connection */
482 : static THREAD_BARRIER_T barrier;
483 :
484 : /*
485 : * Connection state machine states.
486 : */
487 : typedef enum
488 : {
489 : /*
490 : * The client must first choose a script to execute. Once chosen, it can
491 : * either be throttled (state CSTATE_PREPARE_THROTTLE under --rate), start
492 : * right away (state CSTATE_START_TX) or not start at all if the timer was
493 : * exceeded (state CSTATE_FINISHED).
494 : */
495 : CSTATE_CHOOSE_SCRIPT,
496 :
497 : /*
498 : * CSTATE_START_TX performs start-of-transaction processing. Establishes
499 : * a new connection for the transaction in --connect mode, records the
500 : * transaction start time, and proceeds to the first command.
501 : *
502 : * Note: once a script is started, it will either error or run till its
503 : * end, where it may be interrupted. It is not interrupted while running,
504 : * so pgbench --time is to be understood as tx are allowed to start in
505 : * that time, and will finish when their work is completed.
506 : */
507 : CSTATE_START_TX,
508 :
509 : /*
510 : * In CSTATE_PREPARE_THROTTLE state, we calculate when to begin the next
511 : * transaction, and advance to CSTATE_THROTTLE. CSTATE_THROTTLE state
512 : * sleeps until that moment, then advances to CSTATE_START_TX, or
513 : * CSTATE_FINISHED if the next transaction would start beyond the end of
514 : * the run.
515 : */
516 : CSTATE_PREPARE_THROTTLE,
517 : CSTATE_THROTTLE,
518 :
519 : /*
520 : * We loop through these states, to process each command in the script:
521 : *
522 : * CSTATE_START_COMMAND starts the execution of a command. On a SQL
523 : * command, the command is sent to the server, and we move to
524 : * CSTATE_WAIT_RESULT state unless in pipeline mode. On a \sleep
525 : * meta-command, the timer is set, and we enter the CSTATE_SLEEP state to
526 : * wait for it to expire. Other meta-commands are executed immediately. If
527 : * the command about to start is actually beyond the end of the script,
528 : * advance to CSTATE_END_TX.
529 : *
530 : * CSTATE_WAIT_RESULT waits until we get a result set back from the server
531 : * for the current command.
532 : *
533 : * CSTATE_SLEEP waits until the end of \sleep.
534 : *
535 : * CSTATE_END_COMMAND records the end-of-command timestamp, increments the
536 : * command counter, and loops back to CSTATE_START_COMMAND state.
537 : *
538 : * CSTATE_SKIP_COMMAND is used by conditional branches which are not
539 : * executed. It quickly skips commands that do not need any evaluation.
540 : * This state can move forward several commands, till there is something
541 : * to do or the end of the script.
542 : */
543 : CSTATE_START_COMMAND,
544 : CSTATE_WAIT_RESULT,
545 : CSTATE_SLEEP,
546 : CSTATE_END_COMMAND,
547 : CSTATE_SKIP_COMMAND,
548 :
549 : /*
550 : * States for failed commands.
551 : *
552 : * If the SQL/meta command fails, in CSTATE_ERROR clean up after an error:
553 : * (1) clear the conditional stack; (2) if we have an unterminated
554 : * (possibly failed) transaction block, send the rollback command to the
555 : * server and wait for the result in CSTATE_WAIT_ROLLBACK_RESULT. If
556 : * something goes wrong with rolling back, go to CSTATE_ABORTED.
557 : *
558 : * But if everything is ok we are ready for future transactions: if this
559 : * is a serialization or deadlock error and we can re-execute the
560 : * transaction from the very beginning, go to CSTATE_RETRY; otherwise go
561 : * to CSTATE_FAILURE.
562 : *
563 : * In CSTATE_RETRY report an error, set the same parameters for the
564 : * transaction execution as in the previous tries and process the first
565 : * transaction command in CSTATE_START_COMMAND.
566 : *
567 : * In CSTATE_FAILURE report a failure, set the parameters for the
568 : * transaction execution as they were before the first run of this
569 : * transaction (except for a random state) and go to CSTATE_END_TX to
570 : * complete this transaction.
571 : */
572 : CSTATE_ERROR,
573 : CSTATE_WAIT_ROLLBACK_RESULT,
574 : CSTATE_RETRY,
575 : CSTATE_FAILURE,
576 :
577 : /*
578 : * CSTATE_END_TX performs end-of-transaction processing. It calculates
579 : * latency, and logs the transaction. In --connect mode, it closes the
580 : * current connection.
581 : *
582 : * Then either starts over in CSTATE_CHOOSE_SCRIPT, or enters
583 : * CSTATE_FINISHED if we have no more work to do.
584 : */
585 : CSTATE_END_TX,
586 :
587 : /*
588 : * Final states. CSTATE_ABORTED means that the script execution was
589 : * aborted because a command failed, CSTATE_FINISHED means success.
590 : */
591 : CSTATE_ABORTED,
592 : CSTATE_FINISHED,
593 : } ConnectionStateEnum;
594 :
595 : /*
596 : * Connection state.
597 : */
598 : typedef struct
599 : {
600 : PGconn *con; /* connection handle to DB */
601 : int id; /* client No. */
602 : ConnectionStateEnum state; /* state machine's current state. */
603 : ConditionalStack cstack; /* enclosing conditionals state */
604 :
605 : /*
606 : * Separate randomness for each client. This is used for random functions
607 : * PGBENCH_RANDOM_* during the execution of the script.
608 : */
609 : pg_prng_state cs_func_rs;
610 :
611 : int use_file; /* index in sql_script for this client */
612 : int command; /* command number in script */
613 : int num_syncs; /* number of ongoing sync commands */
614 :
615 : /* client variables */
616 : Variables variables;
617 :
618 : /* various times about current transaction in microseconds */
619 : pg_time_usec_t txn_scheduled; /* scheduled start time of transaction */
620 : pg_time_usec_t sleep_until; /* scheduled start time of next cmd */
621 : pg_time_usec_t txn_begin; /* used for measuring schedule lag times */
622 : pg_time_usec_t stmt_begin; /* used for measuring statement latencies */
623 :
624 : /* whether client prepared each command of each script */
625 : bool **prepared;
626 :
627 : /*
628 : * For processing failures and repeating transactions with serialization
629 : * or deadlock errors:
630 : */
631 : EStatus estatus; /* the error status of the current transaction
632 : * execution; this is ESTATUS_NO_ERROR if
633 : * there were no errors */
634 : pg_prng_state random_state; /* random state */
635 : uint32 tries; /* how many times have we already tried the
636 : * current transaction? */
637 :
638 : /* per client collected stats */
639 : int64 cnt; /* client transaction count, for -t; skipped
640 : * and failed transactions are also counted
641 : * here */
642 : } CState;
643 :
644 : /*
645 : * Thread state
646 : */
647 : typedef struct
648 : {
649 : int tid; /* thread id */
650 : THREAD_T thread; /* thread handle */
651 : CState *state; /* array of CState */
652 : int nstate; /* length of state[] */
653 :
654 : /*
655 : * Separate randomness for each thread. Each thread option uses its own
656 : * random state to make all of them independent of each other and
657 : * therefore deterministic at the thread level.
658 : */
659 : pg_prng_state ts_choose_rs; /* random state for selecting a script */
660 : pg_prng_state ts_throttle_rs; /* random state for transaction throttling */
661 : pg_prng_state ts_sample_rs; /* random state for log sampling */
662 :
663 : int64 throttle_trigger; /* previous/next throttling (us) */
664 : FILE *logfile; /* where to log, or NULL */
665 :
666 : /* per thread collected stats in microseconds */
667 : pg_time_usec_t create_time; /* thread creation time */
668 : pg_time_usec_t started_time; /* thread is running */
669 : pg_time_usec_t bench_start; /* thread is benchmarking */
670 : pg_time_usec_t conn_duration; /* cumulated connection and disconnection
671 : * delays */
672 :
673 : StatsData stats;
674 : int64 latency_late; /* count executed but late transactions */
675 : } TState;
676 :
677 : /*
678 : * queries read from files
679 : */
680 : #define SQL_COMMAND 1
681 : #define META_COMMAND 2
682 :
683 : /*
684 : * max number of backslash command arguments or SQL variables,
685 : * including the command or SQL statement itself
686 : */
687 : #define MAX_ARGS 256
688 :
689 : typedef enum MetaCommand
690 : {
691 : META_NONE, /* not a known meta-command */
692 : META_SET, /* \set */
693 : META_SETSHELL, /* \setshell */
694 : META_SHELL, /* \shell */
695 : META_SLEEP, /* \sleep */
696 : META_GSET, /* \gset */
697 : META_ASET, /* \aset */
698 : META_IF, /* \if */
699 : META_ELIF, /* \elif */
700 : META_ELSE, /* \else */
701 : META_ENDIF, /* \endif */
702 : META_STARTPIPELINE, /* \startpipeline */
703 : META_SYNCPIPELINE, /* \syncpipeline */
704 : META_ENDPIPELINE, /* \endpipeline */
705 : } MetaCommand;
706 :
707 : typedef enum QueryMode
708 : {
709 : QUERY_SIMPLE, /* simple query */
710 : QUERY_EXTENDED, /* extended query */
711 : QUERY_PREPARED, /* extended query with prepared statements */
712 : NUM_QUERYMODE /* number of modes listed above; must remain the last entry */
713 : } QueryMode;
714 :
715 : static QueryMode querymode = QUERY_SIMPLE;
716 : static const char *const QUERYMODE[] = {"simple", "extended", "prepared"};
717 :
718 : /*
719 : * struct Command represents one command in a script.
720 : *
721 : * lines The raw, possibly multi-line command text. Variable substitution
722 : * not applied.
723 : * first_line A short, single-line extract of 'lines', for error reporting.
724 : * type SQL_COMMAND or META_COMMAND
725 : * meta The type of meta-command, with META_NONE/GSET/ASET if command
726 : * is SQL.
727 : * argc Number of arguments of the command, 0 if not yet processed.
728 : * argv Command arguments, the first of which is the command or SQL
729 : * string itself. For SQL commands, after post-processing
730 : * argv[0] is the same as 'lines' with variables substituted.
731 : * prepname The name that this command is prepared under, in prepare mode
732 : * varprefix SQL commands terminated with \gset or \aset have this set
733 : * to a non NULL value. If nonempty, it's used to prefix the
734 : * variable name that receives the value.
735 : * aset do gset on all possible queries of a combined query (\;).
736 : * expr Parsed expression, if needed.
737 : * stats Time spent in this command.
738 : * retries Number of retries after a serialization or deadlock error in the
739 : * current command.
740 : * failures Number of errors in the current command that were not retried.
741 : */
742 : typedef struct Command
743 : {
744 : PQExpBufferData lines;
745 : char *first_line;
746 : int type;
747 : MetaCommand meta;
748 : int argc;
749 : char *argv[MAX_ARGS];
750 : char *prepname;
751 : char *varprefix;
752 : PgBenchExpr *expr;
753 : SimpleStats stats;
754 : int64 retries;
755 : int64 failures;
756 : } Command;
757 :
758 : typedef struct ParsedScript
759 : {
760 : const char *desc; /* script descriptor (eg, file name) */
761 : int weight; /* selection weight */
762 : Command **commands; /* NULL-terminated array of Commands */
763 : StatsData stats; /* total time spent in script */
764 : } ParsedScript;
765 :
766 : static ParsedScript sql_script[MAX_SCRIPTS]; /* SQL script files */
767 : static int num_scripts; /* number of scripts in sql_script[] */
768 : static int64 total_weight = 0;
769 :
770 : static bool verbose_errors = false; /* print verbose messages of all errors */
771 :
772 : static bool exit_on_abort = false; /* exit when any client is aborted */
773 :
774 : /* Builtin test scripts */
775 : typedef struct BuiltinScript
776 : {
777 : const char *name; /* very short name for -b ... */
778 : const char *desc; /* short description */
779 : const char *script; /* actual pgbench script */
780 : } BuiltinScript;
781 :
782 : static const BuiltinScript builtin_script[] =
783 : {
784 : {
785 : "tpcb-like",
786 : "<builtin: TPC-B (sort of)>",
787 : "\\set aid random(1, " CppAsString2(naccounts) " * :scale)\n"
788 : "\\set bid random(1, " CppAsString2(nbranches) " * :scale)\n"
789 : "\\set tid random(1, " CppAsString2(ntellers) " * :scale)\n"
790 : "\\set delta random(-5000, 5000)\n"
791 : "BEGIN;\n"
792 : "UPDATE pgbench_accounts SET abalance = abalance + :delta WHERE aid = :aid;\n"
793 : "SELECT abalance FROM pgbench_accounts WHERE aid = :aid;\n"
794 : "UPDATE pgbench_tellers SET tbalance = tbalance + :delta WHERE tid = :tid;\n"
795 : "UPDATE pgbench_branches SET bbalance = bbalance + :delta WHERE bid = :bid;\n"
796 : "INSERT INTO pgbench_history (tid, bid, aid, delta, mtime) VALUES (:tid, :bid, :aid, :delta, CURRENT_TIMESTAMP);\n"
797 : "END;\n"
798 : },
799 : {
800 : "simple-update",
801 : "<builtin: simple update>",
802 : "\\set aid random(1, " CppAsString2(naccounts) " * :scale)\n"
803 : "\\set bid random(1, " CppAsString2(nbranches) " * :scale)\n"
804 : "\\set tid random(1, " CppAsString2(ntellers) " * :scale)\n"
805 : "\\set delta random(-5000, 5000)\n"
806 : "BEGIN;\n"
807 : "UPDATE pgbench_accounts SET abalance = abalance + :delta WHERE aid = :aid;\n"
808 : "SELECT abalance FROM pgbench_accounts WHERE aid = :aid;\n"
809 : "INSERT INTO pgbench_history (tid, bid, aid, delta, mtime) VALUES (:tid, :bid, :aid, :delta, CURRENT_TIMESTAMP);\n"
810 : "END;\n"
811 : },
812 : {
813 : "select-only",
814 : "<builtin: select only>",
815 : "\\set aid random(1, " CppAsString2(naccounts) " * :scale)\n"
816 : "SELECT abalance FROM pgbench_accounts WHERE aid = :aid;\n"
817 : }
818 : };
819 :
820 :
821 : /* Function prototypes */
822 : static void setNullValue(PgBenchValue *pv);
823 : static void setBoolValue(PgBenchValue *pv, bool bval);
824 : static void setIntValue(PgBenchValue *pv, int64 ival);
825 : static void setDoubleValue(PgBenchValue *pv, double dval);
826 : static bool evaluateExpr(CState *st, PgBenchExpr *expr,
827 : PgBenchValue *retval);
828 : static ConnectionStateEnum executeMetaCommand(CState *st, pg_time_usec_t *now);
829 : static void doLog(TState *thread, CState *st,
830 : StatsData *agg, bool skipped, double latency, double lag);
831 : static void processXactStats(TState *thread, CState *st, pg_time_usec_t *now,
832 : bool skipped, StatsData *agg);
833 : static void addScript(const ParsedScript *script);
834 : static THREAD_FUNC_RETURN_TYPE THREAD_FUNC_CC threadRun(void *arg);
835 : static void finishCon(CState *st);
836 : static void setalarm(int seconds);
837 : static socket_set *alloc_socket_set(int count);
838 : static void free_socket_set(socket_set *sa);
839 : static void clear_socket_set(socket_set *sa);
840 : static void add_socket_to_set(socket_set *sa, int fd, int idx);
841 : static int wait_on_socket_set(socket_set *sa, int64 usecs);
842 : static bool socket_has_input(socket_set *sa, int fd, int idx);
843 :
844 : /* callback used to build rows for COPY during data loading */
845 : typedef void (*initRowMethod) (PQExpBufferData *sql, int64 curr);
846 :
847 : /* callback functions for our flex lexer */
/*
 * Only one member is initialized here, and it is set to NULL: as the note on
 * that entry says, the get_variable hook is not needed.
 */
848 : static const PsqlScanCallbacks pgbench_callbacks = {
849 : NULL, /* don't need get_variable functionality */
850 : };
851 :
852 : static char
853 12 : get_table_relkind(PGconn *con, const char *table)
854 : {
855 : PGresult *res;
856 : char *val;
857 : char relkind;
858 12 : const char *params[1] = {table};
859 12 : const char *sql =
860 : "SELECT relkind FROM pg_catalog.pg_class WHERE oid=$1::pg_catalog.regclass";
861 :
862 12 : res = PQexecParams(con, sql, 1, NULL, params, NULL, NULL, 0);
863 12 : if (PQresultStatus(res) != PGRES_TUPLES_OK)
864 : {
865 0 : pg_log_error("query failed: %s", PQerrorMessage(con));
866 0 : pg_log_error_detail("Query was: %s", sql);
867 0 : exit(1);
868 : }
869 12 : val = PQgetvalue(res, 0, 0);
870 : Assert(strlen(val) == 1);
871 12 : relkind = val[0];
872 12 : PQclear(res);
873 :
874 12 : return relkind;
875 : }
876 :
877 : static inline pg_time_usec_t
878 23758 : pg_time_now(void)
879 : {
880 : instr_time now;
881 :
882 23758 : INSTR_TIME_SET_CURRENT(now);
883 :
884 23758 : return (pg_time_usec_t) INSTR_TIME_GET_MICROSEC(now);
885 : }
886 :
887 : static inline void
888 21486 : pg_time_now_lazy(pg_time_usec_t *now)
889 : {
890 21486 : if ((*now) == 0)
891 19442 : (*now) = pg_time_now();
892 21486 : }
893 :
/*
 * Multiply a time value by 1e-6, yielding a double.  Applied to a
 * microsecond count such as the one pg_time_now() returns, this gives
 * seconds.
 */
894 : #define PG_TIME_GET_DOUBLE(t) (0.000001 * (t))
895 :
/*
 * Print the command-line help text to standard output.
 *
 * The whole message is a single printf() format.  Its five "%s" conversions
 * are filled, in order, by progname (twice), PACKAGE_BUGREPORT, PACKAGE_NAME
 * and PACKAGE_URL.  ALL_INIT_STEPS and DEFAULT_INIT_STEPS are pasted into the
 * format by string-literal concatenation, and the "%%" in the
 * --sampling-rate line prints a literal percent sign.
 */
896 : static void
897 2 : usage(void)
898 : {
899 2 : printf("%s is a benchmarking tool for PostgreSQL.\n\n"
900 : "Usage:\n"
901 : " %s [OPTION]... [DBNAME]\n"
902 : "\nInitialization options:\n"
903 : " -i, --initialize invokes initialization mode\n"
904 : " -I, --init-steps=[" ALL_INIT_STEPS "]+ (default \"" DEFAULT_INIT_STEPS "\")\n"
905 : " run selected initialization steps, in the specified order\n"
906 : " d: drop any existing pgbench tables\n"
907 : " t: create the tables used by the standard pgbench scenario\n"
908 : " g: generate data, client-side\n"
909 : " G: generate data, server-side\n"
910 : " v: invoke VACUUM on the standard tables\n"
911 : " p: create primary key indexes on the standard tables\n"
912 : " f: create foreign keys between the standard tables\n"
913 : " -F, --fillfactor=NUM set fill factor\n"
914 : " -n, --no-vacuum do not run VACUUM during initialization\n"
915 : " -q, --quiet quiet logging (one message each 5 seconds)\n"
916 : " -s, --scale=NUM scaling factor\n"
917 : " --foreign-keys create foreign key constraints between tables\n"
918 : " --index-tablespace=TABLESPACE\n"
919 : " create indexes in the specified tablespace\n"
920 : " --partition-method=(range|hash)\n"
921 : " partition pgbench_accounts with this method (default: range)\n"
922 : " --partitions=NUM partition pgbench_accounts into NUM parts (default: 0)\n"
923 : " --tablespace=TABLESPACE create tables in the specified tablespace\n"
924 : " --unlogged-tables create tables as unlogged tables\n"
925 : "\nOptions to select what to run:\n"
926 : " -b, --builtin=NAME[@W] add builtin script NAME weighted at W (default: 1)\n"
927 : " (use \"-b list\" to list available scripts)\n"
928 : " -f, --file=FILENAME[@W] add script FILENAME weighted at W (default: 1)\n"
929 : " -N, --skip-some-updates skip updates of pgbench_tellers and pgbench_branches\n"
930 : " (same as \"-b simple-update\")\n"
931 : " -S, --select-only perform SELECT-only transactions\n"
932 : " (same as \"-b select-only\")\n"
933 : "\nBenchmarking options:\n"
934 : " -c, --client=NUM number of concurrent database clients (default: 1)\n"
935 : " -C, --connect establish new connection for each transaction\n"
936 : " -D, --define=VARNAME=VALUE\n"
937 : " define variable for use by custom script\n"
938 : " -j, --jobs=NUM number of threads (default: 1)\n"
939 : " -l, --log write transaction times to log file\n"
940 : " -L, --latency-limit=NUM count transactions lasting more than NUM ms as late\n"
941 : " -M, --protocol=simple|extended|prepared\n"
942 : " protocol for submitting queries (default: simple)\n"
943 : " -n, --no-vacuum do not run VACUUM before tests\n"
944 : " -P, --progress=NUM show thread progress report every NUM seconds\n"
945 : " -r, --report-per-command report latencies, failures, and retries per command\n"
946 : " -R, --rate=NUM target rate in transactions per second\n"
947 : " -s, --scale=NUM report this scale factor in output\n"
948 : " -t, --transactions=NUM number of transactions each client runs (default: 10)\n"
949 : " -T, --time=NUM duration of benchmark test in seconds\n"
950 : " -v, --vacuum-all vacuum all four standard tables before tests\n"
951 : " --aggregate-interval=NUM aggregate data over NUM seconds\n"
952 : " --exit-on-abort exit when any client is aborted\n"
953 : " --failures-detailed report the failures grouped by basic types\n"
954 : " --log-prefix=PREFIX prefix for transaction time log file\n"
955 : " (default: \"pgbench_log\")\n"
956 : " --max-tries=NUM max number of tries to run transaction (default: 1)\n"
957 : " --progress-timestamp use Unix epoch timestamps for progress\n"
958 : " --random-seed=SEED set random seed (\"time\", \"rand\", integer)\n"
959 : " --sampling-rate=NUM fraction of transactions to log (e.g., 0.01 for 1%%)\n"
960 : " --show-script=NAME show builtin script code, then exit\n"
961 : " --verbose-errors print messages of all errors\n"
962 : "\nCommon options:\n"
963 : " --debug print debugging output\n"
964 : " -d, --dbname=DBNAME database name to connect to\n"
965 : " -h, --host=HOSTNAME database server host or socket directory\n"
966 : " -p, --port=PORT database server port number\n"
967 : " -U, --username=USERNAME connect as specified database user\n"
968 : " -V, --version output version information, then exit\n"
969 : " -?, --help show this help, then exit\n"
970 : "\n"
971 : "Report bugs to <%s>.\n"
972 : "%s home page: <%s>\n",
973 : progname, progname, PACKAGE_BUGREPORT, PACKAGE_NAME, PACKAGE_URL);
974 2 : }
975 :
/*
 * Return whether str matches "^\s*[-+]?[0-9]+$".
 *
 * That is: optional leading whitespace, an optional single sign, and then
 * one or more decimal digits running to the end of the string.  Nothing is
 * converted; this only classifies the text.
 *
 * The digit requirement is enforced even when the sign (or the whitespace)
 * is the last thing in the string, so "", "-", "+" and all-blank strings
 * are rejected rather than being mistaken for integers.
 */
static bool
is_an_int(const char *str)
{
	const char *ptr = str;

	/* skip leading spaces; cast is consistent with strtoint64 */
	while (*ptr && isspace((unsigned char) *ptr))
		ptr++;

	/* skip sign */
	if (*ptr == '+' || *ptr == '-')
		ptr++;

	/*
	 * At least one digit is mandatory.  Note that this must also fail when
	 * we are already at the terminating NUL.
	 */
	if (!isdigit((unsigned char) *ptr))
		return false;

	/* eat all digits */
	while (isdigit((unsigned char) *ptr))
		ptr++;

	/* must have reached end of string */
	return *ptr == '\0';
}
1001 :
1002 :
1003 : /*
1004 : * strtoint64 -- convert a string to 64-bit integer
1005 : *
1006 : * This function is a slightly modified version of pg_strtoint64() from
1007 : * src/backend/utils/adt/numutils.c.
1008 : *
1009 : * The function returns whether the conversion worked, and if so
1010 : * "*result" is set to the result.
1011 : *
1012 : * If not errorOK, an error message is also printed out on errors.
1013 : */
1014 : bool
1015 2612 : strtoint64(const char *str, bool errorOK, int64 *result)
1016 : {
1017 2612 : const char *ptr = str;
1018 2612 : int64 tmp = 0;
1019 2612 : bool neg = false;
1020 :
1021 : /*
1022 : * Do our own scan, rather than relying on sscanf which might be broken
1023 : * for long long.
1024 : *
1025 : * As INT64_MIN can't be stored as a positive 64 bit integer, accumulate
1026 : * value as a negative number.
1027 : */
1028 :
1029 : /* skip leading spaces */
1030 2612 : while (*ptr && isspace((unsigned char) *ptr))
1031 0 : ptr++;
1032 :
1033 : /* handle sign */
1034 2612 : if (*ptr == '-')
1035 : {
1036 4 : ptr++;
1037 4 : neg = true;
1038 : }
1039 2608 : else if (*ptr == '+')
1040 0 : ptr++;
1041 :
1042 : /* require at least one digit */
1043 2612 : if (unlikely(!isdigit((unsigned char) *ptr)))
1044 0 : goto invalid_syntax;
1045 :
1046 : /* process digits */
1047 7830 : while (*ptr && isdigit((unsigned char) *ptr))
1048 : {
1049 5220 : int8 digit = (*ptr++ - '0');
1050 :
1051 5220 : if (unlikely(pg_mul_s64_overflow(tmp, 10, &tmp)) ||
1052 5218 : unlikely(pg_sub_s64_overflow(tmp, digit, &tmp)))
1053 2 : goto out_of_range;
1054 : }
1055 :
1056 : /* allow trailing whitespace, but not other trailing chars */
1057 2610 : while (*ptr != '\0' && isspace((unsigned char) *ptr))
1058 0 : ptr++;
1059 :
1060 2610 : if (unlikely(*ptr != '\0'))
1061 0 : goto invalid_syntax;
1062 :
1063 2610 : if (!neg)
1064 : {
1065 2606 : if (unlikely(tmp == PG_INT64_MIN))
1066 0 : goto out_of_range;
1067 2606 : tmp = -tmp;
1068 : }
1069 :
1070 2610 : *result = tmp;
1071 2610 : return true;
1072 :
1073 2 : out_of_range:
1074 2 : if (!errorOK)
1075 0 : pg_log_error("value \"%s\" is out of range for type bigint", str);
1076 2 : return false;
1077 :
1078 0 : invalid_syntax:
1079 0 : if (!errorOK)
1080 0 : pg_log_error("invalid input syntax for type bigint: \"%s\"", str);
1081 0 : return false;
1082 : }
1083 :
/*
 * Parse a string as a double using strtod().
 *
 * Returns true only if strtod() left errno at zero and consumed the whole,
 * non-empty string.  "*dv" always receives whatever strtod() returned, even
 * on failure.  Unless errorOK is set, a failure is also logged.
 */
bool
strtodouble(const char *str, bool errorOK, double *dv)
{
	char	   *tail;
	double		parsed;

	errno = 0;
	parsed = strtod(str, &tail);
	*dv = parsed;

	/* strtod reports overflow/underflow through errno */
	if (unlikely(errno != 0))
	{
		if (!errorOK)
			pg_log_error("value \"%s\" is out of range for type double", str);
		return false;
	}

	/* nothing was parsed, or something was left over */
	if (unlikely(tail == str || *tail != '\0'))
	{
		if (!errorOK)
			pg_log_error("invalid input syntax for type double: \"%s\"", str);
		return false;
	}

	return true;
}
1108 :
1109 : /*
1110 : * Initialize a prng state struct.
1111 : *
1112 : * We derive the seed from base_random_sequence, which must be set up already.
1113 : */
1114 : static void
1115 778 : initRandomState(pg_prng_state *state)
1116 : {
1117 778 : pg_prng_seed(state, pg_prng_uint64(&base_random_sequence));
1118 778 : }
1119 :
1120 :
1121 : /*
1122 : * random number generator: uniform distribution from min to max inclusive.
1123 : *
1124 : * Although the limits are expressed as int64, you can't generate the full
1125 : * int64 range in one call, because the difference of the limits mustn't
1126 : * overflow int64. This is not checked.
1127 : */
1128 : static int64
1129 5740 : getrand(pg_prng_state *state, int64 min, int64 max)
1130 : {
1131 5740 : return min + (int64) pg_prng_uint64_range(state, 0, max - min);
1132 : }
1133 :
1134 : /*
1135 : * random number generator: exponential distribution from min to max inclusive.
1136 : * the parameter is so that the density of probability for the last cut-off max
1137 : * value is exp(-parameter).
1138 : */
1139 : static int64
1140 6 : getExponentialRand(pg_prng_state *state, int64 min, int64 max,
1141 : double parameter)
1142 : {
1143 : double cut,
1144 : uniform,
1145 : rand;
1146 :
1147 : /* abort if wrong parameter, but must really be checked beforehand */
1148 : Assert(parameter > 0.0);
1149 6 : cut = exp(-parameter);
1150 : /* pg_prng_double value in [0, 1), uniform in (0, 1] */
1151 6 : uniform = 1.0 - pg_prng_double(state);
1152 :
1153 : /*
1154 : * inner expression in (cut, 1] (if parameter > 0), rand in [0, 1)
1155 : */
1156 : Assert((1.0 - cut) != 0.0);
1157 6 : rand = -log(cut + (1.0 - cut) * uniform) / parameter;
1158 : /* return int64 random number within between min and max */
1159 6 : return min + (int64) ((max - min + 1) * rand);
1160 : }
1161 :
1162 : /* random number generator: gaussian distribution from min to max inclusive */
1163 : static int64
1164 6 : getGaussianRand(pg_prng_state *state, int64 min, int64 max,
1165 : double parameter)
1166 : {
1167 : double stdev;
1168 : double rand;
1169 :
1170 : /* abort if parameter is too low, but must really be checked beforehand */
1171 : Assert(parameter >= MIN_GAUSSIAN_PARAM);
1172 :
1173 : /*
1174 : * Get normally-distributed random number in the range -parameter <= stdev
1175 : * < parameter.
1176 : *
1177 : * This loop is executed until the number is in the expected range.
1178 : *
1179 : * As the minimum parameter is 2.0, the probability of looping is low:
1180 : * sqrt(-2 ln(r)) <= 2 => r >= e^{-2} ~ 0.135, then when taking the
1181 : * average sinus multiplier as 2/pi, we have a 8.6% looping probability in
1182 : * the worst case. For a parameter value of 5.0, the looping probability
1183 : * is about e^{-5} * 2 / pi ~ 0.43%.
1184 : */
1185 : do
1186 : {
1187 6 : stdev = pg_prng_double_normal(state);
1188 : }
1189 6 : while (stdev < -parameter || stdev >= parameter);
1190 :
1191 : /* stdev is in [-parameter, parameter), normalization to [0,1) */
1192 6 : rand = (stdev + parameter) / (parameter * 2.0);
1193 :
1194 : /* return int64 random number within between min and max */
1195 6 : return min + (int64) ((max - min + 1) * rand);
1196 : }
1197 :
1198 : /*
1199 : * random number generator: generate a value, such that the series of values
1200 : * will approximate a Poisson distribution centered on the given value.
1201 : *
1202 : * Individual results are rounded to integers, though the center value need
1203 : * not be one.
1204 : */
1205 : static int64
1206 420 : getPoissonRand(pg_prng_state *state, double center)
1207 : {
1208 : /*
1209 : * Use inverse transform sampling to generate a value > 0, such that the
1210 : * expected (i.e. average) value is the given argument.
1211 : */
1212 : double uniform;
1213 :
1214 : /* pg_prng_double value in [0, 1), uniform in (0, 1] */
1215 420 : uniform = 1.0 - pg_prng_double(state);
1216 :
1217 420 : return (int64) (-log(uniform) * center + 0.5);
1218 : }
1219 :
1220 : /*
1221 : * Computing zipfian using rejection method, based on
1222 : * "Non-Uniform Random Variate Generation",
1223 : * Luc Devroye, p. 550-551, Springer 1986.
1224 : *
1225 : * This works for s > 1.0, but may perform badly for s very close to 1.0.
1226 : */
1227 : static int64
1228 6 : computeIterativeZipfian(pg_prng_state *state, int64 n, double s)
1229 : {
1230 6 : double b = pow(2.0, s - 1.0);
1231 : double x,
1232 : t,
1233 : u,
1234 : v;
1235 :
1236 : /* Ensure n is sane */
1237 6 : if (n <= 1)
1238 0 : return 1;
1239 :
1240 : while (true)
1241 : {
1242 : /* random variates */
1243 6 : u = pg_prng_double(state);
1244 6 : v = pg_prng_double(state);
1245 :
1246 6 : x = floor(pow(u, -1.0 / (s - 1.0)));
1247 :
1248 6 : t = pow(1.0 + 1.0 / x, s - 1.0);
1249 : /* reject if too large or out of bound */
1250 6 : if (v * x * (t - 1.0) / (b - 1.0) <= t / b && x <= n)
1251 6 : break;
1252 : }
1253 6 : return (int64) x;
1254 : }
1255 :
1256 : /* random number generator: zipfian distribution from min to max inclusive */
1257 : static int64
1258 6 : getZipfianRand(pg_prng_state *state, int64 min, int64 max, double s)
1259 : {
1260 6 : int64 n = max - min + 1;
1261 :
1262 : /* abort if parameter is invalid */
1263 : Assert(MIN_ZIPFIAN_PARAM <= s && s <= MAX_ZIPFIAN_PARAM);
1264 :
1265 6 : return min - 1 + computeIterativeZipfian(state, n, s);
1266 : }
1267 :
1268 : /*
1269 : * FNV-1a hash function
1270 : */
1271 : static int64
1272 2 : getHashFnv1a(int64 val, uint64 seed)
1273 : {
1274 : int64 result;
1275 : int i;
1276 :
1277 2 : result = FNV_OFFSET_BASIS ^ seed;
1278 18 : for (i = 0; i < 8; ++i)
1279 : {
1280 16 : int32 octet = val & 0xff;
1281 :
1282 16 : val = val >> 8;
1283 16 : result = result ^ octet;
1284 16 : result = result * FNV_PRIME;
1285 : }
1286 :
1287 2 : return result;
1288 : }
1289 :
1290 : /*
1291 : * Murmur2 hash function
1292 : *
1293 : * Based on original work of Austin Appleby
1294 : * https://github.com/aappleby/smhasher/blob/master/src/MurmurHash2.cpp
1295 : */
1296 : static int64
1297 10 : getHashMurmur2(int64 val, uint64 seed)
1298 : {
1299 10 : uint64 result = seed ^ MM2_MUL_TIMES_8; /* sizeof(int64) */
1300 10 : uint64 k = (uint64) val;
1301 :
1302 10 : k *= MM2_MUL;
1303 10 : k ^= k >> MM2_ROT;
1304 10 : k *= MM2_MUL;
1305 :
1306 10 : result ^= k;
1307 10 : result *= MM2_MUL;
1308 :
1309 10 : result ^= result >> MM2_ROT;
1310 10 : result *= MM2_MUL;
1311 10 : result ^= result >> MM2_ROT;
1312 :
1313 10 : return (int64) result;
1314 : }
1315 :
1316 : /*
1317 : * Pseudorandom permutation function
1318 : *
1319 : * For small sizes, this generates each of the (size!) possible permutations
1320 : * of integers in the range [0, size) with roughly equal probability. Once
1321 : * the size is larger than 20, the number of possible permutations exceeds the
1322 : * number of distinct states of the internal pseudorandom number generator,
1323 : * and so not all possible permutations can be generated, but the permutations
1324 : * chosen should continue to give the appearance of being random.
1325 : *
1326 : * THIS FUNCTION IS NOT CRYPTOGRAPHICALLY SECURE.
1327 : * DO NOT USE FOR SUCH PURPOSE.
1328 : */
1329 : static int64
1330 90 : permute(const int64 val, const int64 isize, const int64 seed)
1331 : {
1332 : /* using a high-end PRNG is probably overkill */
1333 : pg_prng_state state;
1334 : uint64 size;
1335 : uint64 v;
1336 : int masklen;
1337 : uint64 mask;
1338 : int i;
1339 :
1340 90 : if (isize < 2)
1341 2 : return 0; /* nothing to permute */
1342 :
1343 : /* Initialize prng state using the seed */
1344 88 : pg_prng_seed(&state, (uint64) seed);
1345 :
1346 : /* Computations are performed on unsigned values */
1347 88 : size = (uint64) isize;
1348 88 : v = (uint64) val % size;
1349 :
1350 : /* Mask to work modulo largest power of 2 less than or equal to size */
1351 88 : masklen = pg_leftmost_one_pos64(size);
1352 88 : mask = (((uint64) 1) << masklen) - 1;
1353 :
1354 : /*
1355 : * Permute the input value by applying several rounds of pseudorandom
1356 : * bijective transformations. The intention here is to distribute each
1357 : * input uniformly randomly across the range, and separate adjacent inputs
1358 : * approximately uniformly randomly from each other, leading to a fairly
1359 : * random overall choice of permutation.
1360 : *
1361 : * To separate adjacent inputs, we multiply by a random number modulo
1362 : * (mask + 1), which is a power of 2. For this to be a bijection, the
1363 : * multiplier must be odd. Since this is known to lead to less randomness
1364 : * in the lower bits, we also apply a rotation that shifts the topmost bit
1365 : * into the least significant bit. In the special cases where size <= 3,
1366 : * mask = 1 and each of these operations is actually a no-op, so we also
1367 : * XOR the value with a different random number to inject additional
1368 : * randomness. Since the size is generally not a power of 2, we apply
1369 : * this bijection on overlapping upper and lower halves of the input.
1370 : *
1371 : * To distribute the inputs uniformly across the range, we then also apply
1372 : * a random offset modulo the full range.
1373 : *
1374 : * Taken together, these operations resemble a modified linear
1375 : * congruential generator, as is commonly used in pseudorandom number
1376 : * generators. The number of rounds is fairly arbitrary, but six has been
1377 : * found empirically to give a fairly good tradeoff between performance
1378 : * and uniform randomness. For small sizes it selects each of the (size!)
1379 : * possible permutations with roughly equal probability. For larger
1380 : * sizes, not all permutations can be generated, but the intended random
1381 : * spread is still produced.
1382 : */
1383 616 : for (i = 0; i < 6; i++)
1384 : {
1385 : uint64 m,
1386 : r,
1387 : t;
1388 :
1389 : /* Random multiply (by an odd number), XOR and rotate of lower half */
1390 528 : m = (pg_prng_uint64(&state) & mask) | 1;
1391 528 : r = pg_prng_uint64(&state) & mask;
1392 528 : if (v <= mask)
1393 : {
1394 438 : v = ((v * m) ^ r) & mask;
1395 438 : v = ((v << 1) & mask) | (v >> (masklen - 1));
1396 : }
1397 :
1398 : /* Random multiply (by an odd number), XOR and rotate of upper half */
1399 528 : m = (pg_prng_uint64(&state) & mask) | 1;
1400 528 : r = pg_prng_uint64(&state) & mask;
1401 528 : t = size - 1 - v;
1402 528 : if (t <= mask)
1403 : {
1404 470 : t = ((t * m) ^ r) & mask;
1405 470 : t = ((t << 1) & mask) | (t >> (masklen - 1));
1406 470 : v = size - 1 - t;
1407 : }
1408 :
1409 : /* Random offset */
1410 528 : r = pg_prng_uint64_range(&state, 0, size - 1);
1411 528 : v = (v + r) % size;
1412 : }
1413 :
1414 88 : return (int64) v;
1415 : }
1416 :
1417 : /*
1418 : * Initialize the given SimpleStats struct to all zeroes
1419 : */
1420 : static void
1421 4078 : initSimpleStats(SimpleStats *ss)
1422 : {
1423 4078 : memset(ss, 0, sizeof(SimpleStats));
1424 4078 : }
1425 :
1426 : /*
1427 : * Accumulate one value into a SimpleStats struct.
1428 : */
1429 : static void
1430 19286 : addToSimpleStats(SimpleStats *ss, double val)
1431 : {
1432 19286 : if (ss->count == 0 || val < ss->min)
1433 352 : ss->min = val;
1434 19286 : if (ss->count == 0 || val > ss->max)
1435 1012 : ss->max = val;
1436 19286 : ss->count++;
1437 19286 : ss->sum += val;
1438 19286 : ss->sum2 += val * val;
1439 19286 : }
1440 :
1441 : /*
1442 : * Merge two SimpleStats objects
1443 : */
1444 : static void
1445 340 : mergeSimpleStats(SimpleStats *acc, SimpleStats *ss)
1446 : {
1447 340 : if (acc->count == 0 || ss->min < acc->min)
1448 340 : acc->min = ss->min;
1449 340 : if (acc->count == 0 || ss->max > acc->max)
1450 340 : acc->max = ss->max;
1451 340 : acc->count += ss->count;
1452 340 : acc->sum += ss->sum;
1453 340 : acc->sum2 += ss->sum2;
1454 340 : }
1455 :
1456 : /*
1457 : * Initialize a StatsData struct to mostly zeroes, with its start time set to
1458 : * the given value.
1459 : */
1460 : static void
1461 1084 : initStats(StatsData *sd, pg_time_usec_t start)
1462 : {
1463 1084 : sd->start_time = start;
1464 1084 : sd->cnt = 0;
1465 1084 : sd->skipped = 0;
1466 1084 : sd->retries = 0;
1467 1084 : sd->retried = 0;
1468 1084 : sd->serialization_failures = 0;
1469 1084 : sd->deadlock_failures = 0;
1470 1084 : initSimpleStats(&sd->latency);
1471 1084 : initSimpleStats(&sd->lag);
1472 1084 : }
1473 :
1474 : /*
1475 : * Accumulate one additional item into the given stats object.
1476 : */
1477 : static void
1478 18100 : accumStats(StatsData *stats, bool skipped, double lat, double lag,
1479 : EStatus estatus, int64 tries)
1480 : {
1481 : /* Record the skipped transaction */
1482 18100 : if (skipped)
1483 : {
1484 : /* no latency to record on skipped transactions */
1485 18 : stats->skipped++;
1486 18 : return;
1487 : }
1488 :
1489 : /*
1490 : * Record the number of retries regardless of whether the transaction was
1491 : * successful or failed.
1492 : */
1493 18082 : if (tries > 1)
1494 : {
1495 4 : stats->retries += (tries - 1);
1496 4 : stats->retried++;
1497 : }
1498 :
1499 18082 : switch (estatus)
1500 : {
1501 : /* Record the successful transaction */
1502 18082 : case ESTATUS_NO_ERROR:
1503 18082 : stats->cnt++;
1504 :
1505 18082 : addToSimpleStats(&stats->latency, lat);
1506 :
1507 : /* and possibly the same for schedule lag */
1508 18082 : if (throttle_delay)
1509 402 : addToSimpleStats(&stats->lag, lag);
1510 18082 : break;
1511 :
1512 : /* Record the failed transaction */
1513 0 : case ESTATUS_SERIALIZATION_ERROR:
1514 0 : stats->serialization_failures++;
1515 0 : break;
1516 0 : case ESTATUS_DEADLOCK_ERROR:
1517 0 : stats->deadlock_failures++;
1518 0 : break;
1519 0 : default:
1520 : /* internal error which should never occur */
1521 0 : pg_fatal("unexpected error status: %d", estatus);
1522 : }
1523 : }
1524 :
1525 : /* call PQexec() and exit() on failure */
1526 : static void
1527 118 : executeStatement(PGconn *con, const char *sql)
1528 : {
1529 : PGresult *res;
1530 :
1531 118 : res = PQexec(con, sql);
1532 118 : if (PQresultStatus(res) != PGRES_COMMAND_OK)
1533 : {
1534 0 : pg_log_error("query failed: %s", PQerrorMessage(con));
1535 0 : pg_log_error_detail("Query was: %s", sql);
1536 0 : exit(1);
1537 : }
1538 118 : PQclear(res);
1539 118 : }
1540 :
1541 : /* call PQexec() and complain, but without exiting, on failure */
1542 : static void
1543 60 : tryExecuteStatement(PGconn *con, const char *sql)
1544 : {
1545 : PGresult *res;
1546 :
1547 60 : res = PQexec(con, sql);
1548 60 : if (PQresultStatus(res) != PGRES_COMMAND_OK)
1549 : {
1550 0 : pg_log_error("%s", PQerrorMessage(con));
1551 0 : pg_log_error_detail("(ignoring this error and continuing anyway)");
1552 : }
1553 60 : PQclear(res);
1554 60 : }
1555 :
1556 : /* set up a connection to the backend */
1557 : static PGconn *
1558 640 : doConnect(void)
1559 : {
1560 : PGconn *conn;
1561 : bool new_pass;
1562 : static char *password = NULL;
1563 :
1564 : /*
1565 : * Start the connection. Loop until we have a password if requested by
1566 : * backend.
1567 : */
1568 : do
1569 : {
1570 : #define PARAMS_ARRAY_SIZE 7
1571 :
1572 : const char *keywords[PARAMS_ARRAY_SIZE];
1573 : const char *values[PARAMS_ARRAY_SIZE];
1574 :
1575 640 : keywords[0] = "host";
1576 640 : values[0] = pghost;
1577 640 : keywords[1] = "port";
1578 640 : values[1] = pgport;
1579 640 : keywords[2] = "user";
1580 640 : values[2] = username;
1581 640 : keywords[3] = "password";
1582 640 : values[3] = password;
1583 640 : keywords[4] = "dbname";
1584 640 : values[4] = dbName;
1585 640 : keywords[5] = "fallback_application_name";
1586 640 : values[5] = progname;
1587 640 : keywords[6] = NULL;
1588 640 : values[6] = NULL;
1589 :
1590 640 : new_pass = false;
1591 :
1592 640 : conn = PQconnectdbParams(keywords, values, true);
1593 :
1594 640 : if (!conn)
1595 : {
1596 0 : pg_log_error("connection to database \"%s\" failed", dbName);
1597 0 : return NULL;
1598 : }
1599 :
1600 642 : if (PQstatus(conn) == CONNECTION_BAD &&
1601 2 : PQconnectionNeedsPassword(conn) &&
1602 0 : !password)
1603 : {
1604 0 : PQfinish(conn);
1605 0 : password = simple_prompt("Password: ", false);
1606 0 : new_pass = true;
1607 : }
1608 640 : } while (new_pass);
1609 :
1610 : /* check to see that the backend connection was successfully made */
1611 640 : if (PQstatus(conn) == CONNECTION_BAD)
1612 : {
1613 2 : pg_log_error("%s", PQerrorMessage(conn));
1614 2 : PQfinish(conn);
1615 2 : return NULL;
1616 : }
1617 :
1618 638 : return conn;
1619 : }
1620 :
1621 : /* qsort comparator for Variable array */
1622 : static int
1623 107852 : compareVariableNames(const void *v1, const void *v2)
1624 : {
1625 215704 : return strcmp(((const Variable *) v1)->name,
1626 107852 : ((const Variable *) v2)->name);
1627 : }
1628 :
1629 : /* Locate a variable by name; returns NULL if unknown */
1630 : static Variable *
1631 15910 : lookupVariable(Variables *variables, char *name)
1632 : {
1633 : Variable key;
1634 :
1635 : /* On some versions of Solaris, bsearch of zero items dumps core */
1636 15910 : if (variables->nvars <= 0)
1637 398 : return NULL;
1638 :
1639 : /* Sort if we have to */
1640 15512 : if (!variables->vars_sorted)
1641 : {
1642 2028 : qsort(variables->vars, variables->nvars, sizeof(Variable),
1643 : compareVariableNames);
1644 2028 : variables->vars_sorted = true;
1645 : }
1646 :
1647 : /* Now we can search */
1648 15512 : key.name = name;
1649 15512 : return (Variable *) bsearch(&key,
1650 15512 : variables->vars,
1651 15512 : variables->nvars,
1652 : sizeof(Variable),
1653 : compareVariableNames);
1654 : }
1655 :
1656 : /* Get the value of a variable, in string form; returns NULL if unknown */
1657 : static char *
1658 4908 : getVariable(Variables *variables, char *name)
1659 : {
1660 : Variable *var;
1661 : char stringform[64];
1662 :
1663 4908 : var = lookupVariable(variables, name);
1664 4908 : if (var == NULL)
1665 8 : return NULL; /* not found */
1666 :
1667 4900 : if (var->svalue)
1668 1688 : return var->svalue; /* we have it in string form */
1669 :
1670 : /* We need to produce a string equivalent of the value */
1671 : Assert(var->value.type != PGBT_NO_VALUE);
1672 3212 : if (var->value.type == PGBT_NULL)
1673 2 : snprintf(stringform, sizeof(stringform), "NULL");
1674 3210 : else if (var->value.type == PGBT_BOOLEAN)
1675 2 : snprintf(stringform, sizeof(stringform),
1676 2 : "%s", var->value.u.bval ? "true" : "false");
1677 3208 : else if (var->value.type == PGBT_INT)
1678 3204 : snprintf(stringform, sizeof(stringform),
1679 : INT64_FORMAT, var->value.u.ival);
1680 4 : else if (var->value.type == PGBT_DOUBLE)
1681 4 : snprintf(stringform, sizeof(stringform),
1682 : "%.*g", DBL_DIG, var->value.u.dval);
1683 : else /* internal error, unexpected type */
1684 : Assert(0);
1685 3212 : var->svalue = pg_strdup(stringform);
1686 3212 : return var->svalue;
1687 : }
1688 :
1689 : /* Try to convert variable to a value; return false on failure */
1690 : static bool
1691 4016 : makeVariableValue(Variable *var)
1692 : {
1693 : size_t slen;
1694 :
1695 4016 : if (var->value.type != PGBT_NO_VALUE)
1696 2986 : return true; /* no work */
1697 :
1698 1030 : slen = strlen(var->svalue);
1699 :
1700 1030 : if (slen == 0)
1701 : /* what should it do on ""? */
1702 0 : return false;
1703 :
1704 1030 : if (pg_strcasecmp(var->svalue, "null") == 0)
1705 : {
1706 2 : setNullValue(&var->value);
1707 : }
1708 :
1709 : /*
1710 : * accept prefixes such as y, ye, n, no... but not for "o". 0/1 are
1711 : * recognized later as an int, which is converted to bool if needed.
1712 : */
1713 2054 : else if (pg_strncasecmp(var->svalue, "true", slen) == 0 ||
1714 2052 : pg_strncasecmp(var->svalue, "yes", slen) == 0 ||
1715 1026 : pg_strcasecmp(var->svalue, "on") == 0)
1716 : {
1717 2 : setBoolValue(&var->value, true);
1718 : }
1719 2052 : else if (pg_strncasecmp(var->svalue, "false", slen) == 0 ||
1720 2052 : pg_strncasecmp(var->svalue, "no", slen) == 0 ||
1721 2052 : pg_strcasecmp(var->svalue, "off") == 0 ||
1722 1026 : pg_strcasecmp(var->svalue, "of") == 0)
1723 : {
1724 2 : setBoolValue(&var->value, false);
1725 : }
1726 1024 : else if (is_an_int(var->svalue))
1727 : {
1728 : /* if it looks like an int, it must be an int without overflow */
1729 : int64 iv;
1730 :
1731 1018 : if (!strtoint64(var->svalue, false, &iv))
1732 0 : return false;
1733 :
1734 1018 : setIntValue(&var->value, iv);
1735 : }
1736 : else /* type should be double */
1737 : {
1738 : double dv;
1739 :
1740 6 : if (!strtodouble(var->svalue, true, &dv))
1741 : {
1742 4 : pg_log_error("malformed variable \"%s\" value: \"%s\"",
1743 : var->name, var->svalue);
1744 4 : return false;
1745 : }
1746 2 : setDoubleValue(&var->value, dv);
1747 : }
1748 1026 : return true;
1749 : }
1750 :
/*
 * Tell whether "name" is acceptable as a variable name.
 *
 * Allowed are all non-ASCII characters plus ASCII letters, digits and
 * underscore, with the restriction that the first character is not a digit.
 * The empty string is rejected.
 *
 * Keep this in sync with the definitions of variable name characters in
 * "src/fe_utils/psqlscan.l", "src/bin/psql/psqlscanslash.l" and
 * "src/bin/pgbench/exprscan.l".  Also see parseVariable(), below.
 *
 * Note: this static function is copied from "src/bin/psql/variables.c"
 * but changed to disallow variable names starting with a digit.
 */
static bool
valid_variable_name(const char *name)
{
	static const char first_chars[] =
		"ABCDEFGHIJKLMNOPQRSTUVWXYZ" "abcdefghijklmnopqrstuvwxyz"
		"_";
	static const char later_chars[] =
		"ABCDEFGHIJKLMNOPQRSTUVWXYZ" "abcdefghijklmnopqrstuvwxyz"
		"_0123456789";
	const unsigned char *cur = (const unsigned char *) name;

	/* an empty name is never valid */
	if (*cur == '\0')
		return false;

	/* first character: anything allowed except [0-9] */
	if (!IS_HIGHBIT_SET(*cur) && strchr(first_chars, *cur) == NULL)
		return false;

	/* following characters: [0-9] is allowed too */
	for (cur++; *cur != '\0'; cur++)
	{
		if (!IS_HIGHBIT_SET(*cur) && strchr(later_chars, *cur) == NULL)
			return false;
	}

	return true;
}
1794 :
1795 : /*
1796 : * Make sure there is enough space for 'needed' more variable in the variables
1797 : * array.
1798 : */
1799 : static void
1800 2204 : enlargeVariables(Variables *variables, int needed)
1801 : {
1802 : /* total number of variables required now */
1803 2204 : needed += variables->nvars;
1804 :
1805 2204 : if (variables->max_vars < needed)
1806 : {
1807 376 : variables->max_vars = needed + VARIABLES_ALLOC_MARGIN;
1808 376 : variables->vars = (Variable *)
1809 376 : pg_realloc(variables->vars, variables->max_vars * sizeof(Variable));
1810 : }
1811 2204 : }
1812 :
1813 : /*
1814 : * Lookup a variable by name, creating it if need be.
1815 : * Caller is expected to assign a value to the variable.
1816 : * Returns NULL on failure (bad name).
1817 : */
1818 : static Variable *
1819 6294 : lookupCreateVariable(Variables *variables, const char *context, char *name)
1820 : {
1821 : Variable *var;
1822 :
1823 6294 : var = lookupVariable(variables, name);
1824 6294 : if (var == NULL)
1825 : {
1826 : /*
1827 : * Check for the name only when declaring a new variable to avoid
1828 : * overhead.
1829 : */
1830 2210 : if (!valid_variable_name(name))
1831 : {
1832 6 : pg_log_error("%s: invalid variable name: \"%s\"", context, name);
1833 6 : return NULL;
1834 : }
1835 :
1836 : /* Create variable at the end of the array */
1837 2204 : enlargeVariables(variables, 1);
1838 :
1839 2204 : var = &(variables->vars[variables->nvars]);
1840 :
1841 2204 : var->name = pg_strdup(name);
1842 2204 : var->svalue = NULL;
1843 : /* caller is expected to initialize remaining fields */
1844 :
1845 2204 : variables->nvars++;
1846 : /* we don't re-sort the array till we have to */
1847 2204 : variables->vars_sorted = false;
1848 : }
1849 :
1850 6288 : return var;
1851 : }
1852 :
1853 : /* Assign a string value to a variable, creating it if need be */
1854 : /* Returns false on failure (bad name) */
1855 : static bool
1856 1906 : putVariable(Variables *variables, const char *context, char *name,
1857 : const char *value)
1858 : {
1859 : Variable *var;
1860 : char *val;
1861 :
1862 1906 : var = lookupCreateVariable(variables, context, name);
1863 1906 : if (!var)
1864 4 : return false;
1865 :
1866 : /* dup then free, in case value is pointing at this variable */
1867 1902 : val = pg_strdup(value);
1868 :
1869 1902 : free(var->svalue);
1870 1902 : var->svalue = val;
1871 1902 : var->value.type = PGBT_NO_VALUE;
1872 :
1873 1902 : return true;
1874 : }
1875 :
1876 : /* Assign a value to a variable, creating it if need be */
1877 : /* Returns false on failure (bad name) */
1878 : static bool
1879 4388 : putVariableValue(Variables *variables, const char *context, char *name,
1880 : const PgBenchValue *value)
1881 : {
1882 : Variable *var;
1883 :
1884 4388 : var = lookupCreateVariable(variables, context, name);
1885 4388 : if (!var)
1886 2 : return false;
1887 :
1888 4386 : free(var->svalue);
1889 4386 : var->svalue = NULL;
1890 4386 : var->value = *value;
1891 :
1892 4386 : return true;
1893 : }
1894 :
1895 : /* Assign an integer value to a variable, creating it if need be */
1896 : /* Returns false on failure (bad name) */
1897 : static bool
1898 1010 : putVariableInt(Variables *variables, const char *context, char *name,
1899 : int64 value)
1900 : {
1901 : PgBenchValue val;
1902 :
1903 1010 : setIntValue(&val, value);
1904 1010 : return putVariableValue(variables, context, name, &val);
1905 : }
1906 :
/*
 * Parse a possible variable reference (:varname).
 *
 * "sql" points at a colon.  If what follows it looks like a valid
 * variable name, return a malloc'd string containing the variable name,
 * and set *eaten to the number of characters consumed (including the colon).
 * Otherwise, return NULL; *eaten is left untouched in that case.
 */
static char *
parseVariable(const char *sql, int *eaten)
{
	int			i = 1;			/* starting at 1 skips the colon */
	char	   *name;

	/*
	 * Keep this logic in sync with valid_variable_name().
	 *
	 * The end of the string must be tested explicitly: strchr() considers
	 * the terminating NUL to be part of the string it searches, so looking
	 * up '\0' in the character set would "succeed" and the scan would run
	 * past the end of "sql".
	 */
	if (sql[i] != '\0' &&
		(IS_HIGHBIT_SET(sql[i]) ||
		 strchr("ABCDEFGHIJKLMNOPQRSTUVWXYZ" "abcdefghijklmnopqrstuvwxyz"
				"_", sql[i]) != NULL))
		i++;
	else
		return NULL;

	/* remaining characters can include [0-9] */
	while (sql[i] != '\0' &&
		   (IS_HIGHBIT_SET(sql[i]) ||
			strchr("ABCDEFGHIJKLMNOPQRSTUVWXYZ" "abcdefghijklmnopqrstuvwxyz"
				   "_0123456789", sql[i]) != NULL))
		i++;

	/* i counts the colon too, so i bytes hold the name plus its terminator */
	name = pg_malloc(i);
	memcpy(name, &sql[1], i - 1);
	name[i - 1] = '\0';

	*eaten = i;
	return name;
}
1941 :
/*
 * Replace the "len" bytes starting at "param", which lies inside the string
 * *sql, with the text of "value".
 *
 * When the replacement is longer than the text it replaces, *sql is
 * reallocated and may therefore change.  Returns a pointer to the byte just
 * after the inserted text, within the (possibly new) *sql.
 */
static char *
replaceVariable(char **sql, char *param, int len, char *value)
{
	int			newlen = strlen(value);

	if (newlen > len)
	{
		/* the buffer may move, so remember where param was as an offset */
		size_t		pos = param - *sql;
		size_t		total = strlen(*sql) - len + newlen + 1;

		*sql = pg_realloc(*sql, total);
		param = *sql + pos;
	}

	/* shift the remainder of the string (terminator included) into place */
	if (newlen != len)
	{
		char	   *tail = param + len;

		memmove(param + newlen, tail, strlen(tail) + 1);
	}

	memcpy(param, value, newlen);

	return param + newlen;
}
1961 :
1962 : static char *
1963 16258 : assignVariables(Variables *variables, char *sql)
1964 : {
1965 : char *p,
1966 : *name,
1967 : *val;
1968 :
1969 16258 : p = sql;
1970 20336 : while ((p = strchr(p, ':')) != NULL)
1971 : {
1972 : int eaten;
1973 :
1974 4078 : name = parseVariable(p, &eaten);
1975 4078 : if (name == NULL)
1976 : {
1977 6062 : while (*p == ':')
1978 : {
1979 3546 : p++;
1980 : }
1981 2516 : continue;
1982 : }
1983 :
1984 1562 : val = getVariable(variables, name);
1985 1562 : free(name);
1986 1562 : if (val == NULL)
1987 : {
1988 0 : p++;
1989 0 : continue;
1990 : }
1991 :
1992 1562 : p = replaceVariable(&sql, p, eaten, val);
1993 : }
1994 :
1995 16258 : return sql;
1996 : }
1997 :
1998 : static void
1999 5078 : getQueryParams(Variables *variables, const Command *command,
2000 : const char **params)
2001 : {
2002 : int i;
2003 :
2004 8414 : for (i = 0; i < command->argc - 1; i++)
2005 3336 : params[i] = getVariable(variables, command->argv[i + 1]);
2006 5078 : }
2007 :
2008 : static char *
2009 8 : valueTypeName(PgBenchValue *pval)
2010 : {
2011 8 : if (pval->type == PGBT_NO_VALUE)
2012 0 : return "none";
2013 8 : else if (pval->type == PGBT_NULL)
2014 0 : return "null";
2015 8 : else if (pval->type == PGBT_INT)
2016 0 : return "int";
2017 8 : else if (pval->type == PGBT_DOUBLE)
2018 2 : return "double";
2019 6 : else if (pval->type == PGBT_BOOLEAN)
2020 6 : return "boolean";
2021 : else
2022 : {
2023 : /* internal error, should never get there */
2024 : Assert(false);
2025 0 : return NULL;
2026 : }
2027 : }
2028 :
2029 : /* get a value as a boolean, or tell if there is a problem */
2030 : static bool
2031 216 : coerceToBool(PgBenchValue *pval, bool *bval)
2032 : {
2033 216 : if (pval->type == PGBT_BOOLEAN)
2034 : {
2035 214 : *bval = pval->u.bval;
2036 214 : return true;
2037 : }
2038 : else /* NULL, INT or DOUBLE */
2039 : {
2040 2 : pg_log_error("cannot coerce %s to boolean", valueTypeName(pval));
2041 2 : *bval = false; /* suppress uninitialized-variable warnings */
2042 2 : return false;
2043 : }
2044 : }
2045 :
2046 : /*
2047 : * Return true or false from an expression for conditional purposes.
2048 : * Non zero numerical values are true, zero and NULL are false.
2049 : */
2050 : static bool
2051 1054 : valueTruth(PgBenchValue *pval)
2052 : {
2053 1054 : switch (pval->type)
2054 : {
2055 2 : case PGBT_NULL:
2056 2 : return false;
2057 62 : case PGBT_BOOLEAN:
2058 62 : return pval->u.bval;
2059 988 : case PGBT_INT:
2060 988 : return pval->u.ival != 0;
2061 2 : case PGBT_DOUBLE:
2062 2 : return pval->u.dval != 0.0;
2063 0 : default:
2064 : /* internal error, unexpected type */
2065 : Assert(0);
2066 0 : return false;
2067 : }
2068 : }
2069 :
2070 : /* get a value as an int, tell if there is a problem */
2071 : static bool
2072 13184 : coerceToInt(PgBenchValue *pval, int64 *ival)
2073 : {
2074 13184 : if (pval->type == PGBT_INT)
2075 : {
2076 13176 : *ival = pval->u.ival;
2077 13176 : return true;
2078 : }
2079 8 : else if (pval->type == PGBT_DOUBLE)
2080 : {
2081 4 : double dval = rint(pval->u.dval);
2082 :
2083 4 : if (isnan(dval) || !FLOAT8_FITS_IN_INT64(dval))
2084 : {
2085 2 : pg_log_error("double to int overflow for %f", dval);
2086 2 : return false;
2087 : }
2088 2 : *ival = (int64) dval;
2089 2 : return true;
2090 : }
2091 : else /* BOOLEAN or NULL */
2092 : {
2093 4 : pg_log_error("cannot coerce %s to int", valueTypeName(pval));
2094 4 : return false;
2095 : }
2096 : }
2097 :
2098 : /* get a value as a double, or tell if there is a problem */
2099 : static bool
2100 208 : coerceToDouble(PgBenchValue *pval, double *dval)
2101 : {
2102 208 : if (pval->type == PGBT_DOUBLE)
2103 : {
2104 146 : *dval = pval->u.dval;
2105 146 : return true;
2106 : }
2107 62 : else if (pval->type == PGBT_INT)
2108 : {
2109 60 : *dval = (double) pval->u.ival;
2110 60 : return true;
2111 : }
2112 : else /* BOOLEAN or NULL */
2113 : {
2114 2 : pg_log_error("cannot coerce %s to double", valueTypeName(pval));
2115 2 : return false;
2116 : }
2117 : }
2118 :
2119 : /* assign a null value */
2120 : static void
2121 8 : setNullValue(PgBenchValue *pv)
2122 : {
2123 8 : pv->type = PGBT_NULL;
2124 8 : pv->u.ival = 0;
2125 8 : }
2126 :
2127 : /* assign a boolean value */
2128 : static void
2129 278 : setBoolValue(PgBenchValue *pv, bool bval)
2130 : {
2131 278 : pv->type = PGBT_BOOLEAN;
2132 278 : pv->u.bval = bval;
2133 278 : }
2134 :
2135 : /* assign an integer value */
2136 : static void
2137 8436 : setIntValue(PgBenchValue *pv, int64 ival)
2138 : {
2139 8436 : pv->type = PGBT_INT;
2140 8436 : pv->u.ival = ival;
2141 8436 : }
2142 :
2143 : /* assign a double value */
2144 : static void
2145 78 : setDoubleValue(PgBenchValue *pv, double dval)
2146 : {
2147 78 : pv->type = PGBT_DOUBLE;
2148 78 : pv->u.dval = dval;
2149 78 : }
2150 :
2151 : static bool
2152 7004 : isLazyFunc(PgBenchFunction func)
2153 : {
2154 7004 : return func == PGBENCH_AND || func == PGBENCH_OR || func == PGBENCH_CASE;
2155 : }
2156 :
2157 : /* lazy evaluation of some functions */
2158 : static bool
2159 130 : evalLazyFunc(CState *st,
2160 : PgBenchFunction func, PgBenchExprLink *args, PgBenchValue *retval)
2161 : {
2162 : PgBenchValue a1,
2163 : a2;
2164 : bool ba1,
2165 : ba2;
2166 :
2167 : Assert(isLazyFunc(func) && args != NULL && args->next != NULL);
2168 :
2169 : /* args points to first condition */
2170 130 : if (!evaluateExpr(st, args->expr, &a1))
2171 2 : return false;
2172 :
2173 : /* second condition for AND/OR and corresponding branch for CASE */
2174 128 : args = args->next;
2175 :
2176 128 : switch (func)
2177 : {
2178 88 : case PGBENCH_AND:
2179 88 : if (a1.type == PGBT_NULL)
2180 : {
2181 0 : setNullValue(retval);
2182 0 : return true;
2183 : }
2184 :
2185 88 : if (!coerceToBool(&a1, &ba1))
2186 0 : return false;
2187 :
2188 88 : if (!ba1)
2189 : {
2190 6 : setBoolValue(retval, false);
2191 6 : return true;
2192 : }
2193 :
2194 82 : if (!evaluateExpr(st, args->expr, &a2))
2195 0 : return false;
2196 :
2197 82 : if (a2.type == PGBT_NULL)
2198 : {
2199 0 : setNullValue(retval);
2200 0 : return true;
2201 : }
2202 82 : else if (!coerceToBool(&a2, &ba2))
2203 0 : return false;
2204 : else
2205 : {
2206 82 : setBoolValue(retval, ba2);
2207 82 : return true;
2208 : }
2209 :
2210 : return true;
2211 :
2212 8 : case PGBENCH_OR:
2213 :
2214 8 : if (a1.type == PGBT_NULL)
2215 : {
2216 0 : setNullValue(retval);
2217 0 : return true;
2218 : }
2219 :
2220 8 : if (!coerceToBool(&a1, &ba1))
2221 0 : return false;
2222 :
2223 8 : if (ba1)
2224 : {
2225 2 : setBoolValue(retval, true);
2226 2 : return true;
2227 : }
2228 :
2229 6 : if (!evaluateExpr(st, args->expr, &a2))
2230 0 : return false;
2231 :
2232 6 : if (a2.type == PGBT_NULL)
2233 : {
2234 0 : setNullValue(retval);
2235 0 : return true;
2236 : }
2237 6 : else if (!coerceToBool(&a2, &ba2))
2238 0 : return false;
2239 : else
2240 : {
2241 6 : setBoolValue(retval, ba2);
2242 6 : return true;
2243 : }
2244 :
2245 32 : case PGBENCH_CASE:
2246 : /* when true, execute branch */
2247 32 : if (valueTruth(&a1))
2248 22 : return evaluateExpr(st, args->expr, retval);
2249 :
2250 : /* now args contains next condition or final else expression */
2251 10 : args = args->next;
2252 :
2253 : /* final else case? */
2254 10 : if (args->next == NULL)
2255 6 : return evaluateExpr(st, args->expr, retval);
2256 :
2257 : /* no, another when, proceed */
2258 4 : return evalLazyFunc(st, PGBENCH_CASE, args, retval);
2259 :
2260 0 : default:
2261 : /* internal error, cannot get here */
2262 : Assert(0);
2263 0 : break;
2264 : }
2265 0 : return false;
2266 : }
2267 :
2268 : /* maximum number of function arguments */
2269 : #define MAX_FARGS 16
2270 :
2271 : /*
2272 : * Recursive evaluation of standard functions,
2273 : * which do not require lazy evaluation.
2274 : */
2275 : static bool
2276 6878 : evalStandardFunc(CState *st,
2277 : PgBenchFunction func, PgBenchExprLink *args,
2278 : PgBenchValue *retval)
2279 : {
2280 : /* evaluate all function arguments */
2281 6878 : int nargs = 0;
2282 6878 : PgBenchValue vargs[MAX_FARGS] = {0};
2283 6878 : PgBenchExprLink *l = args;
2284 6878 : bool has_null = false;
2285 :
2286 20560 : for (nargs = 0; nargs < MAX_FARGS && l != NULL; nargs++, l = l->next)
2287 : {
2288 13686 : if (!evaluateExpr(st, l->expr, &vargs[nargs]))
2289 4 : return false;
2290 13682 : has_null |= vargs[nargs].type == PGBT_NULL;
2291 : }
2292 :
2293 6874 : if (l != NULL)
2294 : {
2295 2 : pg_log_error("too many function arguments, maximum is %d", MAX_FARGS);
2296 2 : return false;
2297 : }
2298 :
2299 : /* NULL arguments */
2300 6872 : if (has_null && func != PGBENCH_IS && func != PGBENCH_DEBUG)
2301 : {
2302 6 : setNullValue(retval);
2303 6 : return true;
2304 : }
2305 :
2306 : /* then evaluate function */
2307 6866 : switch (func)
2308 : {
2309 : /* overloaded operators */
2310 3396 : case PGBENCH_ADD:
2311 : case PGBENCH_SUB:
2312 : case PGBENCH_MUL:
2313 : case PGBENCH_DIV:
2314 : case PGBENCH_MOD:
2315 : case PGBENCH_EQ:
2316 : case PGBENCH_NE:
2317 : case PGBENCH_LE:
2318 : case PGBENCH_LT:
2319 : {
2320 3396 : PgBenchValue *lval = &vargs[0],
2321 3396 : *rval = &vargs[1];
2322 :
2323 : Assert(nargs == 2);
2324 :
2325 : /* overloaded type management, double if some double */
2326 3396 : if ((lval->type == PGBT_DOUBLE ||
2327 3396 : rval->type == PGBT_DOUBLE) && func != PGBENCH_MOD)
2328 0 : {
2329 : double ld,
2330 : rd;
2331 :
2332 62 : if (!coerceToDouble(lval, &ld) ||
2333 62 : !coerceToDouble(rval, &rd))
2334 62 : return false;
2335 :
2336 62 : switch (func)
2337 : {
2338 2 : case PGBENCH_ADD:
2339 2 : setDoubleValue(retval, ld + rd);
2340 2 : return true;
2341 :
2342 20 : case PGBENCH_SUB:
2343 20 : setDoubleValue(retval, ld - rd);
2344 20 : return true;
2345 :
2346 16 : case PGBENCH_MUL:
2347 16 : setDoubleValue(retval, ld * rd);
2348 16 : return true;
2349 :
2350 4 : case PGBENCH_DIV:
2351 4 : setDoubleValue(retval, ld / rd);
2352 4 : return true;
2353 :
2354 8 : case PGBENCH_EQ:
2355 8 : setBoolValue(retval, ld == rd);
2356 8 : return true;
2357 :
2358 4 : case PGBENCH_NE:
2359 4 : setBoolValue(retval, ld != rd);
2360 4 : return true;
2361 :
2362 4 : case PGBENCH_LE:
2363 4 : setBoolValue(retval, ld <= rd);
2364 4 : return true;
2365 :
2366 4 : case PGBENCH_LT:
2367 4 : setBoolValue(retval, ld < rd);
2368 4 : return true;
2369 :
2370 0 : default:
2371 : /* cannot get here */
2372 : Assert(0);
2373 : }
2374 : }
2375 : else /* we have integer operands, or % */
2376 : {
2377 : int64 li,
2378 : ri,
2379 : res;
2380 :
2381 3334 : if (!coerceToInt(lval, &li) ||
2382 3332 : !coerceToInt(rval, &ri))
2383 3334 : return false;
2384 :
2385 3332 : switch (func)
2386 : {
2387 88 : case PGBENCH_ADD:
2388 88 : if (pg_add_s64_overflow(li, ri, &res))
2389 : {
2390 2 : pg_log_error("bigint add out of range");
2391 2 : return false;
2392 : }
2393 86 : setIntValue(retval, res);
2394 86 : return true;
2395 :
2396 298 : case PGBENCH_SUB:
2397 298 : if (pg_sub_s64_overflow(li, ri, &res))
2398 : {
2399 2 : pg_log_error("bigint sub out of range");
2400 2 : return false;
2401 : }
2402 296 : setIntValue(retval, res);
2403 296 : return true;
2404 :
2405 2818 : case PGBENCH_MUL:
2406 2818 : if (pg_mul_s64_overflow(li, ri, &res))
2407 : {
2408 2 : pg_log_error("bigint mul out of range");
2409 2 : return false;
2410 : }
2411 2816 : setIntValue(retval, res);
2412 2816 : return true;
2413 :
2414 64 : case PGBENCH_EQ:
2415 64 : setBoolValue(retval, li == ri);
2416 64 : return true;
2417 :
2418 10 : case PGBENCH_NE:
2419 10 : setBoolValue(retval, li != ri);
2420 10 : return true;
2421 :
2422 10 : case PGBENCH_LE:
2423 10 : setBoolValue(retval, li <= ri);
2424 10 : return true;
2425 :
2426 24 : case PGBENCH_LT:
2427 24 : setBoolValue(retval, li < ri);
2428 24 : return true;
2429 :
2430 20 : case PGBENCH_DIV:
2431 : case PGBENCH_MOD:
2432 20 : if (ri == 0)
2433 : {
2434 4 : pg_log_error("division by zero");
2435 4 : return false;
2436 : }
2437 : /* special handling of -1 divisor */
2438 16 : if (ri == -1)
2439 : {
2440 6 : if (func == PGBENCH_DIV)
2441 : {
2442 : /* overflow check (needed for INT64_MIN) */
2443 4 : if (li == PG_INT64_MIN)
2444 : {
2445 2 : pg_log_error("bigint div out of range");
2446 2 : return false;
2447 : }
2448 : else
2449 2 : setIntValue(retval, -li);
2450 : }
2451 : else
2452 2 : setIntValue(retval, 0);
2453 4 : return true;
2454 : }
2455 : /* else divisor is not -1 */
2456 10 : if (func == PGBENCH_DIV)
2457 4 : setIntValue(retval, li / ri);
2458 : else /* func == PGBENCH_MOD */
2459 6 : setIntValue(retval, li % ri);
2460 :
2461 10 : return true;
2462 :
2463 0 : default:
2464 : /* cannot get here */
2465 : Assert(0);
2466 : }
2467 : }
2468 :
2469 : Assert(0);
2470 0 : return false; /* NOTREACHED */
2471 : }
2472 :
2473 : /* integer bitwise operators */
2474 28 : case PGBENCH_BITAND:
2475 : case PGBENCH_BITOR:
2476 : case PGBENCH_BITXOR:
2477 : case PGBENCH_LSHIFT:
2478 : case PGBENCH_RSHIFT:
2479 : {
2480 : int64 li,
2481 : ri;
2482 :
2483 28 : if (!coerceToInt(&vargs[0], &li) || !coerceToInt(&vargs[1], &ri))
2484 0 : return false;
2485 :
2486 28 : if (func == PGBENCH_BITAND)
2487 2 : setIntValue(retval, li & ri);
2488 26 : else if (func == PGBENCH_BITOR)
2489 4 : setIntValue(retval, li | ri);
2490 22 : else if (func == PGBENCH_BITXOR)
2491 6 : setIntValue(retval, li ^ ri);
2492 16 : else if (func == PGBENCH_LSHIFT)
2493 14 : setIntValue(retval, li << ri);
2494 2 : else if (func == PGBENCH_RSHIFT)
2495 2 : setIntValue(retval, li >> ri);
2496 : else /* cannot get here */
2497 : Assert(0);
2498 :
2499 28 : return true;
2500 : }
2501 :
2502 : /* logical operators */
2503 32 : case PGBENCH_NOT:
2504 : {
2505 : bool b;
2506 :
2507 32 : if (!coerceToBool(&vargs[0], &b))
2508 2 : return false;
2509 :
2510 30 : setBoolValue(retval, !b);
2511 30 : return true;
2512 : }
2513 :
2514 : /* no arguments */
2515 2 : case PGBENCH_PI:
2516 2 : setDoubleValue(retval, M_PI);
2517 2 : return true;
2518 :
2519 : /* 1 overloaded argument */
2520 4 : case PGBENCH_ABS:
2521 : {
2522 4 : PgBenchValue *varg = &vargs[0];
2523 :
2524 : Assert(nargs == 1);
2525 :
2526 4 : if (varg->type == PGBT_INT)
2527 : {
2528 2 : int64 i = varg->u.ival;
2529 :
2530 2 : setIntValue(retval, i < 0 ? -i : i);
2531 : }
2532 : else
2533 : {
2534 2 : double d = varg->u.dval;
2535 :
2536 : Assert(varg->type == PGBT_DOUBLE);
2537 2 : setDoubleValue(retval, d < 0.0 ? -d : d);
2538 : }
2539 :
2540 4 : return true;
2541 : }
2542 :
2543 168 : case PGBENCH_DEBUG:
2544 : {
2545 168 : PgBenchValue *varg = &vargs[0];
2546 :
2547 : Assert(nargs == 1);
2548 :
2549 168 : fprintf(stderr, "debug(script=%d,command=%d): ",
2550 168 : st->use_file, st->command + 1);
2551 :
2552 168 : if (varg->type == PGBT_NULL)
2553 4 : fprintf(stderr, "null\n");
2554 164 : else if (varg->type == PGBT_BOOLEAN)
2555 38 : fprintf(stderr, "boolean %s\n", varg->u.bval ? "true" : "false");
2556 126 : else if (varg->type == PGBT_INT)
2557 94 : fprintf(stderr, "int " INT64_FORMAT "\n", varg->u.ival);
2558 32 : else if (varg->type == PGBT_DOUBLE)
2559 32 : fprintf(stderr, "double %.*g\n", DBL_DIG, varg->u.dval);
2560 : else /* internal error, unexpected type */
2561 : Assert(0);
2562 :
2563 168 : *retval = *varg;
2564 :
2565 168 : return true;
2566 : }
2567 :
2568 : /* 1 double argument */
2569 10 : case PGBENCH_DOUBLE:
2570 : case PGBENCH_SQRT:
2571 : case PGBENCH_LN:
2572 : case PGBENCH_EXP:
2573 : {
2574 : double dval;
2575 :
2576 : Assert(nargs == 1);
2577 :
2578 10 : if (!coerceToDouble(&vargs[0], &dval))
2579 2 : return false;
2580 :
2581 8 : if (func == PGBENCH_SQRT)
2582 2 : dval = sqrt(dval);
2583 6 : else if (func == PGBENCH_LN)
2584 2 : dval = log(dval);
2585 4 : else if (func == PGBENCH_EXP)
2586 2 : dval = exp(dval);
2587 : /* else is cast: do nothing */
2588 :
2589 8 : setDoubleValue(retval, dval);
2590 8 : return true;
2591 : }
2592 :
2593 : /* 1 int argument */
2594 4 : case PGBENCH_INT:
2595 : {
2596 : int64 ival;
2597 :
2598 : Assert(nargs == 1);
2599 :
2600 4 : if (!coerceToInt(&vargs[0], &ival))
2601 2 : return false;
2602 :
2603 2 : setIntValue(retval, ival);
2604 2 : return true;
2605 : }
2606 :
2607 : /* variable number of arguments */
2608 8 : case PGBENCH_LEAST:
2609 : case PGBENCH_GREATEST:
2610 : {
2611 : bool havedouble;
2612 : int i;
2613 :
2614 : Assert(nargs >= 1);
2615 :
2616 : /* need double result if any input is double */
2617 8 : havedouble = false;
2618 28 : for (i = 0; i < nargs; i++)
2619 : {
2620 24 : if (vargs[i].type == PGBT_DOUBLE)
2621 : {
2622 4 : havedouble = true;
2623 4 : break;
2624 : }
2625 : }
2626 8 : if (havedouble)
2627 : {
2628 : double extremum;
2629 :
2630 4 : if (!coerceToDouble(&vargs[0], &extremum))
2631 0 : return false;
2632 12 : for (i = 1; i < nargs; i++)
2633 : {
2634 : double dval;
2635 :
2636 8 : if (!coerceToDouble(&vargs[i], &dval))
2637 0 : return false;
2638 8 : if (func == PGBENCH_LEAST)
2639 4 : extremum = Min(extremum, dval);
2640 : else
2641 4 : extremum = Max(extremum, dval);
2642 : }
2643 4 : setDoubleValue(retval, extremum);
2644 : }
2645 : else
2646 : {
2647 : int64 extremum;
2648 :
2649 4 : if (!coerceToInt(&vargs[0], &extremum))
2650 0 : return false;
2651 16 : for (i = 1; i < nargs; i++)
2652 : {
2653 : int64 ival;
2654 :
2655 12 : if (!coerceToInt(&vargs[i], &ival))
2656 0 : return false;
2657 12 : if (func == PGBENCH_LEAST)
2658 6 : extremum = Min(extremum, ival);
2659 : else
2660 6 : extremum = Max(extremum, ival);
2661 : }
2662 4 : setIntValue(retval, extremum);
2663 : }
2664 8 : return true;
2665 : }
2666 :
2667 : /* random functions */
2668 3072 : case PGBENCH_RANDOM:
2669 : case PGBENCH_RANDOM_EXPONENTIAL:
2670 : case PGBENCH_RANDOM_GAUSSIAN:
2671 : case PGBENCH_RANDOM_ZIPFIAN:
2672 : {
2673 : int64 imin,
2674 : imax,
2675 : delta;
2676 :
2677 : Assert(nargs >= 2);
2678 :
2679 3072 : if (!coerceToInt(&vargs[0], &imin) ||
2680 3070 : !coerceToInt(&vargs[1], &imax))
2681 2 : return false;
2682 :
2683 : /* check random range */
2684 3070 : if (unlikely(imin > imax))
2685 : {
2686 2 : pg_log_error("empty range given to random");
2687 2 : return false;
2688 : }
2689 3068 : else if (unlikely(pg_sub_s64_overflow(imax, imin, &delta) ||
2690 : pg_add_s64_overflow(delta, 1, &delta)))
2691 : {
2692 : /* prevent int overflows in random functions */
2693 2 : pg_log_error("random range is too large");
2694 2 : return false;
2695 : }
2696 :
2697 3066 : if (func == PGBENCH_RANDOM)
2698 : {
2699 : Assert(nargs == 2);
2700 3040 : setIntValue(retval, getrand(&st->cs_func_rs, imin, imax));
2701 : }
2702 : else /* gaussian & exponential */
2703 : {
2704 : double param;
2705 :
2706 : Assert(nargs == 3);
2707 :
2708 26 : if (!coerceToDouble(&vargs[2], ¶m))
2709 8 : return false;
2710 :
2711 26 : if (func == PGBENCH_RANDOM_GAUSSIAN)
2712 : {
2713 8 : if (param < MIN_GAUSSIAN_PARAM)
2714 : {
2715 2 : pg_log_error("gaussian parameter must be at least %f (not %f)",
2716 : MIN_GAUSSIAN_PARAM, param);
2717 2 : return false;
2718 : }
2719 :
2720 6 : setIntValue(retval,
2721 : getGaussianRand(&st->cs_func_rs,
2722 : imin, imax, param));
2723 : }
2724 18 : else if (func == PGBENCH_RANDOM_ZIPFIAN)
2725 : {
2726 10 : if (param < MIN_ZIPFIAN_PARAM || param > MAX_ZIPFIAN_PARAM)
2727 : {
2728 4 : pg_log_error("zipfian parameter must be in range [%.3f, %.0f] (not %f)",
2729 : MIN_ZIPFIAN_PARAM, MAX_ZIPFIAN_PARAM, param);
2730 4 : return false;
2731 : }
2732 :
2733 6 : setIntValue(retval,
2734 : getZipfianRand(&st->cs_func_rs, imin, imax, param));
2735 : }
2736 : else /* exponential */
2737 : {
2738 8 : if (param <= 0.0)
2739 : {
2740 2 : pg_log_error("exponential parameter must be greater than zero (not %f)",
2741 : param);
2742 2 : return false;
2743 : }
2744 :
2745 6 : setIntValue(retval,
2746 : getExponentialRand(&st->cs_func_rs,
2747 : imin, imax, param));
2748 : }
2749 : }
2750 :
2751 3058 : return true;
2752 : }
2753 :
2754 18 : case PGBENCH_POW:
2755 : {
2756 18 : PgBenchValue *lval = &vargs[0];
2757 18 : PgBenchValue *rval = &vargs[1];
2758 : double ld,
2759 : rd;
2760 :
2761 : Assert(nargs == 2);
2762 :
2763 18 : if (!coerceToDouble(lval, &ld) ||
2764 18 : !coerceToDouble(rval, &rd))
2765 0 : return false;
2766 :
2767 18 : setDoubleValue(retval, pow(ld, rd));
2768 :
2769 18 : return true;
2770 : }
2771 :
2772 20 : case PGBENCH_IS:
2773 : {
2774 : Assert(nargs == 2);
2775 :
2776 : /*
2777 : * note: this simple implementation is more permissive than
2778 : * SQL
2779 : */
2780 20 : setBoolValue(retval,
2781 30 : vargs[0].type == vargs[1].type &&
2782 10 : vargs[0].u.bval == vargs[1].u.bval);
2783 20 : return true;
2784 : }
2785 :
2786 : /* hashing */
2787 12 : case PGBENCH_HASH_FNV1A:
2788 : case PGBENCH_HASH_MURMUR2:
2789 : {
2790 : int64 val,
2791 : seed;
2792 :
2793 : Assert(nargs == 2);
2794 :
2795 12 : if (!coerceToInt(&vargs[0], &val) ||
2796 12 : !coerceToInt(&vargs[1], &seed))
2797 0 : return false;
2798 :
2799 12 : if (func == PGBENCH_HASH_MURMUR2)
2800 10 : setIntValue(retval, getHashMurmur2(val, seed));
2801 2 : else if (func == PGBENCH_HASH_FNV1A)
2802 2 : setIntValue(retval, getHashFnv1a(val, seed));
2803 : else
2804 : /* cannot get here */
2805 : Assert(0);
2806 :
2807 12 : return true;
2808 : }
2809 :
2810 92 : case PGBENCH_PERMUTE:
2811 : {
2812 : int64 val,
2813 : size,
2814 : seed;
2815 :
2816 : Assert(nargs == 3);
2817 :
2818 92 : if (!coerceToInt(&vargs[0], &val) ||
2819 92 : !coerceToInt(&vargs[1], &size) ||
2820 92 : !coerceToInt(&vargs[2], &seed))
2821 0 : return false;
2822 :
2823 92 : if (size <= 0)
2824 : {
2825 2 : pg_log_error("permute size parameter must be greater than zero");
2826 2 : return false;
2827 : }
2828 :
2829 90 : setIntValue(retval, permute(val, size, seed));
2830 90 : return true;
2831 : }
2832 :
2833 0 : default:
2834 : /* cannot get here */
2835 : Assert(0);
2836 : /* dead code to avoid a compiler warning */
2837 0 : return false;
2838 : }
2839 : }
2840 :
2841 : /* evaluate some function */
2842 : static bool
2843 7004 : evalFunc(CState *st,
2844 : PgBenchFunction func, PgBenchExprLink *args, PgBenchValue *retval)
2845 : {
2846 7004 : if (isLazyFunc(func))
2847 126 : return evalLazyFunc(st, func, args, retval);
2848 : else
2849 6878 : return evalStandardFunc(st, func, args, retval);
2850 : }
2851 :
2852 : /*
2853 : * Recursive evaluation of an expression in a pgbench script
2854 : * using the current state of variables.
2855 : * Returns whether the evaluation was ok,
2856 : * the value itself is returned through the retval pointer.
2857 : */
2858 : static bool
2859 18378 : evaluateExpr(CState *st, PgBenchExpr *expr, PgBenchValue *retval)
2860 : {
2861 18378 : switch (expr->etype)
2862 : {
2863 7354 : case ENODE_CONSTANT:
2864 : {
2865 7354 : *retval = expr->u.constant;
2866 7354 : return true;
2867 : }
2868 :
2869 4020 : case ENODE_VARIABLE:
2870 : {
2871 : Variable *var;
2872 :
2873 4020 : if ((var = lookupVariable(&st->variables, expr->u.variable.varname)) == NULL)
2874 : {
2875 4 : pg_log_error("undefined variable \"%s\"", expr->u.variable.varname);
2876 4 : return false;
2877 : }
2878 :
2879 4016 : if (!makeVariableValue(var))
2880 4 : return false;
2881 :
2882 4012 : *retval = var->value;
2883 4012 : return true;
2884 : }
2885 :
2886 7004 : case ENODE_FUNCTION:
2887 7004 : return evalFunc(st,
2888 : expr->u.function.function,
2889 : expr->u.function.args,
2890 : retval);
2891 :
2892 0 : default:
2893 : /* internal error which should never occur */
2894 0 : pg_fatal("unexpected enode type in evaluation: %d", expr->etype);
2895 : }
2896 : }
2897 :
2898 : /*
2899 : * Convert command name to meta-command enum identifier
2900 : */
2901 : static MetaCommand
2902 1064 : getMetaCommand(const char *cmd)
2903 : {
2904 : MetaCommand mc;
2905 :
2906 1064 : if (cmd == NULL)
2907 0 : mc = META_NONE;
2908 1064 : else if (pg_strcasecmp(cmd, "set") == 0)
2909 726 : mc = META_SET;
2910 338 : else if (pg_strcasecmp(cmd, "setshell") == 0)
2911 8 : mc = META_SETSHELL;
2912 330 : else if (pg_strcasecmp(cmd, "shell") == 0)
2913 10 : mc = META_SHELL;
2914 320 : else if (pg_strcasecmp(cmd, "sleep") == 0)
2915 18 : mc = META_SLEEP;
2916 302 : else if (pg_strcasecmp(cmd, "if") == 0)
2917 48 : mc = META_IF;
2918 254 : else if (pg_strcasecmp(cmd, "elif") == 0)
2919 26 : mc = META_ELIF;
2920 228 : else if (pg_strcasecmp(cmd, "else") == 0)
2921 28 : mc = META_ELSE;
2922 200 : else if (pg_strcasecmp(cmd, "endif") == 0)
2923 42 : mc = META_ENDIF;
2924 158 : else if (pg_strcasecmp(cmd, "gset") == 0)
2925 64 : mc = META_GSET;
2926 94 : else if (pg_strcasecmp(cmd, "aset") == 0)
2927 6 : mc = META_ASET;
2928 88 : else if (pg_strcasecmp(cmd, "startpipeline") == 0)
2929 42 : mc = META_STARTPIPELINE;
2930 46 : else if (pg_strcasecmp(cmd, "syncpipeline") == 0)
2931 10 : mc = META_SYNCPIPELINE;
2932 36 : else if (pg_strcasecmp(cmd, "endpipeline") == 0)
2933 34 : mc = META_ENDPIPELINE;
2934 : else
2935 2 : mc = META_NONE;
2936 1064 : return mc;
2937 : }
2938 :
2939 : /*
2940 : * Run a shell command. The result is assigned to the variable if not NULL.
2941 : * Return true if succeeded, or false on error.
2942 : */
2943 : static bool
2944 12 : runShellCommand(Variables *variables, char *variable, char **argv, int argc)
2945 : {
2946 : char command[SHELL_COMMAND_SIZE];
2947 : int i,
2948 12 : len = 0;
2949 : FILE *fp;
2950 : char res[64];
2951 : char *endptr;
2952 : int retval;
2953 :
2954 : /*----------
2955 : * Join arguments with whitespace separators. Arguments starting with
2956 : * exactly one colon are treated as variables:
2957 : * name - append a string "name"
2958 : * :var - append a variable named 'var'
2959 : * ::name - append a string ":name"
2960 : *----------
2961 : */
2962 34 : for (i = 0; i < argc; i++)
2963 : {
2964 : char *arg;
2965 : int arglen;
2966 :
2967 24 : if (argv[i][0] != ':')
2968 : {
2969 18 : arg = argv[i]; /* a string literal */
2970 : }
2971 6 : else if (argv[i][1] == ':')
2972 : {
2973 2 : arg = argv[i] + 1; /* a string literal starting with colons */
2974 : }
2975 4 : else if ((arg = getVariable(variables, argv[i] + 1)) == NULL)
2976 : {
2977 2 : pg_log_error("%s: undefined variable \"%s\"", argv[0], argv[i]);
2978 2 : return false;
2979 : }
2980 :
2981 22 : arglen = strlen(arg);
2982 22 : if (len + arglen + (i > 0 ? 1 : 0) >= SHELL_COMMAND_SIZE - 1)
2983 : {
2984 0 : pg_log_error("%s: shell command is too long", argv[0]);
2985 0 : return false;
2986 : }
2987 :
2988 22 : if (i > 0)
2989 10 : command[len++] = ' ';
2990 22 : memcpy(command + len, arg, arglen);
2991 22 : len += arglen;
2992 : }
2993 :
2994 10 : command[len] = '\0';
2995 :
2996 10 : fflush(NULL); /* needed before either system() or popen() */
2997 :
2998 : /* Fast path for non-assignment case */
2999 10 : if (variable == NULL)
3000 : {
3001 4 : if (system(command))
3002 : {
3003 2 : if (!timer_exceeded)
3004 2 : pg_log_error("%s: could not launch shell command", argv[0]);
3005 2 : return false;
3006 : }
3007 2 : return true;
3008 : }
3009 :
3010 : /* Execute the command with pipe and read the standard output. */
3011 6 : if ((fp = popen(command, "r")) == NULL)
3012 : {
3013 0 : pg_log_error("%s: could not launch shell command", argv[0]);
3014 0 : return false;
3015 : }
3016 6 : if (fgets(res, sizeof(res), fp) == NULL)
3017 : {
3018 2 : if (!timer_exceeded)
3019 2 : pg_log_error("%s: could not read result of shell command", argv[0]);
3020 2 : (void) pclose(fp);
3021 2 : return false;
3022 : }
3023 4 : if (pclose(fp) < 0)
3024 : {
3025 0 : pg_log_error("%s: could not run shell command: %m", argv[0]);
3026 0 : return false;
3027 : }
3028 :
3029 : /* Check whether the result is an integer and assign it to the variable */
3030 4 : retval = (int) strtol(res, &endptr, 10);
3031 6 : while (*endptr != '\0' && isspace((unsigned char) *endptr))
3032 2 : endptr++;
3033 4 : if (*res == '\0' || *endptr != '\0')
3034 : {
3035 2 : pg_log_error("%s: shell command must return an integer (not \"%s\")", argv[0], res);
3036 2 : return false;
3037 : }
3038 2 : if (!putVariableInt(variables, "setshell", variable, retval))
3039 0 : return false;
3040 :
3041 2 : pg_log_debug("%s: shell parameter name: \"%s\", value: \"%s\"", argv[0], argv[1], res);
3042 :
3043 2 : return true;
3044 : }
3045 :
3046 : /*
3047 : * Report the abortion of the client when processing SQL commands.
3048 : */
3049 : static void
3050 64 : commandFailed(CState *st, const char *cmd, const char *message)
3051 : {
3052 64 : pg_log_error("client %d aborted in command %d (%s) of script %d; %s",
3053 : st->id, st->command, cmd, st->use_file, message);
3054 64 : }
3055 :
3056 : /*
3057 : * Report the error in the command while the script is executing.
3058 : */
3059 : static void
3060 4 : commandError(CState *st, const char *message)
3061 : {
3062 : Assert(sql_script[st->use_file].commands[st->command]->type == SQL_COMMAND);
3063 4 : pg_log_info("client %d got an error in command %d (SQL) of script %d; %s",
3064 : st->id, st->command, st->use_file, message);
3065 4 : }
3066 :
3067 : /* return a script number with a weighted choice. */
3068 : static int
3069 15488 : chooseScript(TState *thread)
3070 : {
3071 15488 : int i = 0;
3072 : int64 w;
3073 :
3074 15488 : if (num_scripts == 1)
3075 12788 : return 0;
3076 :
3077 2700 : w = getrand(&thread->ts_choose_rs, 0, total_weight - 1);
3078 : do
3079 : {
3080 6488 : w -= sql_script[i++].weight;
3081 6488 : } while (w >= 0);
3082 :
3083 2700 : return i - 1;
3084 : }
3085 :
3086 : /*
3087 : * Allocate space for CState->prepared: we need one boolean for each command
3088 : * of each script.
3089 : */
3090 : static void
3091 68 : allocCStatePrepared(CState *st)
3092 : {
3093 : Assert(st->prepared == NULL);
3094 :
3095 68 : st->prepared = pg_malloc(sizeof(bool *) * num_scripts);
3096 148 : for (int i = 0; i < num_scripts; i++)
3097 : {
3098 80 : ParsedScript *script = &sql_script[i];
3099 : int numcmds;
3100 :
3101 340 : for (numcmds = 0; script->commands[numcmds] != NULL; numcmds++)
3102 : ;
3103 80 : st->prepared[i] = pg_malloc0(sizeof(bool) * numcmds);
3104 : }
3105 68 : }
3106 :
3107 : /*
3108 : * Prepare the SQL command from st->use_file at command_num.
3109 : */
3110 : static void
3111 4008 : prepareCommand(CState *st, int command_num)
3112 : {
3113 4008 : Command *command = sql_script[st->use_file].commands[command_num];
3114 :
3115 : /* No prepare for non-SQL commands */
3116 4008 : if (command->type != SQL_COMMAND)
3117 0 : return;
3118 :
3119 4008 : if (!st->prepared)
3120 58 : allocCStatePrepared(st);
3121 :
3122 4008 : if (!st->prepared[st->use_file][command_num])
3123 : {
3124 : PGresult *res;
3125 :
3126 218 : pg_log_debug("client %d preparing %s", st->id, command->prepname);
3127 218 : res = PQprepare(st->con, command->prepname,
3128 218 : command->argv[0], command->argc - 1, NULL);
3129 218 : if (PQresultStatus(res) != PGRES_COMMAND_OK)
3130 2 : pg_log_error("%s", PQerrorMessage(st->con));
3131 218 : PQclear(res);
3132 218 : st->prepared[st->use_file][command_num] = true;
3133 : }
3134 : }
3135 :
3136 : /*
3137 : * Prepare all the commands in the script that come after the \startpipeline
3138 : * that's at position st->command, and the first \endpipeline we find.
3139 : *
3140 : * This sets the ->prepared flag for each relevant command as well as the
3141 : * \startpipeline itself, but doesn't move the st->command counter.
3142 : */
3143 : static void
3144 84 : prepareCommandsInPipeline(CState *st)
3145 : {
3146 : int j;
3147 84 : Command **commands = sql_script[st->use_file].commands;
3148 :
3149 : Assert(commands[st->command]->type == META_COMMAND &&
3150 : commands[st->command]->meta == META_STARTPIPELINE);
3151 :
3152 84 : if (!st->prepared)
3153 10 : allocCStatePrepared(st);
3154 :
3155 : /*
3156 : * We set the 'prepared' flag on the \startpipeline itself to flag that we
3157 : * don't need to do this next time without calling prepareCommand(), even
3158 : * though we don't actually prepare this command.
3159 : */
3160 84 : if (st->prepared[st->use_file][st->command])
3161 72 : return;
3162 :
3163 128 : for (j = st->command + 1; commands[j] != NULL; j++)
3164 : {
3165 128 : if (commands[j]->type == META_COMMAND &&
3166 12 : commands[j]->meta == META_ENDPIPELINE)
3167 12 : break;
3168 :
3169 116 : prepareCommand(st, j);
3170 : }
3171 :
3172 12 : st->prepared[st->use_file][st->command] = true;
3173 : }
3174 :
3175 : /* Send a SQL command, using the chosen querymode */
3176 : static bool
3177 21336 : sendCommand(CState *st, Command *command)
3178 : {
3179 : int r;
3180 :
3181 21336 : if (querymode == QUERY_SIMPLE)
3182 : {
3183 : char *sql;
3184 :
3185 16258 : sql = pg_strdup(command->argv[0]);
3186 16258 : sql = assignVariables(&st->variables, sql);
3187 :
3188 16258 : pg_log_debug("client %d sending %s", st->id, sql);
3189 16258 : r = PQsendQuery(st->con, sql);
3190 16258 : free(sql);
3191 : }
3192 5078 : else if (querymode == QUERY_EXTENDED)
3193 : {
3194 1186 : const char *sql = command->argv[0];
3195 : const char *params[MAX_ARGS];
3196 :
3197 1186 : getQueryParams(&st->variables, command, params);
3198 :
3199 1186 : pg_log_debug("client %d sending %s", st->id, sql);
3200 1186 : r = PQsendQueryParams(st->con, sql, command->argc - 1,
3201 : NULL, params, NULL, NULL, 0);
3202 : }
3203 3892 : else if (querymode == QUERY_PREPARED)
3204 : {
3205 : const char *params[MAX_ARGS];
3206 :
3207 3892 : prepareCommand(st, st->command);
3208 3892 : getQueryParams(&st->variables, command, params);
3209 :
3210 3892 : pg_log_debug("client %d sending %s", st->id, command->prepname);
3211 3892 : r = PQsendQueryPrepared(st->con, command->prepname, command->argc - 1,
3212 : params, NULL, NULL, 0);
3213 : }
3214 : else /* unknown sql mode */
3215 0 : r = 0;
3216 :
3217 21336 : if (r == 0)
3218 : {
3219 0 : pg_log_debug("client %d could not send %s", st->id, command->argv[0]);
3220 0 : return false;
3221 : }
3222 : else
3223 21336 : return true;
3224 : }
3225 :
3226 : /*
3227 : * Get the error status from the error code.
3228 : */
3229 : static EStatus
3230 26 : getSQLErrorStatus(const char *sqlState)
3231 : {
3232 26 : if (sqlState != NULL)
3233 : {
3234 26 : if (strcmp(sqlState, ERRCODE_T_R_SERIALIZATION_FAILURE) == 0)
3235 2 : return ESTATUS_SERIALIZATION_ERROR;
3236 24 : else if (strcmp(sqlState, ERRCODE_T_R_DEADLOCK_DETECTED) == 0)
3237 2 : return ESTATUS_DEADLOCK_ERROR;
3238 : }
3239 :
3240 22 : return ESTATUS_OTHER_SQL_ERROR;
3241 : }
3242 :
3243 : /*
3244 : * Returns true if this type of error can be retried.
3245 : */
3246 : static bool
3247 66 : canRetryError(EStatus estatus)
3248 : {
3249 66 : return (estatus == ESTATUS_SERIALIZATION_ERROR ||
3250 : estatus == ESTATUS_DEADLOCK_ERROR);
3251 : }
3252 :
3253 : /*
3254 : * Process query response from the backend.
3255 : *
3256 : * If varprefix is not NULL, it's the variable name prefix where to store
3257 : * the results of the *last* command (META_GSET) or *all* commands
3258 : * (META_ASET).
3259 : *
3260 : * Returns true if everything is A-OK, false if any error occurs.
3261 : */
3262 : static bool
3263 21426 : readCommandResponse(CState *st, MetaCommand meta, char *varprefix)
3264 : {
3265 : PGresult *res;
3266 : PGresult *next_res;
3267 21426 : int qrynum = 0;
3268 :
3269 : /*
3270 : * varprefix should be set only with \gset or \aset, and \endpipeline and
3271 : * SQL commands do not need it.
3272 : */
3273 : Assert((meta == META_NONE && varprefix == NULL) ||
3274 : ((meta == META_ENDPIPELINE) && varprefix == NULL) ||
3275 : ((meta == META_GSET || meta == META_ASET) && varprefix != NULL));
3276 :
3277 21426 : res = PQgetResult(st->con);
3278 :
3279 42828 : while (res != NULL)
3280 : {
3281 : bool is_last;
3282 :
3283 : /* peek at the next result to know whether the current is last */
3284 21438 : next_res = PQgetResult(st->con);
3285 21438 : is_last = (next_res == NULL);
3286 :
3287 21438 : switch (PQresultStatus(res))
3288 : {
3289 16656 : case PGRES_COMMAND_OK: /* non-SELECT commands */
3290 : case PGRES_EMPTY_QUERY: /* may be used for testing no-op overhead */
3291 16656 : if (is_last && meta == META_GSET)
3292 : {
3293 2 : pg_log_error("client %d script %d command %d query %d: expected one row, got %d",
3294 : st->id, st->use_file, st->command, qrynum, 0);
3295 2 : st->estatus = ESTATUS_META_COMMAND_ERROR;
3296 2 : goto error;
3297 : }
3298 16654 : break;
3299 :
3300 4648 : case PGRES_TUPLES_OK:
3301 4648 : if ((is_last && meta == META_GSET) || meta == META_ASET)
3302 : {
3303 1042 : int ntuples = PQntuples(res);
3304 :
3305 1042 : if (meta == META_GSET && ntuples != 1)
3306 : {
3307 : /* under \gset, report the error */
3308 4 : pg_log_error("client %d script %d command %d query %d: expected one row, got %d",
3309 : st->id, st->use_file, st->command, qrynum, PQntuples(res));
3310 4 : st->estatus = ESTATUS_META_COMMAND_ERROR;
3311 4 : goto error;
3312 : }
3313 1038 : else if (meta == META_ASET && ntuples <= 0)
3314 : {
3315 : /* coldly skip empty result under \aset */
3316 2 : break;
3317 : }
3318 :
3319 : /* store results into variables */
3320 2072 : for (int fld = 0; fld < PQnfields(res); fld++)
3321 : {
3322 1040 : char *varname = PQfname(res, fld);
3323 :
3324 : /* allocate varname only if necessary, freed below */
3325 1040 : if (*varprefix != '\0')
3326 2 : varname = psprintf("%s%s", varprefix, varname);
3327 :
3328 : /* store last row result as a string */
3329 1040 : if (!putVariable(&st->variables, meta == META_ASET ? "aset" : "gset", varname,
3330 1040 : PQgetvalue(res, ntuples - 1, fld)))
3331 : {
3332 : /* internal error */
3333 4 : pg_log_error("client %d script %d command %d query %d: error storing into variable %s",
3334 : st->id, st->use_file, st->command, qrynum, varname);
3335 4 : st->estatus = ESTATUS_META_COMMAND_ERROR;
3336 4 : goto error;
3337 : }
3338 :
3339 1036 : if (*varprefix != '\0')
3340 2 : pg_free(varname);
3341 : }
3342 : }
3343 : /* otherwise the result is simply thrown away by PQclear below */
3344 4638 : break;
3345 :
3346 108 : case PGRES_PIPELINE_SYNC:
3347 108 : pg_log_debug("client %d pipeline ending, ongoing syncs: %d",
3348 : st->id, st->num_syncs);
3349 108 : st->num_syncs--;
3350 108 : if (st->num_syncs == 0 && PQexitPipelineMode(st->con) != 1)
3351 0 : pg_log_error("client %d failed to exit pipeline mode: %s", st->id,
3352 : PQerrorMessage(st->con));
3353 108 : break;
3354 :
3355 26 : case PGRES_NONFATAL_ERROR:
3356 : case PGRES_FATAL_ERROR:
3357 26 : st->estatus = getSQLErrorStatus(PQresultErrorField(res,
3358 : PG_DIAG_SQLSTATE));
3359 26 : if (canRetryError(st->estatus))
3360 : {
3361 4 : if (verbose_errors)
3362 4 : commandError(st, PQerrorMessage(st->con));
3363 4 : goto error;
3364 : }
3365 : /* fall through */
3366 :
3367 : default:
3368 : /* anything else is unexpected */
3369 22 : pg_log_error("client %d script %d aborted in command %d query %d: %s",
3370 : st->id, st->use_file, st->command, qrynum,
3371 : PQerrorMessage(st->con));
3372 22 : goto error;
3373 : }
3374 :
3375 21402 : PQclear(res);
3376 21402 : qrynum++;
3377 21402 : res = next_res;
3378 : }
3379 :
3380 21390 : if (qrynum == 0)
3381 : {
3382 0 : pg_log_error("client %d command %d: no results", st->id, st->command);
3383 0 : return false;
3384 : }
3385 :
3386 21390 : return true;
3387 :
3388 36 : error:
3389 36 : PQclear(res);
3390 36 : PQclear(next_res);
3391 : do
3392 : {
3393 44 : res = PQgetResult(st->con);
3394 44 : PQclear(res);
3395 44 : } while (res);
3396 :
3397 36 : return false;
3398 : }
3399 :
3400 : /*
3401 : * Parse the argument to a \sleep command, and return the requested amount
3402 : * of delay, in microseconds. Returns true on success, false on error.
3403 : */
3404 : static bool
3405 12 : evaluateSleep(Variables *variables, int argc, char **argv, int *usecs)
3406 : {
3407 : char *var;
3408 : int usec;
3409 :
3410 12 : if (*argv[1] == ':')
3411 : {
3412 6 : if ((var = getVariable(variables, argv[1] + 1)) == NULL)
3413 : {
3414 2 : pg_log_error("%s: undefined variable \"%s\"", argv[0], argv[1] + 1);
3415 2 : return false;
3416 : }
3417 :
3418 4 : usec = atoi(var);
3419 :
3420 : /* Raise an error if the value of a variable is not a number */
3421 4 : if (usec == 0 && !isdigit((unsigned char) *var))
3422 : {
3423 0 : pg_log_error("%s: invalid sleep time \"%s\" for variable \"%s\"",
3424 : argv[0], var, argv[1] + 1);
3425 0 : return false;
3426 : }
3427 : }
3428 : else
3429 6 : usec = atoi(argv[1]);
3430 :
3431 10 : if (argc > 2)
3432 : {
3433 8 : if (pg_strcasecmp(argv[2], "ms") == 0)
3434 4 : usec *= 1000;
3435 4 : else if (pg_strcasecmp(argv[2], "s") == 0)
3436 2 : usec *= 1000000;
3437 : }
3438 : else
3439 2 : usec *= 1000000;
3440 :
3441 10 : *usecs = usec;
3442 10 : return true;
3443 : }
3444 :
3445 :
3446 : /*
3447 : * Returns true if the error can be retried.
3448 : */
3449 : static bool
3450 4 : doRetry(CState *st, pg_time_usec_t *now)
3451 : {
3452 : Assert(st->estatus != ESTATUS_NO_ERROR);
3453 :
3454 : /* We can only retry serialization or deadlock errors. */
3455 4 : if (!canRetryError(st->estatus))
3456 0 : return false;
3457 :
3458 : /*
3459 : * We must have at least one option to limit the retrying of transactions
3460 : * that got an error.
3461 : */
3462 : Assert(max_tries || latency_limit || duration > 0);
3463 :
3464 : /*
3465 : * We cannot retry the error if we have reached the maximum number of
3466 : * tries.
3467 : */
3468 4 : if (max_tries && st->tries >= max_tries)
3469 0 : return false;
3470 :
3471 : /*
3472 : * We cannot retry the error if we spent too much time on this
3473 : * transaction.
3474 : */
3475 4 : if (latency_limit)
3476 : {
3477 0 : pg_time_now_lazy(now);
3478 0 : if (*now - st->txn_scheduled > latency_limit)
3479 0 : return false;
3480 : }
3481 :
3482 : /*
3483 : * We cannot retry the error if the benchmark duration is over.
3484 : */
3485 4 : if (timer_exceeded)
3486 0 : return false;
3487 :
3488 : /* OK */
3489 4 : return true;
3490 : }
3491 :
3492 : /*
3493 : * Read results and discard it until a sync point.
3494 : */
3495 : static int
3496 0 : discardUntilSync(CState *st)
3497 : {
3498 0 : bool received_sync = false;
3499 :
3500 : /* send a sync */
3501 0 : if (!PQpipelineSync(st->con))
3502 : {
3503 0 : pg_log_error("client %d aborted: failed to send a pipeline sync",
3504 : st->id);
3505 0 : return 0;
3506 : }
3507 :
3508 : /* receive PGRES_PIPELINE_SYNC and null following it */
3509 : for (;;)
3510 0 : {
3511 0 : PGresult *res = PQgetResult(st->con);
3512 :
3513 0 : if (PQresultStatus(res) == PGRES_PIPELINE_SYNC)
3514 0 : received_sync = true;
3515 0 : else if (received_sync)
3516 : {
3517 : /*
3518 : * PGRES_PIPELINE_SYNC must be followed by another
3519 : * PGRES_PIPELINE_SYNC or NULL; otherwise, assert failure.
3520 : */
3521 : Assert(res == NULL);
3522 :
3523 : /*
3524 : * Reset ongoing sync count to 0 since all PGRES_PIPELINE_SYNC
3525 : * results have been discarded.
3526 : */
3527 0 : st->num_syncs = 0;
3528 0 : PQclear(res);
3529 0 : break;
3530 : }
3531 0 : PQclear(res);
3532 : }
3533 :
3534 : /* exit pipeline */
3535 0 : if (PQexitPipelineMode(st->con) != 1)
3536 : {
3537 0 : pg_log_error("client %d aborted: failed to exit pipeline mode for rolling back the failed transaction",
3538 : st->id);
3539 0 : return 0;
3540 : }
3541 0 : return 1;
3542 : }
3543 :
3544 : /*
3545 : * Get the transaction status at the end of a command especially for
3546 : * checking if we are in a (failed) transaction block.
3547 : */
3548 : static TStatus
3549 15386 : getTransactionStatus(PGconn *con)
3550 : {
3551 : PGTransactionStatusType tx_status;
3552 :
3553 15386 : tx_status = PQtransactionStatus(con);
3554 15386 : switch (tx_status)
3555 : {
3556 15382 : case PQTRANS_IDLE:
3557 15382 : return TSTATUS_IDLE;
3558 4 : case PQTRANS_INTRANS:
3559 : case PQTRANS_INERROR:
3560 4 : return TSTATUS_IN_BLOCK;
3561 0 : case PQTRANS_UNKNOWN:
3562 : /* PQTRANS_UNKNOWN is expected given a broken connection */
3563 0 : if (PQstatus(con) == CONNECTION_BAD)
3564 0 : return TSTATUS_CONN_ERROR;
3565 : /* fall through */
3566 : case PQTRANS_ACTIVE:
3567 : default:
3568 :
3569 : /*
3570 : * We cannot find out whether we are in a transaction block or
3571 : * not. Internal error which should never occur.
3572 : */
3573 0 : pg_log_error("unexpected transaction status %d", tx_status);
3574 0 : return TSTATUS_OTHER_ERROR;
3575 : }
3576 :
3577 : /* not reached */
3578 : Assert(false);
3579 : return TSTATUS_OTHER_ERROR;
3580 : }
3581 :
3582 : /*
3583 : * Print verbose messages of an error
3584 : */
3585 : static void
3586 4 : printVerboseErrorMessages(CState *st, pg_time_usec_t *now, bool is_retry)
3587 : {
3588 : static PQExpBuffer buf = NULL;
3589 :
3590 4 : if (buf == NULL)
3591 4 : buf = createPQExpBuffer();
3592 : else
3593 0 : resetPQExpBuffer(buf);
3594 :
3595 4 : printfPQExpBuffer(buf, "client %d ", st->id);
3596 4 : appendPQExpBufferStr(buf, (is_retry ?
3597 : "repeats the transaction after the error" :
3598 : "ends the failed transaction"));
3599 4 : appendPQExpBuffer(buf, " (try %u", st->tries);
3600 :
3601 : /* Print max_tries if it is not unlimited. */
3602 4 : if (max_tries)
3603 4 : appendPQExpBuffer(buf, "/%u", max_tries);
3604 :
3605 : /*
3606 : * If the latency limit is used, print a percentage of the current
3607 : * transaction latency from the latency limit.
3608 : */
3609 4 : if (latency_limit)
3610 : {
3611 0 : pg_time_now_lazy(now);
3612 0 : appendPQExpBuffer(buf, ", %.3f%% of the maximum time of tries was used",
3613 0 : (100.0 * (*now - st->txn_scheduled) / latency_limit));
3614 : }
3615 4 : appendPQExpBufferStr(buf, ")\n");
3616 :
3617 4 : pg_log_info("%s", buf->data);
3618 4 : }
3619 :
3620 : /*
3621 : * Advance the state machine of a connection.
3622 : */
3623 : static void
3624 35456 : advanceConnectionState(TState *thread, CState *st, StatsData *agg)
3625 : {
3626 :
3627 : /*
3628 : * gettimeofday() isn't free, so we get the current timestamp lazily the
3629 : * first time it's needed, and reuse the same value throughout this
3630 : * function after that. This also ensures that e.g. the calculated
3631 : * latency reported in the log file and in the totals are the same. Zero
3632 : * means "not set yet". Reset "now" when we execute shell commands or
3633 : * expressions, which might take a non-negligible amount of time, though.
3634 : */
3635 35456 : pg_time_usec_t now = 0;
3636 :
3637 : /*
3638 : * Loop in the state machine, until we have to wait for a result from the
3639 : * server or have to sleep for throttling or \sleep.
3640 : *
3641 : * Note: In the switch-statement below, 'break' will loop back here,
3642 : * meaning "continue in the state machine". Return is used to return to
3643 : * the caller, giving the thread the opportunity to advance another
3644 : * client.
3645 : */
3646 : for (;;)
3647 121898 : {
3648 : Command *command;
3649 :
3650 157354 : switch (st->state)
3651 : {
3652 : /* Select transaction (script) to run. */
3653 15488 : case CSTATE_CHOOSE_SCRIPT:
3654 15488 : st->use_file = chooseScript(thread);
3655 : Assert(conditional_stack_empty(st->cstack));
3656 :
3657 : /* reset transaction variables to default values */
3658 15488 : st->estatus = ESTATUS_NO_ERROR;
3659 15488 : st->tries = 1;
3660 :
3661 15488 : pg_log_debug("client %d executing script \"%s\"",
3662 : st->id, sql_script[st->use_file].desc);
3663 :
3664 : /*
3665 : * If time is over, we're done; otherwise, get ready to start
3666 : * a new transaction, or to get throttled if that's requested.
3667 : */
3668 30976 : st->state = timer_exceeded ? CSTATE_FINISHED :
3669 15488 : throttle_delay > 0 ? CSTATE_PREPARE_THROTTLE : CSTATE_START_TX;
3670 15488 : break;
3671 :
3672 : /* Start new transaction (script) */
3673 15486 : case CSTATE_START_TX:
3674 15486 : pg_time_now_lazy(&now);
3675 :
3676 : /* establish connection if needed, i.e. under --connect */
3677 15486 : if (st->con == NULL)
3678 : {
3679 220 : pg_time_usec_t start = now;
3680 :
3681 220 : if ((st->con = doConnect()) == NULL)
3682 : {
3683 : /*
3684 : * as the bench is already running, we do not abort
3685 : * the process
3686 : */
3687 0 : pg_log_error("client %d aborted while establishing connection", st->id);
3688 0 : st->state = CSTATE_ABORTED;
3689 0 : break;
3690 : }
3691 :
3692 : /* reset now after connection */
3693 220 : now = pg_time_now();
3694 :
3695 220 : thread->conn_duration += now - start;
3696 :
3697 : /* Reset session-local state */
3698 220 : pg_free(st->prepared);
3699 220 : st->prepared = NULL;
3700 : }
3701 :
3702 : /*
3703 : * It is the first try to run this transaction. Remember the
3704 : * random state: maybe it will get an error and we will need
3705 : * to run it again.
3706 : */
3707 15486 : st->random_state = st->cs_func_rs;
3708 :
3709 : /* record transaction start time */
3710 15486 : st->txn_begin = now;
3711 :
3712 : /*
3713 : * When not throttling, this is also the transaction's
3714 : * scheduled start time.
3715 : */
3716 15486 : if (!throttle_delay)
3717 15084 : st->txn_scheduled = now;
3718 :
3719 : /* Begin with the first command */
3720 15486 : st->state = CSTATE_START_COMMAND;
3721 15486 : st->command = 0;
3722 15486 : break;
3723 :
3724 : /*
3725 : * Handle throttling once per transaction by sleeping.
3726 : */
3727 420 : case CSTATE_PREPARE_THROTTLE:
3728 :
3729 : /*
3730 : * Generate a delay such that the series of delays will
3731 : * approximate a Poisson distribution centered on the
3732 : * throttle_delay time.
3733 : *
3734 : * If transactions are too slow or a given wait is shorter
3735 : * than a transaction, the next transaction will start right
3736 : * away.
3737 : */
3738 : Assert(throttle_delay > 0);
3739 :
3740 420 : thread->throttle_trigger +=
3741 420 : getPoissonRand(&thread->ts_throttle_rs, throttle_delay);
3742 420 : st->txn_scheduled = thread->throttle_trigger;
3743 :
3744 : /*
3745 : * If --latency-limit is used, and this slot is already late
3746 : * so that the transaction will miss the latency limit even if
3747 : * it completed immediately, skip this time slot and loop to
3748 : * reschedule.
3749 : */
3750 420 : if (latency_limit)
3751 : {
3752 420 : pg_time_now_lazy(&now);
3753 :
3754 420 : if (thread->throttle_trigger < now - latency_limit)
3755 : {
3756 18 : processXactStats(thread, st, &now, true, agg);
3757 :
3758 : /*
3759 : * Finish client if -T or -t was exceeded.
3760 : *
3761 : * Stop counting skipped transactions under -T as soon
3762 : * as the timer is exceeded. Because otherwise it can
3763 : * take a very long time to count all of them
3764 : * especially when quite a lot of them happen with
3765 : * unrealistically high rate setting in -R, which
3766 : * would prevent pgbench from ending immediately.
3767 : * Because of this behavior, note that there is no
3768 : * guarantee that all skipped transactions are counted
3769 : * under -T though there is under -t. This is OK in
3770 : * practice because it's very unlikely to happen with
3771 : * realistic setting.
3772 : */
3773 18 : if (timer_exceeded || (nxacts > 0 && st->cnt >= nxacts))
3774 2 : st->state = CSTATE_FINISHED;
3775 :
3776 : /* Go back to top of loop with CSTATE_PREPARE_THROTTLE */
3777 18 : break;
3778 : }
3779 : }
3780 :
3781 : /*
3782 : * stop client if next transaction is beyond pgbench end of
3783 : * execution; otherwise, throttle it.
3784 : */
3785 0 : st->state = end_time > 0 && st->txn_scheduled > end_time ?
3786 402 : CSTATE_FINISHED : CSTATE_THROTTLE;
3787 402 : break;
3788 :
3789 : /*
3790 : * Wait until it's time to start next transaction.
3791 : */
3792 402 : case CSTATE_THROTTLE:
3793 402 : pg_time_now_lazy(&now);
3794 :
3795 402 : if (now < st->txn_scheduled)
3796 0 : return; /* still sleeping, nothing to do here */
3797 :
3798 : /* done sleeping, but don't start transaction if we're done */
3799 402 : st->state = timer_exceeded ? CSTATE_FINISHED : CSTATE_START_TX;
3800 402 : break;
3801 :
3802 : /*
3803 : * Send a command to server (or execute a meta-command)
3804 : */
3805 41530 : case CSTATE_START_COMMAND:
3806 41530 : command = sql_script[st->use_file].commands[st->command];
3807 :
3808 : /*
3809 : * Transition to script end processing if done, but close up
3810 : * shop if a pipeline is open at this point.
3811 : */
3812 41530 : if (command == NULL)
3813 : {
3814 15388 : if (PQpipelineStatus(st->con) == PQ_PIPELINE_OFF)
3815 15382 : st->state = CSTATE_END_TX;
3816 : else
3817 : {
3818 6 : pg_log_error("client %d aborted: end of script reached with pipeline open",
3819 : st->id);
3820 6 : st->state = CSTATE_ABORTED;
3821 : }
3822 :
3823 15388 : break;
3824 : }
3825 :
3826 : /* record begin time of next command, and initiate it */
3827 26142 : if (report_per_command)
3828 : {
3829 802 : pg_time_now_lazy(&now);
3830 802 : st->stmt_begin = now;
3831 : }
3832 :
3833 : /* Execute the command */
3834 26142 : if (command->type == SQL_COMMAND)
3835 : {
3836 : /* disallow \aset and \gset in pipeline mode */
3837 21338 : if (PQpipelineStatus(st->con) != PQ_PIPELINE_OFF)
3838 : {
3839 1048 : if (command->meta == META_GSET)
3840 : {
3841 2 : commandFailed(st, "gset", "\\gset is not allowed in pipeline mode");
3842 2 : st->state = CSTATE_ABORTED;
3843 2 : break;
3844 : }
3845 1046 : else if (command->meta == META_ASET)
3846 : {
3847 0 : commandFailed(st, "aset", "\\aset is not allowed in pipeline mode");
3848 0 : st->state = CSTATE_ABORTED;
3849 0 : break;
3850 : }
3851 : }
3852 :
3853 21336 : if (!sendCommand(st, command))
3854 : {
3855 0 : commandFailed(st, "SQL", "SQL command send failed");
3856 0 : st->state = CSTATE_ABORTED;
3857 : }
3858 : else
3859 : {
3860 : /* Wait for results, unless in pipeline mode */
3861 21336 : if (PQpipelineStatus(st->con) == PQ_PIPELINE_OFF)
3862 20290 : st->state = CSTATE_WAIT_RESULT;
3863 : else
3864 1046 : st->state = CSTATE_END_COMMAND;
3865 : }
3866 : }
3867 4804 : else if (command->type == META_COMMAND)
3868 : {
3869 : /*-----
3870 : * Possible state changes when executing meta commands:
3871 : * - on errors CSTATE_ABORTED
3872 : * - on sleep CSTATE_SLEEP
3873 : * - else CSTATE_END_COMMAND
3874 : */
3875 4804 : st->state = executeMetaCommand(st, &now);
3876 4804 : if (st->state == CSTATE_ABORTED)
3877 62 : st->estatus = ESTATUS_META_COMMAND_ERROR;
3878 : }
3879 :
3880 : /*
3881 : * We're now waiting for an SQL command to complete, or
3882 : * finished processing a metacommand, or need to sleep, or
3883 : * something bad happened.
3884 : */
3885 : Assert(st->state == CSTATE_WAIT_RESULT ||
3886 : st->state == CSTATE_END_COMMAND ||
3887 : st->state == CSTATE_SLEEP ||
3888 : st->state == CSTATE_ABORTED);
3889 26140 : break;
3890 :
3891 : /*
3892 : * non executed conditional branch
3893 : */
3894 5146 : case CSTATE_SKIP_COMMAND:
3895 : Assert(!conditional_active(st->cstack));
3896 : /* quickly skip commands until something to do... */
3897 : while (true)
3898 : {
3899 5146 : command = sql_script[st->use_file].commands[st->command];
3900 :
3901 : /* cannot reach end of script in that state */
3902 : Assert(command != NULL);
3903 :
3904 : /*
3905 : * if this is conditional related, update conditional
3906 : * state
3907 : */
3908 5146 : if (command->type == META_COMMAND &&
3909 990 : (command->meta == META_IF ||
3910 984 : command->meta == META_ELIF ||
3911 968 : command->meta == META_ELSE ||
3912 954 : command->meta == META_ENDIF))
3913 : {
3914 966 : switch (conditional_stack_peek(st->cstack))
3915 : {
3916 936 : case IFSTATE_FALSE:
3917 936 : if (command->meta == META_IF)
3918 : {
3919 : /* nested if in skipped branch - ignore */
3920 4 : conditional_stack_push(st->cstack,
3921 : IFSTATE_IGNORED);
3922 4 : st->command++;
3923 : }
3924 932 : else if (command->meta == META_ELIF)
3925 : {
3926 : /* we must evaluate the condition */
3927 10 : st->state = CSTATE_START_COMMAND;
3928 : }
3929 922 : else if (command->meta == META_ELSE)
3930 : {
3931 : /* we must execute next command */
3932 6 : conditional_stack_poke(st->cstack,
3933 : IFSTATE_ELSE_TRUE);
3934 6 : st->state = CSTATE_START_COMMAND;
3935 6 : st->command++;
3936 : }
3937 916 : else if (command->meta == META_ENDIF)
3938 : {
3939 : Assert(!conditional_stack_empty(st->cstack));
3940 916 : conditional_stack_pop(st->cstack);
3941 916 : if (conditional_active(st->cstack))
3942 916 : st->state = CSTATE_START_COMMAND;
3943 : /* else state remains CSTATE_SKIP_COMMAND */
3944 916 : st->command++;
3945 : }
3946 936 : break;
3947 :
3948 30 : case IFSTATE_IGNORED:
3949 : case IFSTATE_ELSE_FALSE:
3950 30 : if (command->meta == META_IF)
3951 2 : conditional_stack_push(st->cstack,
3952 : IFSTATE_IGNORED);
3953 28 : else if (command->meta == META_ENDIF)
3954 : {
3955 : Assert(!conditional_stack_empty(st->cstack));
3956 14 : conditional_stack_pop(st->cstack);
3957 14 : if (conditional_active(st->cstack))
3958 8 : st->state = CSTATE_START_COMMAND;
3959 : }
3960 : /* could detect "else" & "elif" after "else" */
3961 30 : st->command++;
3962 30 : break;
3963 :
3964 966 : case IFSTATE_NONE:
3965 : case IFSTATE_TRUE:
3966 : case IFSTATE_ELSE_TRUE:
3967 : default:
3968 :
3969 : /*
3970 : * inconsistent if inactive, unreachable dead
3971 : * code
3972 : */
3973 : Assert(false);
3974 : }
3975 : }
3976 : else
3977 : {
3978 : /* skip and consider next */
3979 4180 : st->command++;
3980 : }
3981 :
3982 5146 : if (st->state != CSTATE_SKIP_COMMAND)
3983 : /* out of quick skip command loop */
3984 940 : break;
3985 : }
3986 940 : break;
3987 :
3988 : /*
3989 : * Wait for the current SQL command to complete
3990 : */
3991 41388 : case CSTATE_WAIT_RESULT:
3992 41388 : pg_log_debug("client %d receiving", st->id);
3993 :
3994 : /*
3995 : * Only check for new network data if we processed all data
3996 : * fetched prior. Otherwise we end up doing a syscall for each
3997 : * individual pipelined query, which has a measurable
3998 : * performance impact.
3999 : */
4000 41388 : if (PQisBusy(st->con) && !PQconsumeInput(st->con))
4001 : {
4002 : /* there's something wrong */
4003 0 : commandFailed(st, "SQL", "perhaps the backend died while processing");
4004 0 : st->state = CSTATE_ABORTED;
4005 0 : break;
4006 : }
4007 41388 : if (PQisBusy(st->con))
4008 19962 : return; /* don't have the whole result yet */
4009 :
4010 : /* store or discard the query results */
4011 21426 : if (readCommandResponse(st,
4012 21426 : sql_script[st->use_file].commands[st->command]->meta,
4013 21426 : sql_script[st->use_file].commands[st->command]->varprefix))
4014 : {
4015 : /*
4016 : * outside of pipeline mode: stop reading results.
4017 : * pipeline mode: continue reading results until an
4018 : * end-of-pipeline response.
4019 : */
4020 21390 : if (PQpipelineStatus(st->con) != PQ_PIPELINE_ON)
4021 20360 : st->state = CSTATE_END_COMMAND;
4022 : }
4023 36 : else if (canRetryError(st->estatus))
4024 4 : st->state = CSTATE_ERROR;
4025 : else
4026 32 : st->state = CSTATE_ABORTED;
4027 21426 : break;
4028 :
4029 : /*
4030 : * Wait until sleep is done. This state is entered after a
4031 : * \sleep metacommand. The behavior is similar to
4032 : * CSTATE_THROTTLE, but proceeds to CSTATE_START_COMMAND
4033 : * instead of CSTATE_START_TX.
4034 : */
4035 16 : case CSTATE_SLEEP:
4036 16 : pg_time_now_lazy(&now);
4037 16 : if (now < st->sleep_until)
4038 6 : return; /* still sleeping, nothing to do here */
4039 : /* Else done sleeping. */
4040 10 : st->state = CSTATE_END_COMMAND;
4041 10 : break;
4042 :
4043 : /*
4044 : * End of command: record stats and proceed to next command.
4045 : */
4046 26040 : case CSTATE_END_COMMAND:
4047 :
4048 : /*
4049 : * command completed: accumulate per-command execution times
4050 : * in thread-local data structure, if per-command latencies
4051 : * are requested.
4052 : */
4053 26040 : if (report_per_command)
4054 : {
4055 802 : pg_time_now_lazy(&now);
4056 :
4057 802 : command = sql_script[st->use_file].commands[st->command];
4058 : /* XXX could use a mutex here, but we choose not to */
4059 802 : addToSimpleStats(&command->stats,
4060 802 : PG_TIME_GET_DOUBLE(now - st->stmt_begin));
4061 : }
4062 :
4063 : /* Go ahead with next command, to be executed or skipped */
4064 26040 : st->command++;
4065 26040 : st->state = conditional_active(st->cstack) ?
4066 26040 : CSTATE_START_COMMAND : CSTATE_SKIP_COMMAND;
4067 26040 : break;
4068 :
4069 : /*
4070 : * Clean up after an error.
4071 : */
4072 4 : case CSTATE_ERROR:
4073 : {
4074 : TStatus tstatus;
4075 :
4076 : Assert(st->estatus != ESTATUS_NO_ERROR);
4077 :
4078 : /* Clear the conditional stack */
4079 4 : conditional_stack_reset(st->cstack);
4080 :
4081 : /* Read and discard until a sync point in pipeline mode */
4082 4 : if (PQpipelineStatus(st->con) != PQ_PIPELINE_OFF)
4083 : {
4084 0 : if (!discardUntilSync(st))
4085 : {
4086 0 : st->state = CSTATE_ABORTED;
4087 0 : break;
4088 : }
4089 : }
4090 :
4091 : /*
4092 : * Check if we have a (failed) transaction block or not,
4093 : * and roll it back if any.
4094 : */
4095 4 : tstatus = getTransactionStatus(st->con);
4096 4 : if (tstatus == TSTATUS_IN_BLOCK)
4097 : {
4098 : /* Try to rollback a (failed) transaction block. */
4099 2 : if (!PQsendQuery(st->con, "ROLLBACK"))
4100 : {
4101 0 : pg_log_error("client %d aborted: failed to send sql command for rolling back the failed transaction",
4102 : st->id);
4103 0 : st->state = CSTATE_ABORTED;
4104 : }
4105 : else
4106 2 : st->state = CSTATE_WAIT_ROLLBACK_RESULT;
4107 : }
4108 2 : else if (tstatus == TSTATUS_IDLE)
4109 : {
4110 : /*
4111 : * If time is over, we're done; otherwise, check if we
4112 : * can retry the error.
4113 : */
4114 4 : st->state = timer_exceeded ? CSTATE_FINISHED :
4115 2 : doRetry(st, &now) ? CSTATE_RETRY : CSTATE_FAILURE;
4116 : }
4117 : else
4118 : {
4119 0 : if (tstatus == TSTATUS_CONN_ERROR)
4120 0 : pg_log_error("perhaps the backend died while processing");
4121 :
4122 0 : pg_log_error("client %d aborted while receiving the transaction status", st->id);
4123 0 : st->state = CSTATE_ABORTED;
4124 : }
4125 4 : break;
4126 : }
4127 :
4128 : /*
4129 : * Wait for the rollback command to complete
4130 : */
4131 4 : case CSTATE_WAIT_ROLLBACK_RESULT:
4132 : {
4133 : PGresult *res;
4134 :
4135 4 : pg_log_debug("client %d receiving", st->id);
4136 4 : if (!PQconsumeInput(st->con))
4137 : {
4138 0 : pg_log_error("client %d aborted while rolling back the transaction after an error; perhaps the backend died while processing",
4139 : st->id);
4140 0 : st->state = CSTATE_ABORTED;
4141 0 : break;
4142 : }
4143 4 : if (PQisBusy(st->con))
4144 2 : return; /* don't have the whole result yet */
4145 :
4146 : /*
4147 : * Read and discard the query result;
4148 : */
4149 2 : res = PQgetResult(st->con);
4150 2 : switch (PQresultStatus(res))
4151 : {
4152 2 : case PGRES_COMMAND_OK:
4153 : /* OK */
4154 2 : PQclear(res);
4155 : /* null must be returned */
4156 2 : res = PQgetResult(st->con);
4157 : Assert(res == NULL);
4158 :
4159 : /*
4160 : * If time is over, we're done; otherwise, check
4161 : * if we can retry the error.
4162 : */
4163 4 : st->state = timer_exceeded ? CSTATE_FINISHED :
4164 2 : doRetry(st, &now) ? CSTATE_RETRY : CSTATE_FAILURE;
4165 2 : break;
4166 0 : default:
4167 0 : pg_log_error("client %d aborted while rolling back the transaction after an error; %s",
4168 : st->id, PQerrorMessage(st->con));
4169 0 : PQclear(res);
4170 0 : st->state = CSTATE_ABORTED;
4171 0 : break;
4172 : }
4173 2 : break;
4174 : }
4175 :
4176 : /*
4177 : * Retry the transaction after an error.
4178 : */
4179 4 : case CSTATE_RETRY:
4180 4 : command = sql_script[st->use_file].commands[st->command];
4181 :
4182 : /*
4183 : * Inform that the transaction will be retried after the
4184 : * error.
4185 : */
4186 4 : if (verbose_errors)
4187 4 : printVerboseErrorMessages(st, &now, true);
4188 :
4189 : /* Count tries and retries */
4190 4 : st->tries++;
4191 4 : command->retries++;
4192 :
4193 : /*
4194 : * Reset the random state as they were at the beginning of the
4195 : * transaction.
4196 : */
4197 4 : st->cs_func_rs = st->random_state;
4198 :
4199 : /* Process the first transaction command. */
4200 4 : st->command = 0;
4201 4 : st->estatus = ESTATUS_NO_ERROR;
4202 4 : st->state = CSTATE_START_COMMAND;
4203 4 : break;
4204 :
4205 : /*
4206 : * Record a failed transaction.
4207 : */
4208 0 : case CSTATE_FAILURE:
4209 0 : command = sql_script[st->use_file].commands[st->command];
4210 :
4211 : /* Accumulate the failure. */
4212 0 : command->failures++;
4213 :
4214 : /*
4215 : * Inform that the failed transaction will not be retried.
4216 : */
4217 0 : if (verbose_errors)
4218 0 : printVerboseErrorMessages(st, &now, false);
4219 :
4220 : /* End the failed transaction. */
4221 0 : st->state = CSTATE_END_TX;
4222 0 : break;
4223 :
4224 : /*
4225 : * End of transaction (end of script, really).
4226 : */
4227 15382 : case CSTATE_END_TX:
4228 : {
4229 : TStatus tstatus;
4230 :
4231 : /* transaction finished: calculate latency and do log */
4232 15382 : processXactStats(thread, st, &now, false, agg);
4233 :
4234 : /*
4235 : * missing \endif... cannot happen if CheckConditional was
4236 : * okay
4237 : */
4238 : Assert(conditional_stack_empty(st->cstack));
4239 :
4240 : /*
4241 : * We must complete all the transaction blocks that were
4242 : * started in this script.
4243 : */
4244 15382 : tstatus = getTransactionStatus(st->con);
4245 15382 : if (tstatus == TSTATUS_IN_BLOCK)
4246 : {
4247 2 : pg_log_error("client %d aborted: end of script reached without completing the last transaction",
4248 : st->id);
4249 2 : st->state = CSTATE_ABORTED;
4250 2 : break;
4251 : }
4252 15380 : else if (tstatus != TSTATUS_IDLE)
4253 : {
4254 0 : if (tstatus == TSTATUS_CONN_ERROR)
4255 0 : pg_log_error("perhaps the backend died while processing");
4256 :
4257 0 : pg_log_error("client %d aborted while receiving the transaction status", st->id);
4258 0 : st->state = CSTATE_ABORTED;
4259 0 : break;
4260 : }
4261 :
4262 15380 : if (is_connect)
4263 : {
4264 220 : pg_time_usec_t start = now;
4265 :
4266 220 : pg_time_now_lazy(&start);
4267 220 : finishCon(st);
4268 220 : now = pg_time_now();
4269 220 : thread->conn_duration += now - start;
4270 : }
4271 :
4272 15380 : if ((st->cnt >= nxacts && duration <= 0) || timer_exceeded)
4273 : {
4274 : /* script completed */
4275 144 : st->state = CSTATE_FINISHED;
4276 144 : break;
4277 : }
4278 :
4279 : /* next transaction (script) */
4280 15236 : st->state = CSTATE_CHOOSE_SCRIPT;
4281 :
4282 : /*
4283 : * Ensure that we always return on this point, so as to
4284 : * avoid an infinite loop if the script only contains meta
4285 : * commands.
4286 : */
4287 15236 : return;
4288 : }
4289 :
4290 : /*
4291 : * Final states. Close the connection if it's still open.
4292 : */
4293 250 : case CSTATE_ABORTED:
4294 : case CSTATE_FINISHED:
4295 :
4296 : /*
4297 : * Don't measure the disconnection delays here even if in
4298 : * CSTATE_FINISHED and -C/--connect option is specified.
4299 : * Because in this case all the connections that this thread
4300 : * established are closed at the end of transactions and the
4301 : * disconnection delays should have already been measured at
4302 : * that moment.
4303 : *
4304 : * In CSTATE_ABORTED state, the measurement is no longer
4305 : * necessary because we cannot report complete results anyways
4306 : * in this case.
4307 : */
4308 250 : finishCon(st);
4309 250 : return;
4310 : }
4311 : }
4312 : }
4313 :
4314 : /*
4315 : * Subroutine for advanceConnectionState -- initiate or execute the current
4316 : * meta command, and return the next state to set.
4317 : *
4318 : * *now is updated to the current time, unless the command is expected to
4319 : * take no time to execute.
4320 : */
4321 : static ConnectionStateEnum
4322 4804 : executeMetaCommand(CState *st, pg_time_usec_t *now)
4323 : {
4324 4804 : Command *command = sql_script[st->use_file].commands[st->command];
4325 : int argc;
4326 : char **argv;
4327 :
4328 : Assert(command != NULL && command->type == META_COMMAND);
4329 :
4330 4804 : argc = command->argc;
4331 4804 : argv = command->argv;
4332 :
4333 4804 : if (unlikely(__pg_log_level <= PG_LOG_DEBUG))
4334 : {
4335 : PQExpBufferData buf;
4336 :
4337 1406 : initPQExpBuffer(&buf);
4338 :
4339 1406 : printfPQExpBuffer(&buf, "client %d executing \\%s", st->id, argv[0]);
4340 2812 : for (int i = 1; i < argc; i++)
4341 1406 : appendPQExpBuffer(&buf, " %s", argv[i]);
4342 :
4343 1406 : pg_log_debug("%s", buf.data);
4344 :
4345 1406 : termPQExpBuffer(&buf);
4346 : }
4347 :
4348 4804 : if (command->meta == META_SLEEP)
4349 : {
4350 : int usec;
4351 :
4352 : /*
4353 : * A \sleep doesn't execute anything, we just get the delay from the
4354 : * argument, and enter the CSTATE_SLEEP state. (The per-command
4355 : * latency will be recorded in CSTATE_SLEEP state, not here, after the
4356 : * delay has elapsed.)
4357 : */
4358 12 : if (!evaluateSleep(&st->variables, argc, argv, &usec))
4359 : {
4360 2 : commandFailed(st, "sleep", "execution of meta-command failed");
4361 2 : return CSTATE_ABORTED;
4362 : }
4363 :
4364 10 : pg_time_now_lazy(now);
4365 10 : st->sleep_until = (*now) + usec;
4366 10 : return CSTATE_SLEEP;
4367 : }
4368 4792 : else if (command->meta == META_SET)
4369 : {
4370 3424 : PgBenchExpr *expr = command->expr;
4371 : PgBenchValue result;
4372 :
4373 3424 : if (!evaluateExpr(st, expr, &result))
4374 : {
4375 46 : commandFailed(st, argv[0], "evaluation of meta-command failed");
4376 48 : return CSTATE_ABORTED;
4377 : }
4378 :
4379 3378 : if (!putVariableValue(&st->variables, argv[0], argv[1], &result))
4380 : {
4381 2 : commandFailed(st, "set", "assignment of meta-command failed");
4382 2 : return CSTATE_ABORTED;
4383 : }
4384 : }
4385 1368 : else if (command->meta == META_IF)
4386 : {
4387 : /* backslash commands with an expression to evaluate */
4388 1012 : PgBenchExpr *expr = command->expr;
4389 : PgBenchValue result;
4390 : bool cond;
4391 :
4392 1012 : if (!evaluateExpr(st, expr, &result))
4393 : {
4394 0 : commandFailed(st, argv[0], "evaluation of meta-command failed");
4395 0 : return CSTATE_ABORTED;
4396 : }
4397 :
4398 1012 : cond = valueTruth(&result);
4399 1012 : conditional_stack_push(st->cstack, cond ? IFSTATE_TRUE : IFSTATE_FALSE);
4400 : }
4401 356 : else if (command->meta == META_ELIF)
4402 : {
4403 : /* backslash commands with an expression to evaluate */
4404 14 : PgBenchExpr *expr = command->expr;
4405 : PgBenchValue result;
4406 : bool cond;
4407 :
4408 14 : if (conditional_stack_peek(st->cstack) == IFSTATE_TRUE)
4409 : {
4410 : /* elif after executed block, skip eval and wait for endif. */
4411 4 : conditional_stack_poke(st->cstack, IFSTATE_IGNORED);
4412 4 : return CSTATE_END_COMMAND;
4413 : }
4414 :
4415 10 : if (!evaluateExpr(st, expr, &result))
4416 : {
4417 0 : commandFailed(st, argv[0], "evaluation of meta-command failed");
4418 0 : return CSTATE_ABORTED;
4419 : }
4420 :
4421 10 : cond = valueTruth(&result);
4422 : Assert(conditional_stack_peek(st->cstack) == IFSTATE_FALSE);
4423 10 : conditional_stack_poke(st->cstack, cond ? IFSTATE_TRUE : IFSTATE_FALSE);
4424 : }
4425 342 : else if (command->meta == META_ELSE)
4426 : {
4427 4 : switch (conditional_stack_peek(st->cstack))
4428 : {
4429 4 : case IFSTATE_TRUE:
4430 4 : conditional_stack_poke(st->cstack, IFSTATE_ELSE_FALSE);
4431 4 : break;
4432 4 : case IFSTATE_FALSE: /* inconsistent if active */
4433 : case IFSTATE_IGNORED: /* inconsistent if active */
4434 : case IFSTATE_NONE: /* else without if */
4435 : case IFSTATE_ELSE_TRUE: /* else after else */
4436 : case IFSTATE_ELSE_FALSE: /* else after else */
4437 : default:
4438 : /* dead code if conditional check is ok */
4439 : Assert(false);
4440 : }
4441 : }
4442 338 : else if (command->meta == META_ENDIF)
4443 : {
4444 : Assert(!conditional_stack_empty(st->cstack));
4445 86 : conditional_stack_pop(st->cstack);
4446 : }
4447 252 : else if (command->meta == META_SETSHELL)
4448 : {
4449 6 : if (!runShellCommand(&st->variables, argv[1], argv + 2, argc - 2))
4450 : {
4451 4 : commandFailed(st, "setshell", "execution of meta-command failed");
4452 4 : return CSTATE_ABORTED;
4453 : }
4454 : }
4455 246 : else if (command->meta == META_SHELL)
4456 : {
4457 6 : if (!runShellCommand(&st->variables, NULL, argv + 1, argc - 1))
4458 : {
4459 4 : commandFailed(st, "shell", "execution of meta-command failed");
4460 4 : return CSTATE_ABORTED;
4461 : }
4462 : }
4463 240 : else if (command->meta == META_STARTPIPELINE)
4464 : {
4465 : /*
4466 : * In pipeline mode, we use a workflow based on libpq pipeline
4467 : * functions.
4468 : */
4469 120 : if (querymode == QUERY_SIMPLE)
4470 : {
4471 0 : commandFailed(st, "startpipeline", "cannot use pipeline mode with the simple query protocol");
4472 0 : return CSTATE_ABORTED;
4473 : }
4474 :
4475 : /*
4476 : * If we're in prepared-query mode, we need to prepare all the
4477 : * commands that are inside the pipeline before we actually start the
4478 : * pipeline itself. This solves the problem that running BEGIN
4479 : * ISOLATION LEVEL SERIALIZABLE in a pipeline would fail due to a
4480 : * snapshot having been acquired by the prepare within the pipeline.
4481 : */
4482 120 : if (querymode == QUERY_PREPARED)
4483 84 : prepareCommandsInPipeline(st);
4484 :
4485 120 : if (PQpipelineStatus(st->con) != PQ_PIPELINE_OFF)
4486 : {
4487 2 : commandFailed(st, "startpipeline", "already in pipeline mode");
4488 2 : return CSTATE_ABORTED;
4489 : }
4490 118 : if (PQenterPipelineMode(st->con) == 0)
4491 : {
4492 0 : commandFailed(st, "startpipeline", "failed to enter pipeline mode");
4493 0 : return CSTATE_ABORTED;
4494 : }
4495 : }
4496 120 : else if (command->meta == META_SYNCPIPELINE)
4497 : {
4498 10 : if (PQpipelineStatus(st->con) != PQ_PIPELINE_ON)
4499 : {
4500 0 : commandFailed(st, "syncpipeline", "not in pipeline mode");
4501 0 : return CSTATE_ABORTED;
4502 : }
4503 10 : if (PQsendPipelineSync(st->con) == 0)
4504 : {
4505 0 : commandFailed(st, "syncpipeline", "failed to send a pipeline sync");
4506 0 : return CSTATE_ABORTED;
4507 : }
4508 10 : st->num_syncs++;
4509 : }
4510 110 : else if (command->meta == META_ENDPIPELINE)
4511 : {
4512 110 : if (PQpipelineStatus(st->con) != PQ_PIPELINE_ON)
4513 : {
4514 2 : commandFailed(st, "endpipeline", "not in pipeline mode");
4515 2 : return CSTATE_ABORTED;
4516 : }
4517 108 : if (!PQpipelineSync(st->con))
4518 : {
4519 0 : commandFailed(st, "endpipeline", "failed to send a pipeline sync");
4520 0 : return CSTATE_ABORTED;
4521 : }
4522 108 : st->num_syncs++;
4523 : /* Now wait for the PGRES_PIPELINE_SYNC and exit pipeline mode there */
4524 : /* collect pending results before getting out of pipeline mode */
4525 108 : return CSTATE_WAIT_RESULT;
4526 : }
4527 :
4528 : /*
4529 : * executing the expression or shell command might have taken a
4530 : * non-negligible amount of time, so reset 'now'
4531 : */
4532 4620 : *now = 0;
4533 :
4534 4620 : return CSTATE_END_COMMAND;
4535 : }
4536 :
4537 : /*
4538 : * Return the number of failed transactions.
4539 : */
4540 : static int64
4541 196 : getFailures(const StatsData *stats)
4542 : {
4543 392 : return (stats->serialization_failures +
4544 196 : stats->deadlock_failures);
4545 : }
4546 :
4547 : /*
4548 : * Return a string constant representing the result of a transaction
4549 : * that is not successfully processed.
4550 : */
4551 : static const char *
4552 0 : getResultString(bool skipped, EStatus estatus)
4553 : {
4554 0 : if (skipped)
4555 0 : return "skipped";
4556 0 : else if (failures_detailed)
4557 : {
4558 0 : switch (estatus)
4559 : {
4560 0 : case ESTATUS_SERIALIZATION_ERROR:
4561 0 : return "serialization";
4562 0 : case ESTATUS_DEADLOCK_ERROR:
4563 0 : return "deadlock";
4564 0 : default:
4565 : /* internal error which should never occur */
4566 0 : pg_fatal("unexpected error status: %d", estatus);
4567 : }
4568 : }
4569 : else
4570 0 : return "failed";
4571 : }
4572 :
4573 : /*
4574 : * Print log entry after completing one transaction.
4575 : *
4576 : * We print Unix-epoch timestamps in the log, so that entries can be
4577 : * correlated against other logs.
4578 : *
4579 : * XXX We could obtain the time from the caller and just shift it here, to
4580 : * avoid the cost of an extra call to pg_time_now().
4581 : */
4582 : static void
4583 220 : doLog(TState *thread, CState *st,
4584 : StatsData *agg, bool skipped, double latency, double lag)
4585 : {
4586 220 : FILE *logfile = thread->logfile;
4587 220 : pg_time_usec_t now = pg_time_now() + epoch_shift;
4588 :
4589 : Assert(use_log);
4590 :
4591 : /*
4592 : * Skip the log entry if sampling is enabled and this row doesn't belong
4593 : * to the random sample.
4594 : */
4595 220 : if (sample_rate != 0.0 &&
4596 200 : pg_prng_double(&thread->ts_sample_rs) > sample_rate)
4597 110 : return;
4598 :
4599 : /* should we aggregate the results or not? */
4600 110 : if (agg_interval > 0)
4601 : {
4602 : pg_time_usec_t next;
4603 :
4604 : /*
4605 : * Loop until we reach the interval of the current moment, and print
4606 : * any empty intervals in between (this may happen with very low tps,
4607 : * e.g. --rate=0.1).
4608 : */
4609 :
4610 0 : while ((next = agg->start_time + agg_interval * INT64CONST(1000000)) <= now)
4611 : {
4612 0 : double lag_sum = 0.0;
4613 0 : double lag_sum2 = 0.0;
4614 0 : double lag_min = 0.0;
4615 0 : double lag_max = 0.0;
4616 0 : int64 skipped = 0;
4617 0 : int64 serialization_failures = 0;
4618 0 : int64 deadlock_failures = 0;
4619 0 : int64 retried = 0;
4620 0 : int64 retries = 0;
4621 :
4622 : /* print aggregated report to logfile */
4623 0 : fprintf(logfile, INT64_FORMAT " " INT64_FORMAT " %.0f %.0f %.0f %.0f",
4624 0 : agg->start_time / 1000000, /* seconds since Unix epoch */
4625 : agg->cnt,
4626 : agg->latency.sum,
4627 : agg->latency.sum2,
4628 : agg->latency.min,
4629 : agg->latency.max);
4630 :
4631 0 : if (throttle_delay)
4632 : {
4633 0 : lag_sum = agg->lag.sum;
4634 0 : lag_sum2 = agg->lag.sum2;
4635 0 : lag_min = agg->lag.min;
4636 0 : lag_max = agg->lag.max;
4637 : }
4638 0 : fprintf(logfile, " %.0f %.0f %.0f %.0f",
4639 : lag_sum,
4640 : lag_sum2,
4641 : lag_min,
4642 : lag_max);
4643 :
4644 0 : if (latency_limit)
4645 0 : skipped = agg->skipped;
4646 0 : fprintf(logfile, " " INT64_FORMAT, skipped);
4647 :
4648 0 : if (max_tries != 1)
4649 : {
4650 0 : retried = agg->retried;
4651 0 : retries = agg->retries;
4652 : }
4653 0 : fprintf(logfile, " " INT64_FORMAT " " INT64_FORMAT, retried, retries);
4654 :
4655 0 : if (failures_detailed)
4656 : {
4657 0 : serialization_failures = agg->serialization_failures;
4658 0 : deadlock_failures = agg->deadlock_failures;
4659 : }
4660 0 : fprintf(logfile, " " INT64_FORMAT " " INT64_FORMAT,
4661 : serialization_failures,
4662 : deadlock_failures);
4663 :
4664 0 : fputc('\n', logfile);
4665 :
4666 : /* reset data and move to next interval */
4667 0 : initStats(agg, next);
4668 : }
4669 :
4670 : /* accumulate the current transaction */
4671 0 : accumStats(agg, skipped, latency, lag, st->estatus, st->tries);
4672 : }
4673 : else
4674 : {
4675 : /* no, print raw transactions */
4676 110 : if (!skipped && st->estatus == ESTATUS_NO_ERROR)
4677 110 : fprintf(logfile, "%d " INT64_FORMAT " %.0f %d " INT64_FORMAT " "
4678 : INT64_FORMAT,
4679 : st->id, st->cnt, latency, st->use_file,
4680 : now / 1000000, now % 1000000);
4681 : else
4682 0 : fprintf(logfile, "%d " INT64_FORMAT " %s %d " INT64_FORMAT " "
4683 : INT64_FORMAT,
4684 : st->id, st->cnt, getResultString(skipped, st->estatus),
4685 : st->use_file, now / 1000000, now % 1000000);
4686 :
4687 110 : if (throttle_delay)
4688 0 : fprintf(logfile, " %.0f", lag);
4689 110 : if (max_tries != 1)
4690 0 : fprintf(logfile, " %u", st->tries - 1);
4691 110 : fputc('\n', logfile);
4692 : }
4693 : }
4694 :
4695 : /*
4696 : * Accumulate and report statistics at end of a transaction.
4697 : *
4698 : * (This is also called when a transaction is late and thus skipped.
4699 : * Note that even skipped and failed transactions are counted in the CState
4700 : * "cnt" field.)
4701 : */
4702 : static void
4703 15400 : processXactStats(TState *thread, CState *st, pg_time_usec_t *now,
4704 : bool skipped, StatsData *agg)
4705 : {
4706 15400 : double latency = 0.0,
4707 15400 : lag = 0.0;
4708 15400 : bool detailed = progress || throttle_delay || latency_limit ||
4709 30800 : use_log || per_script_stats;
4710 :
4711 15400 : if (detailed && !skipped && st->estatus == ESTATUS_NO_ERROR)
4712 : {
4713 3322 : pg_time_now_lazy(now);
4714 :
4715 : /* compute latency & lag */
4716 3322 : latency = (*now) - st->txn_scheduled;
4717 3322 : lag = st->txn_begin - st->txn_scheduled;
4718 : }
4719 :
4720 : /* keep detailed thread stats */
4721 15400 : accumStats(&thread->stats, skipped, latency, lag, st->estatus, st->tries);
4722 :
4723 : /* count transactions over the latency limit, if needed */
4724 15400 : if (latency_limit && latency > latency_limit)
4725 2 : thread->latency_late++;
4726 :
4727 : /* client stat is just counting */
4728 15400 : st->cnt++;
4729 :
4730 15400 : if (use_log)
4731 220 : doLog(thread, st, agg, skipped, latency, lag);
4732 :
4733 : /* XXX could use a mutex here, but we choose not to */
4734 15400 : if (per_script_stats)
4735 2700 : accumStats(&sql_script[st->use_file].stats, skipped, latency, lag,
4736 2700 : st->estatus, st->tries);
4737 15400 : }
4738 :
4739 :
4740 : /* discard connections */
4741 : static void
4742 340 : disconnect_all(CState *state, int length)
4743 : {
4744 : int i;
4745 :
4746 836 : for (i = 0; i < length; i++)
4747 496 : finishCon(&state[i]);
4748 340 : }
4749 :
4750 : /*
4751 : * Remove old pgbench tables, if any exist
4752 : */
4753 : static void
4754 6 : initDropTables(PGconn *con)
4755 : {
4756 6 : fprintf(stderr, "dropping old tables...\n");
4757 :
4758 : /*
4759 : * We drop all the tables in one command, so that whether there are
4760 : * foreign key dependencies or not doesn't matter.
4761 : */
4762 6 : executeStatement(con, "drop table if exists "
4763 : "pgbench_accounts, "
4764 : "pgbench_branches, "
4765 : "pgbench_history, "
4766 : "pgbench_tellers");
4767 6 : }
4768 :
4769 : /*
4770 : * Create "pgbench_accounts" partitions if needed.
4771 : *
4772 : * This is the larger table of pgbench default tpc-b like schema
4773 : * with a known size, so we choose to partition it.
4774 : */
4775 : static void
4776 4 : createPartitions(PGconn *con)
4777 : {
4778 : PQExpBufferData query;
4779 :
4780 : /* we must have to create some partitions */
4781 : Assert(partitions > 0);
4782 :
4783 4 : fprintf(stderr, "creating %d partitions...\n", partitions);
4784 :
4785 4 : initPQExpBuffer(&query);
4786 :
4787 14 : for (int p = 1; p <= partitions; p++)
4788 : {
4789 10 : if (partition_method == PART_RANGE)
4790 : {
4791 6 : int64 part_size = (naccounts * (int64) scale + partitions - 1) / partitions;
4792 :
4793 6 : printfPQExpBuffer(&query,
4794 : "create%s table pgbench_accounts_%d\n"
4795 : " partition of pgbench_accounts\n"
4796 : " for values from (",
4797 6 : unlogged_tables ? " unlogged" : "", p);
4798 :
4799 : /*
4800 : * For RANGE, we use open-ended partitions at the beginning and
4801 : * end to allow any valid value for the primary key. Although the
4802 : * actual minimum and maximum values can be derived from the
4803 : * scale, it is more generic and the performance is better.
4804 : */
4805 6 : if (p == 1)
4806 2 : appendPQExpBufferStr(&query, "minvalue");
4807 : else
4808 4 : appendPQExpBuffer(&query, INT64_FORMAT, (p - 1) * part_size + 1);
4809 :
4810 6 : appendPQExpBufferStr(&query, ") to (");
4811 :
4812 6 : if (p < partitions)
4813 4 : appendPQExpBuffer(&query, INT64_FORMAT, p * part_size + 1);
4814 : else
4815 2 : appendPQExpBufferStr(&query, "maxvalue");
4816 :
4817 6 : appendPQExpBufferChar(&query, ')');
4818 : }
4819 4 : else if (partition_method == PART_HASH)
4820 4 : printfPQExpBuffer(&query,
4821 : "create%s table pgbench_accounts_%d\n"
4822 : " partition of pgbench_accounts\n"
4823 : " for values with (modulus %d, remainder %d)",
4824 4 : unlogged_tables ? " unlogged" : "", p,
4825 : partitions, p - 1);
4826 : else /* cannot get there */
4827 : Assert(0);
4828 :
4829 : /*
4830 : * Per ddlinfo in initCreateTables, fillfactor is needed on table
4831 : * pgbench_accounts.
4832 : */
4833 10 : appendPQExpBuffer(&query, " with (fillfactor=%d)", fillfactor);
4834 :
4835 10 : executeStatement(con, query.data);
4836 : }
4837 :
4838 4 : termPQExpBuffer(&query);
4839 4 : }
4840 :
4841 : /*
4842 : * Create pgbench's standard tables
4843 : */
4844 : static void
4845 6 : initCreateTables(PGconn *con)
4846 : {
4847 : /*
4848 : * Note: TPC-B requires at least 100 bytes per row, and the "filler"
4849 : * fields in these table declarations were intended to comply with that.
4850 : * The pgbench_accounts table complies with that because the "filler"
4851 : * column is set to blank-padded empty string. But for all other tables
4852 : * the columns default to NULL and so don't actually take any space. We
4853 : * could fix that by giving them non-null default values. However, that
4854 : * would completely break comparability of pgbench results with prior
4855 : * versions. Since pgbench has never pretended to be fully TPC-B compliant
4856 : * anyway, we stick with the historical behavior.
4857 : */
4858 : struct ddlinfo
4859 : {
4860 : const char *table; /* table name */
4861 : const char *smcols; /* column decls if accountIDs are 32 bits */
4862 : const char *bigcols; /* column decls if accountIDs are 64 bits */
4863 : int declare_fillfactor;
4864 : };
4865 : static const struct ddlinfo DDLs[] = {
4866 : {
4867 : "pgbench_history",
4868 : "tid int,bid int,aid int,delta int,mtime timestamp,filler char(22)",
4869 : "tid int,bid int,aid bigint,delta int,mtime timestamp,filler char(22)",
4870 : 0
4871 : },
4872 : {
4873 : "pgbench_tellers",
4874 : "tid int not null,bid int,tbalance int,filler char(84)",
4875 : "tid int not null,bid int,tbalance int,filler char(84)",
4876 : 1
4877 : },
4878 : {
4879 : "pgbench_accounts",
4880 : "aid int not null,bid int,abalance int,filler char(84)",
4881 : "aid bigint not null,bid int,abalance int,filler char(84)",
4882 : 1
4883 : },
4884 : {
4885 : "pgbench_branches",
4886 : "bid int not null,bbalance int,filler char(88)",
4887 : "bid int not null,bbalance int,filler char(88)",
4888 : 1
4889 : }
4890 : };
4891 : int i;
4892 : PQExpBufferData query;
4893 :
4894 6 : fprintf(stderr, "creating tables...\n");
4895 :
4896 6 : initPQExpBuffer(&query);
4897 :
4898 30 : for (i = 0; i < lengthof(DDLs); i++)
4899 : {
4900 24 : const struct ddlinfo *ddl = &DDLs[i];
4901 :
4902 : /* Construct new create table statement. */
4903 48 : printfPQExpBuffer(&query, "create%s table %s(%s)",
4904 16 : (unlogged_tables && partition_method == PART_NONE) ? " unlogged" : "",
4905 24 : ddl->table,
4906 24 : (scale >= SCALE_32BIT_THRESHOLD) ? ddl->bigcols : ddl->smcols);
4907 :
4908 : /* Partition pgbench_accounts table */
4909 24 : if (partition_method != PART_NONE && strcmp(ddl->table, "pgbench_accounts") == 0)
4910 4 : appendPQExpBuffer(&query,
4911 4 : " partition by %s (aid)", PARTITION_METHOD[partition_method]);
4912 20 : else if (ddl->declare_fillfactor)
4913 : {
4914 : /* fillfactor is only expected on actual tables */
4915 14 : appendPQExpBuffer(&query, " with (fillfactor=%d)", fillfactor);
4916 : }
4917 :
4918 24 : if (tablespace != NULL)
4919 : {
4920 : char *escape_tablespace;
4921 :
4922 8 : escape_tablespace = PQescapeIdentifier(con, tablespace, strlen(tablespace));
4923 8 : appendPQExpBuffer(&query, " tablespace %s", escape_tablespace);
4924 8 : PQfreemem(escape_tablespace);
4925 : }
4926 :
4927 24 : executeStatement(con, query.data);
4928 : }
4929 :
4930 6 : termPQExpBuffer(&query);
4931 :
4932 6 : if (partition_method != PART_NONE)
4933 4 : createPartitions(con);
4934 6 : }
4935 :
4936 : /*
4937 : * Truncate away any old data, in one command in case there are foreign keys
4938 : */
4939 : static void
4940 6 : initTruncateTables(PGconn *con)
4941 : {
4942 6 : executeStatement(con, "truncate table "
4943 : "pgbench_accounts, "
4944 : "pgbench_branches, "
4945 : "pgbench_history, "
4946 : "pgbench_tellers");
4947 6 : }
4948 :
4949 : static void
4950 4 : initBranch(PQExpBufferData *sql, int64 curr)
4951 : {
4952 : /* "filler" column uses NULL */
4953 4 : printfPQExpBuffer(sql,
4954 : INT64_FORMAT "\t0\t\\N\n",
4955 : curr + 1);
4956 4 : }
4957 :
4958 : static void
4959 40 : initTeller(PQExpBufferData *sql, int64 curr)
4960 : {
4961 : /* "filler" column uses NULL */
4962 40 : printfPQExpBuffer(sql,
4963 : INT64_FORMAT "\t" INT64_FORMAT "\t0\t\\N\n",
4964 40 : curr + 1, curr / ntellers + 1);
4965 40 : }
4966 :
4967 : static void
4968 400000 : initAccount(PQExpBufferData *sql, int64 curr)
4969 : {
4970 : /* "filler" column defaults to blank padded empty string */
4971 400000 : printfPQExpBuffer(sql,
4972 : INT64_FORMAT "\t" INT64_FORMAT "\t0\t\n",
4973 400000 : curr + 1, curr / naccounts + 1);
4974 400000 : }
4975 :
4976 : static void
4977 12 : initPopulateTable(PGconn *con, const char *table, int64 base,
4978 : initRowMethod init_row)
4979 : {
4980 : int n;
4981 : int64 k;
4982 12 : int chars = 0;
4983 12 : int prev_chars = 0;
4984 : PGresult *res;
4985 : PQExpBufferData sql;
4986 : char copy_statement[256];
4987 12 : const char *copy_statement_fmt = "copy %s from stdin";
4988 12 : int64 total = base * scale;
4989 :
4990 : /* used to track elapsed time and estimate of the remaining time */
4991 : pg_time_usec_t start;
4992 12 : int log_interval = 1;
4993 :
4994 : /* Stay on the same line if reporting to a terminal */
4995 12 : char eol = isatty(fileno(stderr)) ? '\r' : '\n';
4996 :
4997 12 : initPQExpBuffer(&sql);
4998 :
4999 : /* Use COPY with FREEZE on v14 and later for all ordinary tables */
5000 24 : if ((PQserverVersion(con) >= 140000) &&
5001 12 : get_table_relkind(con, table) == RELKIND_RELATION)
5002 10 : copy_statement_fmt = "copy %s from stdin with (freeze on)";
5003 :
5004 :
5005 12 : n = pg_snprintf(copy_statement, sizeof(copy_statement), copy_statement_fmt, table);
5006 12 : if (n >= sizeof(copy_statement))
5007 0 : pg_fatal("invalid buffer size: must be at least %d characters long", n);
5008 12 : else if (n == -1)
5009 0 : pg_fatal("invalid format string");
5010 :
5011 12 : res = PQexec(con, copy_statement);
5012 :
5013 12 : if (PQresultStatus(res) != PGRES_COPY_IN)
5014 0 : pg_fatal("unexpected copy in result: %s", PQerrorMessage(con));
5015 12 : PQclear(res);
5016 :
5017 12 : start = pg_time_now();
5018 :
5019 400056 : for (k = 0; k < total; k++)
5020 : {
5021 400044 : int64 j = k + 1;
5022 :
5023 400044 : init_row(&sql, k);
5024 400044 : if (PQputline(con, sql.data))
5025 0 : pg_fatal("PQputline failed");
5026 :
5027 400044 : if (CancelRequested)
5028 0 : break;
5029 :
5030 : /*
5031 : * If we want to stick with the original logging, print a message each
5032 : * 100k inserted rows.
5033 : */
5034 400044 : if ((!use_quiet) && (j % 100000 == 0))
5035 2 : {
5036 2 : double elapsed_sec = PG_TIME_GET_DOUBLE(pg_time_now() - start);
5037 2 : double remaining_sec = ((double) total - j) * elapsed_sec / j;
5038 :
5039 2 : chars = fprintf(stderr, INT64_FORMAT " of " INT64_FORMAT " tuples (%d%%) of %s done (elapsed %.2f s, remaining %.2f s)",
5040 : j, total,
5041 2 : (int) ((j * 100) / total),
5042 : table, elapsed_sec, remaining_sec);
5043 :
5044 : /*
5045 : * If the previous progress message is longer than the current
5046 : * one, add spaces to the current line to fully overwrite any
5047 : * remaining characters from the previous message.
5048 : */
5049 2 : if (prev_chars > chars)
5050 0 : fprintf(stderr, "%*c", prev_chars - chars, ' ');
5051 2 : fputc(eol, stderr);
5052 2 : prev_chars = chars;
5053 : }
5054 : /* let's not call the timing for each row, but only each 100 rows */
5055 400042 : else if (use_quiet && (j % 100 == 0))
5056 : {
5057 2000 : double elapsed_sec = PG_TIME_GET_DOUBLE(pg_time_now() - start);
5058 2000 : double remaining_sec = ((double) total - j) * elapsed_sec / j;
5059 :
5060 : /* have we reached the next interval (or end)? */
5061 2000 : if ((j == total) || (elapsed_sec >= log_interval * LOG_STEP_SECONDS))
5062 : {
5063 2 : chars = fprintf(stderr, INT64_FORMAT " of " INT64_FORMAT " tuples (%d%%) of %s done (elapsed %.2f s, remaining %.2f s)",
5064 : j, total,
5065 2 : (int) ((j * 100) / total),
5066 : table, elapsed_sec, remaining_sec);
5067 :
5068 : /*
5069 : * If the previous progress message is longer than the current
5070 : * one, add spaces to the current line to fully overwrite any
5071 : * remaining characters from the previous message.
5072 : */
5073 2 : if (prev_chars > chars)
5074 0 : fprintf(stderr, "%*c", prev_chars - chars, ' ');
5075 2 : fputc(eol, stderr);
5076 2 : prev_chars = chars;
5077 :
5078 : /* skip to the next interval */
5079 2 : log_interval = (int) ceil(elapsed_sec / LOG_STEP_SECONDS);
5080 : }
5081 : }
5082 : }
5083 :
5084 12 : if (chars != 0 && eol != '\n')
5085 0 : fprintf(stderr, "%*c\r", chars, ' '); /* Clear the current line */
5086 :
5087 12 : if (PQputline(con, "\\.\n"))
5088 0 : pg_fatal("very last PQputline failed");
5089 12 : if (PQendcopy(con))
5090 0 : pg_fatal("PQendcopy failed");
5091 :
5092 12 : termPQExpBuffer(&sql);
5093 12 : }
5094 :
5095 : /*
5096 : * Fill the standard tables with some data generated and sent from the client.
5097 : *
5098 : * The filler column is NULL in pgbench_branches and pgbench_tellers, and is
5099 : * a blank-padded string in pgbench_accounts.
5100 : */
5101 : static void
5102 4 : initGenerateDataClientSide(PGconn *con)
5103 : {
5104 4 : fprintf(stderr, "generating data (client-side)...\n");
5105 :
5106 : /*
5107 : * we do all of this in one transaction to enable the backend's
5108 : * data-loading optimizations
5109 : */
5110 4 : executeStatement(con, "begin");
5111 :
5112 : /* truncate away any old data */
5113 4 : initTruncateTables(con);
5114 :
5115 : /*
5116 : * fill branches, tellers, accounts in that order in case foreign keys
5117 : * already exist
5118 : */
5119 4 : initPopulateTable(con, "pgbench_branches", nbranches, initBranch);
5120 4 : initPopulateTable(con, "pgbench_tellers", ntellers, initTeller);
5121 4 : initPopulateTable(con, "pgbench_accounts", naccounts, initAccount);
5122 :
5123 4 : executeStatement(con, "commit");
5124 4 : }
5125 :
5126 : /*
5127 : * Fill the standard tables with some data generated on the server
5128 : *
5129 : * As already the case with the client-side data generation, the filler
5130 : * column defaults to NULL in pgbench_branches and pgbench_tellers,
5131 : * and is a blank-padded string in pgbench_accounts.
5132 : */
5133 : static void
5134 2 : initGenerateDataServerSide(PGconn *con)
5135 : {
5136 : PQExpBufferData sql;
5137 :
5138 2 : fprintf(stderr, "generating data (server-side)...\n");
5139 :
5140 : /*
5141 : * we do all of this in one transaction to enable the backend's
5142 : * data-loading optimizations
5143 : */
5144 2 : executeStatement(con, "begin");
5145 :
5146 : /* truncate away any old data */
5147 2 : initTruncateTables(con);
5148 :
5149 2 : initPQExpBuffer(&sql);
5150 :
5151 2 : printfPQExpBuffer(&sql,
5152 : "insert into pgbench_branches(bid,bbalance) "
5153 : "select bid, 0 "
5154 : "from generate_series(1, %d) as bid", nbranches * scale);
5155 2 : executeStatement(con, sql.data);
5156 :
5157 2 : printfPQExpBuffer(&sql,
5158 : "insert into pgbench_tellers(tid,bid,tbalance) "
5159 : "select tid, (tid - 1) / %d + 1, 0 "
5160 : "from generate_series(1, %d) as tid", ntellers, ntellers * scale);
5161 2 : executeStatement(con, sql.data);
5162 :
5163 2 : printfPQExpBuffer(&sql,
5164 : "insert into pgbench_accounts(aid,bid,abalance,filler) "
5165 : "select aid, (aid - 1) / %d + 1, 0, '' "
5166 : "from generate_series(1, " INT64_FORMAT ") as aid",
5167 : naccounts, (int64) naccounts * scale);
5168 2 : executeStatement(con, sql.data);
5169 :
5170 2 : termPQExpBuffer(&sql);
5171 :
5172 2 : executeStatement(con, "commit");
5173 2 : }
5174 :
5175 : /*
5176 : * Invoke vacuum on the standard tables
5177 : */
5178 : static void
5179 4 : initVacuum(PGconn *con)
5180 : {
5181 4 : fprintf(stderr, "vacuuming...\n");
5182 4 : executeStatement(con, "vacuum analyze pgbench_branches");
5183 4 : executeStatement(con, "vacuum analyze pgbench_tellers");
5184 4 : executeStatement(con, "vacuum analyze pgbench_accounts");
5185 4 : executeStatement(con, "vacuum analyze pgbench_history");
5186 4 : }
5187 :
5188 : /*
5189 : * Create primary keys on the standard tables
5190 : */
5191 : static void
5192 6 : initCreatePKeys(PGconn *con)
5193 : {
5194 : static const char *const DDLINDEXes[] = {
5195 : "alter table pgbench_branches add primary key (bid)",
5196 : "alter table pgbench_tellers add primary key (tid)",
5197 : "alter table pgbench_accounts add primary key (aid)"
5198 : };
5199 : int i;
5200 : PQExpBufferData query;
5201 :
5202 6 : fprintf(stderr, "creating primary keys...\n");
5203 6 : initPQExpBuffer(&query);
5204 :
5205 24 : for (i = 0; i < lengthof(DDLINDEXes); i++)
5206 : {
5207 18 : resetPQExpBuffer(&query);
5208 18 : appendPQExpBufferStr(&query, DDLINDEXes[i]);
5209 :
5210 18 : if (index_tablespace != NULL)
5211 : {
5212 : char *escape_tablespace;
5213 :
5214 6 : escape_tablespace = PQescapeIdentifier(con, index_tablespace,
5215 : strlen(index_tablespace));
5216 6 : appendPQExpBuffer(&query, " using index tablespace %s", escape_tablespace);
5217 6 : PQfreemem(escape_tablespace);
5218 : }
5219 :
5220 18 : executeStatement(con, query.data);
5221 : }
5222 :
5223 6 : termPQExpBuffer(&query);
5224 6 : }
5225 :
5226 : /*
5227 : * Create foreign key constraints between the standard tables
5228 : */
5229 : static void
5230 4 : initCreateFKeys(PGconn *con)
5231 : {
5232 : static const char *const DDLKEYs[] = {
5233 : "alter table pgbench_tellers add constraint pgbench_tellers_bid_fkey foreign key (bid) references pgbench_branches",
5234 : "alter table pgbench_accounts add constraint pgbench_accounts_bid_fkey foreign key (bid) references pgbench_branches",
5235 : "alter table pgbench_history add constraint pgbench_history_bid_fkey foreign key (bid) references pgbench_branches",
5236 : "alter table pgbench_history add constraint pgbench_history_tid_fkey foreign key (tid) references pgbench_tellers",
5237 : "alter table pgbench_history add constraint pgbench_history_aid_fkey foreign key (aid) references pgbench_accounts"
5238 : };
5239 : int i;
5240 :
5241 4 : fprintf(stderr, "creating foreign keys...\n");
5242 24 : for (i = 0; i < lengthof(DDLKEYs); i++)
5243 : {
5244 20 : executeStatement(con, DDLKEYs[i]);
5245 : }
5246 4 : }
5247 :
5248 : /*
5249 : * Validate an initialization-steps string
5250 : *
5251 : * (We could just leave it to runInitSteps() to fail if there are wrong
5252 : * characters, but since initialization can take awhile, it seems friendlier
5253 : * to check during option parsing.)
5254 : */
5255 : static void
5256 8 : checkInitSteps(const char *initialize_steps)
5257 : {
5258 8 : if (initialize_steps[0] == '\0')
5259 0 : pg_fatal("no initialization steps specified");
5260 :
5261 42 : for (const char *step = initialize_steps; *step != '\0'; step++)
5262 : {
5263 36 : if (strchr(ALL_INIT_STEPS " ", *step) == NULL)
5264 : {
5265 2 : pg_log_error("unrecognized initialization step \"%c\"", *step);
5266 2 : pg_log_error_detail("Allowed step characters are: \"" ALL_INIT_STEPS "\".");
5267 2 : exit(1);
5268 : }
5269 : }
5270 6 : }
5271 :
5272 : /*
5273 : * Invoke each initialization step in the given string
5274 : */
5275 : static void
5276 6 : runInitSteps(const char *initialize_steps)
5277 : {
5278 : PQExpBufferData stats;
5279 : PGconn *con;
5280 : const char *step;
5281 6 : double run_time = 0.0;
5282 6 : bool first = true;
5283 :
5284 6 : initPQExpBuffer(&stats);
5285 :
5286 6 : if ((con = doConnect()) == NULL)
5287 0 : pg_fatal("could not create connection for initialization");
5288 :
5289 6 : setup_cancel_handler(NULL);
5290 6 : SetCancelConn(con);
5291 :
5292 44 : for (step = initialize_steps; *step != '\0'; step++)
5293 : {
5294 38 : char *op = NULL;
5295 38 : pg_time_usec_t start = pg_time_now();
5296 :
5297 38 : switch (*step)
5298 : {
5299 6 : case 'd':
5300 6 : op = "drop tables";
5301 6 : initDropTables(con);
5302 6 : break;
5303 6 : case 't':
5304 6 : op = "create tables";
5305 6 : initCreateTables(con);
5306 6 : break;
5307 4 : case 'g':
5308 4 : op = "client-side generate";
5309 4 : initGenerateDataClientSide(con);
5310 4 : break;
5311 2 : case 'G':
5312 2 : op = "server-side generate";
5313 2 : initGenerateDataServerSide(con);
5314 2 : break;
5315 4 : case 'v':
5316 4 : op = "vacuum";
5317 4 : initVacuum(con);
5318 4 : break;
5319 6 : case 'p':
5320 6 : op = "primary keys";
5321 6 : initCreatePKeys(con);
5322 6 : break;
5323 4 : case 'f':
5324 4 : op = "foreign keys";
5325 4 : initCreateFKeys(con);
5326 4 : break;
5327 6 : case ' ':
5328 6 : break; /* ignore */
5329 0 : default:
5330 0 : pg_log_error("unrecognized initialization step \"%c\"", *step);
5331 0 : PQfinish(con);
5332 0 : exit(1);
5333 : }
5334 :
5335 38 : if (op != NULL)
5336 : {
5337 32 : double elapsed_sec = PG_TIME_GET_DOUBLE(pg_time_now() - start);
5338 :
5339 32 : if (!first)
5340 26 : appendPQExpBufferStr(&stats, ", ");
5341 : else
5342 6 : first = false;
5343 :
5344 32 : appendPQExpBuffer(&stats, "%s %.2f s", op, elapsed_sec);
5345 :
5346 32 : run_time += elapsed_sec;
5347 : }
5348 : }
5349 :
5350 6 : fprintf(stderr, "done in %.2f s (%s).\n", run_time, stats.data);
5351 6 : ResetCancelConn();
5352 6 : PQfinish(con);
5353 6 : termPQExpBuffer(&stats);
5354 6 : }
5355 :
5356 : /*
5357 : * Extract pgbench table information into global variables scale,
5358 : * partition_method and partitions.
5359 : */
5360 : static void
5361 14 : GetTableInfo(PGconn *con, bool scale_given)
5362 : {
5363 : PGresult *res;
5364 :
5365 : /*
5366 : * get the scaling factor that should be same as count(*) from
5367 : * pgbench_branches if this is not a custom query
5368 : */
5369 14 : res = PQexec(con, "select count(*) from pgbench_branches");
5370 14 : if (PQresultStatus(res) != PGRES_TUPLES_OK)
5371 : {
5372 2 : char *sqlState = PQresultErrorField(res, PG_DIAG_SQLSTATE);
5373 :
5374 2 : pg_log_error("could not count number of branches: %s", PQerrorMessage(con));
5375 :
5376 2 : if (sqlState && strcmp(sqlState, ERRCODE_UNDEFINED_TABLE) == 0)
5377 2 : pg_log_error_hint("Perhaps you need to do initialization (\"pgbench -i\") in database \"%s\".",
5378 : PQdb(con));
5379 :
5380 2 : exit(1);
5381 : }
5382 12 : scale = atoi(PQgetvalue(res, 0, 0));
5383 12 : if (scale < 0)
5384 0 : pg_fatal("invalid count(*) from pgbench_branches: \"%s\"",
5385 : PQgetvalue(res, 0, 0));
5386 12 : PQclear(res);
5387 :
5388 : /* warn if we override user-given -s switch */
5389 12 : if (scale_given)
5390 2 : pg_log_warning("scale option ignored, using count from pgbench_branches table (%d)",
5391 : scale);
5392 :
5393 : /*
5394 : * Get the partition information for the first "pgbench_accounts" table
5395 : * found in search_path.
5396 : *
5397 : * The result is empty if no "pgbench_accounts" is found.
5398 : *
5399 : * Otherwise, it always returns one row even if the table is not
5400 : * partitioned (in which case the partition strategy is NULL).
5401 : *
5402 : * The number of partitions can be 0 even for partitioned tables, if no
5403 : * partition is attached.
5404 : *
5405 : * We assume no partitioning on any failure, so as to avoid failing on an
5406 : * old version without "pg_partitioned_table".
5407 : */
5408 12 : res = PQexec(con,
5409 : "select o.n, p.partstrat, pg_catalog.count(i.inhparent) "
5410 : "from pg_catalog.pg_class as c "
5411 : "join pg_catalog.pg_namespace as n on (n.oid = c.relnamespace) "
5412 : "cross join lateral (select pg_catalog.array_position(pg_catalog.current_schemas(true), n.nspname)) as o(n) "
5413 : "left join pg_catalog.pg_partitioned_table as p on (p.partrelid = c.oid) "
5414 : "left join pg_catalog.pg_inherits as i on (c.oid = i.inhparent) "
5415 : "where c.relname = 'pgbench_accounts' and o.n is not null "
5416 : "group by 1, 2 "
5417 : "order by 1 asc "
5418 : "limit 1");
5419 :
5420 12 : if (PQresultStatus(res) != PGRES_TUPLES_OK)
5421 : {
5422 : /* probably an older version, coldly assume no partitioning */
5423 0 : partition_method = PART_NONE;
5424 0 : partitions = 0;
5425 : }
5426 12 : else if (PQntuples(res) == 0)
5427 : {
5428 : /*
5429 : * This case is unlikely as pgbench already found "pgbench_branches"
5430 : * above to compute the scale.
5431 : */
5432 0 : pg_log_error("no pgbench_accounts table found in \"search_path\"");
5433 0 : pg_log_error_hint("Perhaps you need to do initialization (\"pgbench -i\") in database \"%s\".", PQdb(con));
5434 0 : exit(1);
5435 : }
5436 : else /* PQntuples(res) == 1 */
5437 : {
5438 : /* normal case, extract partition information */
5439 12 : if (PQgetisnull(res, 0, 1))
5440 0 : partition_method = PART_NONE;
5441 : else
5442 : {
5443 12 : char *ps = PQgetvalue(res, 0, 1);
5444 :
5445 : /* column must be there */
5446 : Assert(ps != NULL);
5447 :
5448 12 : if (strcmp(ps, "r") == 0)
5449 12 : partition_method = PART_RANGE;
5450 0 : else if (strcmp(ps, "h") == 0)
5451 0 : partition_method = PART_HASH;
5452 : else
5453 : {
5454 : /* possibly a newer version with new partition method */
5455 0 : pg_fatal("unexpected partition method: \"%s\"", ps);
5456 : }
5457 : }
5458 :
5459 12 : partitions = atoi(PQgetvalue(res, 0, 2));
5460 : }
5461 :
5462 12 : PQclear(res);
5463 12 : }
5464 :
5465 : /*
5466 : * Replace :param with $n throughout the command's SQL text, which
5467 : * is a modifiable string in cmd->lines.
5468 : */
5469 : static bool
5470 188 : parseQuery(Command *cmd)
5471 : {
5472 : char *sql,
5473 : *p;
5474 :
5475 188 : cmd->argc = 1;
5476 :
5477 188 : p = sql = pg_strdup(cmd->lines.data);
5478 780 : while ((p = strchr(p, ':')) != NULL)
5479 : {
5480 : char var[13];
5481 : char *name;
5482 : int eaten;
5483 :
5484 594 : name = parseVariable(p, &eaten);
5485 594 : if (name == NULL)
5486 : {
5487 96 : while (*p == ':')
5488 : {
5489 64 : p++;
5490 : }
5491 32 : continue;
5492 : }
5493 :
5494 : /*
5495 : * cmd->argv[0] is the SQL statement itself, so the max number of
5496 : * arguments is one less than MAX_ARGS
5497 : */
5498 562 : if (cmd->argc >= MAX_ARGS)
5499 : {
5500 2 : pg_log_error("statement has too many arguments (maximum is %d): %s",
5501 : MAX_ARGS - 1, cmd->lines.data);
5502 2 : pg_free(name);
5503 2 : return false;
5504 : }
5505 :
5506 560 : sprintf(var, "$%d", cmd->argc);
5507 560 : p = replaceVariable(&sql, p, eaten, var);
5508 :
5509 560 : cmd->argv[cmd->argc] = name;
5510 560 : cmd->argc++;
5511 : }
5512 :
5513 : Assert(cmd->argv[0] == NULL);
5514 186 : cmd->argv[0] = sql;
5515 186 : return true;
5516 : }
5517 :
5518 : /*
5519 : * syntax error while parsing a script (in practice, while parsing a
5520 : * backslash command, because we don't detect syntax errors in SQL)
5521 : *
5522 : * source: source of script (filename or builtin-script ID)
5523 : * lineno: line number within script (count from 1)
5524 : * line: whole line of backslash command, if available
5525 : * command: backslash command name, if available
5526 : * msg: the actual error message
5527 : * more: optional extra message
5528 : * column: zero-based column number, or -1 if unknown
5529 : */
5530 : void
5531 66 : syntax_error(const char *source, int lineno,
5532 : const char *line, const char *command,
5533 : const char *msg, const char *more, int column)
5534 : {
5535 : PQExpBufferData buf;
5536 :
5537 66 : initPQExpBuffer(&buf);
5538 :
5539 66 : printfPQExpBuffer(&buf, "%s:%d: %s", source, lineno, msg);
5540 66 : if (more != NULL)
5541 30 : appendPQExpBuffer(&buf, " (%s)", more);
5542 66 : if (column >= 0 && line == NULL)
5543 0 : appendPQExpBuffer(&buf, " at column %d", column + 1);
5544 66 : if (command != NULL)
5545 60 : appendPQExpBuffer(&buf, " in command \"%s\"", command);
5546 :
5547 66 : pg_log_error("%s", buf.data);
5548 :
5549 66 : termPQExpBuffer(&buf);
5550 :
5551 66 : if (line != NULL)
5552 : {
5553 56 : fprintf(stderr, "%s\n", line);
5554 56 : if (column >= 0)
5555 42 : fprintf(stderr, "%*c error found here\n", column + 1, '^');
5556 : }
5557 :
5558 66 : exit(1);
5559 : }
5560 :
5561 : /*
5562 : * Return a pointer to the start of the SQL command, after skipping over
5563 : * whitespace and "--" comments.
5564 : * If the end of the string is reached, return NULL.
5565 : */
5566 : static char *
5567 2342 : skip_sql_comments(char *sql_command)
5568 : {
5569 2342 : char *p = sql_command;
5570 :
5571 : /* Skip any leading whitespace, as well as "--" style comments */
5572 : for (;;)
5573 : {
5574 2342 : if (isspace((unsigned char) *p))
5575 0 : p++;
5576 2342 : else if (strncmp(p, "--", 2) == 0)
5577 : {
5578 0 : p = strchr(p, '\n');
5579 0 : if (p == NULL)
5580 0 : return NULL;
5581 0 : p++;
5582 : }
5583 : else
5584 2342 : break;
5585 : }
5586 :
5587 : /* NULL if there's nothing but whitespace and comments */
5588 2342 : if (*p == '\0')
5589 1496 : return NULL;
5590 :
5591 846 : return p;
5592 : }
5593 :
5594 : /*
5595 : * Parse a SQL command; return a Command struct, or NULL if it's a comment
5596 : *
5597 : * On entry, psqlscan.l has collected the command into "buf", so we don't
5598 : * really need to do much here except check for comments and set up a Command
5599 : * struct.
5600 : */
5601 : static Command *
5602 2342 : create_sql_command(PQExpBuffer buf, const char *source)
5603 : {
5604 : Command *my_command;
5605 2342 : char *p = skip_sql_comments(buf->data);
5606 :
5607 2342 : if (p == NULL)
5608 1496 : return NULL;
5609 :
5610 : /* Allocate and initialize Command structure */
5611 846 : my_command = (Command *) pg_malloc(sizeof(Command));
5612 846 : initPQExpBuffer(&my_command->lines);
5613 846 : appendPQExpBufferStr(&my_command->lines, p);
5614 846 : my_command->first_line = NULL; /* this is set later */
5615 846 : my_command->type = SQL_COMMAND;
5616 846 : my_command->meta = META_NONE;
5617 846 : my_command->argc = 0;
5618 846 : my_command->retries = 0;
5619 846 : my_command->failures = 0;
5620 846 : memset(my_command->argv, 0, sizeof(my_command->argv));
5621 846 : my_command->varprefix = NULL; /* allocated later, if needed */
5622 846 : my_command->expr = NULL;
5623 846 : initSimpleStats(&my_command->stats);
5624 846 : my_command->prepname = NULL; /* set later, if needed */
5625 :
5626 846 : return my_command;
5627 : }
5628 :
5629 : /* Free a Command structure and associated data */
5630 : static void
5631 62 : free_command(Command *command)
5632 : {
5633 62 : termPQExpBuffer(&command->lines);
5634 62 : pg_free(command->first_line);
5635 128 : for (int i = 0; i < command->argc; i++)
5636 66 : pg_free(command->argv[i]);
5637 62 : pg_free(command->varprefix);
5638 :
5639 : /*
5640 : * It should also free expr recursively, but this is currently not needed
5641 : * as only gset commands (which do not have an expression) are freed.
5642 : */
5643 62 : pg_free(command);
5644 62 : }
5645 :
5646 : /*
5647 : * Once an SQL command is fully parsed, possibly by accumulating several
5648 : * parts, complete other fields of the Command structure.
5649 : */
5650 : static void
5651 584 : postprocess_sql_command(Command *my_command)
5652 : {
5653 : char buffer[128];
5654 : static int prepnum = 0;
5655 :
5656 : Assert(my_command->type == SQL_COMMAND);
5657 :
5658 : /* Save the first line for error display. */
5659 584 : strlcpy(buffer, my_command->lines.data, sizeof(buffer));
5660 584 : buffer[strcspn(buffer, "\n\r")] = '\0';
5661 584 : my_command->first_line = pg_strdup(buffer);
5662 :
5663 : /* Parse query and generate prepared statement name, if necessary */
5664 584 : switch (querymode)
5665 : {
5666 396 : case QUERY_SIMPLE:
5667 396 : my_command->argv[0] = my_command->lines.data;
5668 396 : my_command->argc++;
5669 396 : break;
5670 104 : case QUERY_PREPARED:
5671 104 : my_command->prepname = psprintf("P_%d", prepnum++);
5672 : /* fall through */
5673 188 : case QUERY_EXTENDED:
5674 188 : if (!parseQuery(my_command))
5675 2 : exit(1);
5676 186 : break;
5677 0 : default:
5678 0 : exit(1);
5679 : }
5680 582 : }
5681 :
5682 : /*
5683 : * Parse a backslash command; return a Command struct, or NULL if comment
5684 : *
5685 : * At call, we have scanned only the initial backslash.
5686 : */
5687 : static Command *
5688 1064 : process_backslash_command(PsqlScanState sstate, const char *source,
5689 : int lineno, int start_offset)
5690 : {
5691 : Command *my_command;
5692 : PQExpBufferData word_buf;
5693 : int word_offset;
5694 : int offsets[MAX_ARGS]; /* offsets of argument words */
5695 : int j;
5696 :
5697 1064 : initPQExpBuffer(&word_buf);
5698 :
5699 : /* Collect first word of command */
5700 1064 : if (!expr_lex_one_word(sstate, &word_buf, &word_offset))
5701 : {
5702 0 : termPQExpBuffer(&word_buf);
5703 0 : return NULL;
5704 : }
5705 :
5706 : /* Allocate and initialize Command structure */
5707 1064 : my_command = (Command *) pg_malloc0(sizeof(Command));
5708 1064 : my_command->type = META_COMMAND;
5709 1064 : my_command->argc = 0;
5710 1064 : initSimpleStats(&my_command->stats);
5711 :
5712 : /* Save first word (command name) */
5713 1064 : j = 0;
5714 1064 : offsets[j] = word_offset;
5715 1064 : my_command->argv[j++] = pg_strdup(word_buf.data);
5716 1064 : my_command->argc++;
5717 :
5718 : /* ... and convert it to enum form */
5719 1064 : my_command->meta = getMetaCommand(my_command->argv[0]);
5720 :
5721 1064 : if (my_command->meta == META_SET ||
5722 338 : my_command->meta == META_IF ||
5723 290 : my_command->meta == META_ELIF)
5724 : {
5725 : yyscan_t yyscanner;
5726 :
5727 : /* For \set, collect var name */
5728 800 : if (my_command->meta == META_SET)
5729 : {
5730 726 : if (!expr_lex_one_word(sstate, &word_buf, &word_offset))
5731 2 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5732 : "missing argument", NULL, -1);
5733 :
5734 724 : offsets[j] = word_offset;
5735 724 : my_command->argv[j++] = pg_strdup(word_buf.data);
5736 724 : my_command->argc++;
5737 : }
5738 :
5739 : /* then for all parse the expression */
5740 798 : yyscanner = expr_scanner_init(sstate, source, lineno, start_offset,
5741 798 : my_command->argv[0]);
5742 :
5743 798 : if (expr_yyparse(&my_command->expr, yyscanner) != 0)
5744 : {
5745 : /* dead code: exit done from syntax_error called by yyerror */
5746 0 : exit(1);
5747 : }
5748 :
5749 : /* Save line, trimming any trailing newline */
5750 760 : my_command->first_line =
5751 760 : expr_scanner_get_substring(sstate,
5752 : start_offset,
5753 : true);
5754 :
5755 760 : expr_scanner_finish(yyscanner);
5756 :
5757 760 : termPQExpBuffer(&word_buf);
5758 :
5759 760 : return my_command;
5760 : }
5761 :
5762 : /* For all other commands, collect remaining words. */
5763 846 : while (expr_lex_one_word(sstate, &word_buf, &word_offset))
5764 : {
5765 : /*
5766 : * my_command->argv[0] is the command itself, so the max number of
5767 : * arguments is one less than MAX_ARGS
5768 : */
5769 584 : if (j >= MAX_ARGS)
5770 2 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5771 : "too many arguments", NULL, -1);
5772 :
5773 582 : offsets[j] = word_offset;
5774 582 : my_command->argv[j++] = pg_strdup(word_buf.data);
5775 582 : my_command->argc++;
5776 : }
5777 :
5778 : /* Save line, trimming any trailing newline */
5779 262 : my_command->first_line =
5780 262 : expr_scanner_get_substring(sstate,
5781 : start_offset,
5782 : true);
5783 :
5784 262 : if (my_command->meta == META_SLEEP)
5785 : {
5786 18 : if (my_command->argc < 2)
5787 2 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5788 : "missing argument", NULL, -1);
5789 :
5790 16 : if (my_command->argc > 3)
5791 2 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5792 : "too many arguments", NULL,
5793 2 : offsets[3] - start_offset);
5794 :
5795 : /*
5796 : * Split argument into number and unit to allow "sleep 1ms" etc. We
5797 : * don't have to terminate the number argument with null because it
5798 : * will be parsed with atoi, which ignores trailing non-digit
5799 : * characters.
5800 : */
5801 14 : if (my_command->argv[1][0] != ':')
5802 : {
5803 8 : char *c = my_command->argv[1];
5804 8 : bool have_digit = false;
5805 :
5806 : /* Skip sign */
5807 8 : if (*c == '+' || *c == '-')
5808 0 : c++;
5809 :
5810 : /* Require at least one digit */
5811 8 : if (*c && isdigit((unsigned char) *c))
5812 8 : have_digit = true;
5813 :
5814 : /* Eat all digits */
5815 20 : while (*c && isdigit((unsigned char) *c))
5816 12 : c++;
5817 :
5818 8 : if (*c)
5819 : {
5820 2 : if (my_command->argc == 2 && have_digit)
5821 : {
5822 2 : my_command->argv[2] = c;
5823 2 : offsets[2] = offsets[1] + (c - my_command->argv[1]);
5824 2 : my_command->argc = 3;
5825 : }
5826 : else
5827 : {
5828 : /*
5829 : * Raise an error if argument starts with non-digit
5830 : * character (after sign).
5831 : */
5832 0 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5833 : "invalid sleep time, must be an integer",
5834 0 : my_command->argv[1], offsets[1] - start_offset);
5835 : }
5836 : }
5837 : }
5838 :
5839 14 : if (my_command->argc == 3)
5840 : {
5841 18 : if (pg_strcasecmp(my_command->argv[2], "us") != 0 &&
5842 12 : pg_strcasecmp(my_command->argv[2], "ms") != 0 &&
5843 4 : pg_strcasecmp(my_command->argv[2], "s") != 0)
5844 2 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5845 : "unrecognized time unit, must be us, ms or s",
5846 2 : my_command->argv[2], offsets[2] - start_offset);
5847 : }
5848 : }
5849 244 : else if (my_command->meta == META_SETSHELL)
5850 : {
5851 8 : if (my_command->argc < 3)
5852 2 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5853 : "missing argument", NULL, -1);
5854 : }
5855 236 : else if (my_command->meta == META_SHELL)
5856 : {
5857 8 : if (my_command->argc < 2)
5858 2 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5859 : "missing command", NULL, -1);
5860 : }
5861 228 : else if (my_command->meta == META_ELSE || my_command->meta == META_ENDIF ||
5862 158 : my_command->meta == META_STARTPIPELINE ||
5863 116 : my_command->meta == META_ENDPIPELINE ||
5864 82 : my_command->meta == META_SYNCPIPELINE)
5865 : {
5866 156 : if (my_command->argc != 1)
5867 4 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5868 : "unexpected argument", NULL, -1);
5869 : }
5870 72 : else if (my_command->meta == META_GSET || my_command->meta == META_ASET)
5871 : {
5872 70 : if (my_command->argc > 2)
5873 2 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5874 : "too many arguments", NULL, -1);
5875 : }
5876 : else
5877 : {
5878 : /* my_command->meta == META_NONE */
5879 2 : syntax_error(source, lineno, my_command->first_line, my_command->argv[0],
5880 : "invalid command", NULL, -1);
5881 : }
5882 :
5883 244 : termPQExpBuffer(&word_buf);
5884 :
5885 244 : return my_command;
5886 : }
5887 :
/*
 * Report a problem with the \if ... \endif structure of a script.
 *
 * desc: description of the script
 * cmdn: number of the offending command within the script
 * msg: what is wrong
 *
 * The report goes through pg_fatal(); callers are written as if this
 * function does not return.
 */
static void
ConditionError(const char *desc, int cmdn, const char *msg)
{
	pg_fatal("condition error in script \"%s\" command %d: %s", desc, cmdn, msg);
}
5894 :
5895 : /*
5896 : * Partial evaluation of conditionals before recording and running the script.
5897 : */
5898 : static void
5899 496 : CheckConditional(const ParsedScript *ps)
5900 : {
5901 : /* statically check conditional structure */
5902 496 : ConditionalStack cs = conditional_stack_create();
5903 : int i;
5904 :
5905 2248 : for (i = 0; ps->commands[i] != NULL; i++)
5906 : {
5907 1762 : Command *cmd = ps->commands[i];
5908 :
5909 1762 : if (cmd->type == META_COMMAND)
5910 : {
5911 922 : switch (cmd->meta)
5912 : {
5913 40 : case META_IF:
5914 40 : conditional_stack_push(cs, IFSTATE_FALSE);
5915 40 : break;
5916 24 : case META_ELIF:
5917 24 : if (conditional_stack_empty(cs))
5918 2 : ConditionError(ps->desc, i + 1, "\\elif without matching \\if");
5919 22 : if (conditional_stack_peek(cs) == IFSTATE_ELSE_FALSE)
5920 2 : ConditionError(ps->desc, i + 1, "\\elif after \\else");
5921 20 : break;
5922 26 : case META_ELSE:
5923 26 : if (conditional_stack_empty(cs))
5924 2 : ConditionError(ps->desc, i + 1, "\\else without matching \\if");
5925 24 : if (conditional_stack_peek(cs) == IFSTATE_ELSE_FALSE)
5926 2 : ConditionError(ps->desc, i + 1, "\\else after \\else");
5927 22 : conditional_stack_poke(cs, IFSTATE_ELSE_FALSE);
5928 22 : break;
5929 36 : case META_ENDIF:
5930 36 : if (!conditional_stack_pop(cs))
5931 2 : ConditionError(ps->desc, i + 1, "\\endif without matching \\if");
5932 34 : break;
5933 796 : default:
5934 : /* ignore anything else... */
5935 796 : break;
5936 : }
5937 : }
5938 : }
5939 486 : if (!conditional_stack_empty(cs))
5940 2 : ConditionError(ps->desc, i + 1, "\\if without matching \\endif");
5941 484 : conditional_stack_destroy(cs);
5942 484 : }
5943 :
5944 : /*
5945 : * Parse a script (either the contents of a file, or a built-in script)
5946 : * and add it to the list of scripts.
5947 : */
5948 : static void
5949 566 : ParseScript(const char *script, const char *desc, int weight)
5950 : {
5951 : ParsedScript ps;
5952 : PsqlScanState sstate;
5953 : PQExpBufferData line_buf;
5954 : int alloc_num;
5955 : int index;
5956 :
5957 : #define COMMANDS_ALLOC_NUM 128
5958 566 : alloc_num = COMMANDS_ALLOC_NUM;
5959 :
5960 : /* Initialize all fields of ps */
5961 566 : ps.desc = desc;
5962 566 : ps.weight = weight;
5963 566 : ps.commands = (Command **) pg_malloc(sizeof(Command *) * alloc_num);
5964 566 : initStats(&ps.stats, 0);
5965 :
5966 : /* Prepare to parse script */
5967 566 : sstate = psql_scan_create(&pgbench_callbacks);
5968 :
5969 : /*
5970 : * Ideally, we'd scan scripts using the encoding and stdstrings settings
5971 : * we get from a DB connection. However, without major rearrangement of
5972 : * pgbench's argument parsing, we can't have a DB connection at the time
5973 : * we parse scripts. Using SQL_ASCII (encoding 0) should work well enough
5974 : * with any backend-safe encoding, though conceivably we could be fooled
5975 : * if a script file uses a client-only encoding. We also assume that
5976 : * stdstrings should be true, which is a bit riskier.
5977 : */
5978 566 : psql_scan_setup(sstate, script, strlen(script), 0, true);
5979 :
5980 566 : initPQExpBuffer(&line_buf);
5981 :
5982 566 : index = 0;
5983 :
5984 : for (;;)
5985 1776 : {
5986 : PsqlScanResult sr;
5987 : promptStatus_t prompt;
5988 2342 : Command *command = NULL;
5989 :
5990 2342 : resetPQExpBuffer(&line_buf);
5991 :
5992 2342 : sr = psql_scan(sstate, &line_buf, &prompt);
5993 :
5994 : /* If we collected a new SQL command, process that */
5995 2342 : command = create_sql_command(&line_buf, desc);
5996 :
5997 : /* store new command */
5998 2342 : if (command)
5999 846 : ps.commands[index++] = command;
6000 :
6001 : /* If we reached a backslash, process that */
6002 2342 : if (sr == PSCAN_BACKSLASH)
6003 : {
6004 : int lineno;
6005 : int start_offset;
6006 :
6007 : /* Capture location of the backslash */
6008 1064 : psql_scan_get_location(sstate, &lineno, &start_offset);
6009 1064 : start_offset--;
6010 :
6011 1064 : command = process_backslash_command(sstate, desc,
6012 : lineno, start_offset);
6013 :
6014 1004 : if (command)
6015 : {
6016 : /*
6017 : * If this is gset or aset, merge into the preceding command.
6018 : * (We don't use a command slot in this case).
6019 : */
6020 1004 : if (command->meta == META_GSET || command->meta == META_ASET)
6021 62 : {
6022 : Command *cmd;
6023 :
6024 68 : if (index == 0)
6025 2 : syntax_error(desc, lineno, NULL, NULL,
6026 : "\\gset must follow an SQL command",
6027 : NULL, -1);
6028 :
6029 66 : cmd = ps.commands[index - 1];
6030 :
6031 66 : if (cmd->type != SQL_COMMAND ||
6032 64 : cmd->varprefix != NULL)
6033 4 : syntax_error(desc, lineno, NULL, NULL,
6034 : "\\gset must follow an SQL command",
6035 4 : cmd->first_line, -1);
6036 :
6037 : /* get variable prefix */
6038 62 : if (command->argc <= 1 || command->argv[1][0] == '\0')
6039 58 : cmd->varprefix = pg_strdup("");
6040 : else
6041 4 : cmd->varprefix = pg_strdup(command->argv[1]);
6042 :
6043 : /* update the sql command meta */
6044 62 : cmd->meta = command->meta;
6045 :
6046 : /* cleanup unused command */
6047 62 : free_command(command);
6048 :
6049 62 : continue;
6050 : }
6051 :
6052 : /* Attach any other backslash command as a new command */
6053 936 : ps.commands[index++] = command;
6054 : }
6055 : }
6056 :
6057 : /*
6058 : * Since we used a command slot, allocate more if needed. Note we
6059 : * always allocate one more in order to accommodate the NULL
6060 : * terminator below.
6061 : */
6062 2214 : if (index >= alloc_num)
6063 : {
6064 0 : alloc_num += COMMANDS_ALLOC_NUM;
6065 0 : ps.commands = (Command **)
6066 0 : pg_realloc(ps.commands, sizeof(Command *) * alloc_num);
6067 : }
6068 :
6069 : /* Done if we reached EOF */
6070 2214 : if (sr == PSCAN_INCOMPLETE || sr == PSCAN_EOL)
6071 : break;
6072 : }
6073 :
6074 500 : ps.commands[index] = NULL;
6075 :
6076 500 : addScript(&ps);
6077 :
6078 484 : termPQExpBuffer(&line_buf);
6079 484 : psql_scan_finish(sstate);
6080 484 : psql_scan_destroy(sstate);
6081 484 : }
6082 :
/*
 * Slurp everything readable from stream "fd" into a freshly malloc'd,
 * NUL-terminated buffer and return it.
 *
 * The buffer grows in BUFSIZ-sized steps, so it usually ends up larger than
 * the data it holds.  That waste is harmless in this program, since the
 * buffer is freed as soon as the script has been parsed.
 *
 * A read error merely ends the loop early; this function does not report it.
 */
static char *
read_file_contents(FILE *fd)
{
	size_t		capacity = BUFSIZ;
	size_t		filled = 0;
	size_t		got;
	char	   *contents = (char *) pg_malloc(capacity);

	/* Keep pulling full BUFSIZ chunks; a short read means EOF or error */
	while ((got = fread(contents + filled, 1, BUFSIZ, fd)) == BUFSIZ)
	{
		filled += got;

		/* Make room for the next chunk */
		capacity += BUFSIZ;
		contents = (char *) pg_realloc(contents, capacity);
	}

	/* Account for the final, short chunk */
	filled += got;

	/* The last read was short, so at least one spare byte remains */
	contents[filled] = '\0';

	return contents;
}
6116 :
/*
 * Load the script stored in "filename" and add it to the script list with
 * the given weight.  The special name "-" selects standard input.
 *
 * NB: "filename" must point to storage that won't disappear, because it is
 * passed on to ParseScript() as the script's description.
 */
static void
process_file(const char *filename, int weight)
{
	bool		from_stdin = (strcmp(filename, "-") == 0);
	FILE	   *stream;
	char	   *contents;

	/* Pick the input stream */
	if (from_stdin)
		stream = stdin;
	else
	{
		stream = fopen(filename, "r");
		if (stream == NULL)
			pg_fatal("could not open file \"%s\": %m", filename);
	}

	/* Read it all in, then find out whether reading stopped on an error */
	contents = read_file_contents(stream);
	if (ferror(stream))
		pg_fatal("could not read file \"%s\": %m", filename);

	/* Never close stdin; we only own streams we opened ourselves */
	if (stream != stdin)
		fclose(stream);

	ParseScript(contents, filename, weight);

	free(contents);
}
6146 :
6147 : /* Parse the given builtin script and add it to the list. */
6148 : static void
6149 306 : process_builtin(const BuiltinScript *bi, int weight)
6150 : {
6151 306 : ParseScript(bi->script, bi->desc, weight);
6152 304 : }
6153 :
6154 : /* show available builtin scripts */
6155 : static void
6156 6 : listAvailableScripts(void)
6157 : {
6158 : int i;
6159 :
6160 6 : fprintf(stderr, "Available builtin scripts:\n");
6161 24 : for (i = 0; i < lengthof(builtin_script); i++)
6162 18 : fprintf(stderr, " %13s: %s\n", builtin_script[i].name, builtin_script[i].desc);
6163 6 : fprintf(stderr, "\n");
6164 6 : }
6165 :
6166 : /* return builtin script "name" if unambiguous, fails if not found */
6167 : static const BuiltinScript *
6168 312 : findBuiltin(const char *name)
6169 : {
6170 : int i,
6171 312 : found = 0,
6172 312 : len = strlen(name);
6173 312 : const BuiltinScript *result = NULL;
6174 :
6175 1248 : for (i = 0; i < lengthof(builtin_script); i++)
6176 : {
6177 936 : if (strncmp(builtin_script[i].name, name, len) == 0)
6178 : {
6179 312 : result = &builtin_script[i];
6180 312 : found++;
6181 : }
6182 : }
6183 :
6184 : /* ok, unambiguous result */
6185 312 : if (found == 1)
6186 308 : return result;
6187 :
6188 : /* error cases */
6189 4 : if (found == 0)
6190 2 : pg_log_error("no builtin script found for name \"%s\"", name);
6191 : else /* found > 1 */
6192 2 : pg_log_error("ambiguous builtin name: %d builtin scripts found for prefix \"%s\"", found, name);
6193 :
6194 4 : listAvailableScripts();
6195 4 : exit(1);
6196 : }
6197 :
6198 : /*
6199 : * Determine the weight specification from a script option (-b, -f), if any,
6200 : * and return it as an integer (1 is returned if there's no weight). The
6201 : * script name is returned in *script as a malloc'd string.
6202 : */
6203 : static int
6204 284 : parseScriptWeight(const char *option, char **script)
6205 : {
6206 : char *sep;
6207 : int weight;
6208 :
6209 284 : if ((sep = strrchr(option, WSEP)))
6210 : {
6211 18 : int namelen = sep - option;
6212 : long wtmp;
6213 : char *badp;
6214 :
6215 : /* generate the script name */
6216 18 : *script = pg_malloc(namelen + 1);
6217 18 : strncpy(*script, option, namelen);
6218 18 : (*script)[namelen] = '\0';
6219 :
6220 : /* process digits of the weight spec */
6221 18 : errno = 0;
6222 18 : wtmp = strtol(sep + 1, &badp, 10);
6223 18 : if (errno != 0 || badp == sep + 1 || *badp != '\0')
6224 2 : pg_fatal("invalid weight specification: %s", sep);
6225 16 : if (wtmp > INT_MAX || wtmp < 0)
6226 2 : pg_fatal("weight specification out of range (0 .. %d): %lld",
6227 : INT_MAX, (long long) wtmp);
6228 14 : weight = wtmp;
6229 : }
6230 : else
6231 : {
6232 266 : *script = pg_strdup(option);
6233 266 : weight = 1;
6234 : }
6235 :
6236 280 : return weight;
6237 : }
6238 :
6239 : /* append a script to the list of scripts to process */
6240 : static void
6241 500 : addScript(const ParsedScript *script)
6242 : {
6243 500 : if (script->commands == NULL || script->commands[0] == NULL)
6244 2 : pg_fatal("empty command list for script \"%s\"", script->desc);
6245 :
6246 498 : if (num_scripts >= MAX_SCRIPTS)
6247 2 : pg_fatal("at most %d SQL scripts are allowed", MAX_SCRIPTS);
6248 :
6249 496 : CheckConditional(script);
6250 :
6251 484 : sql_script[num_scripts] = *script;
6252 484 : num_scripts++;
6253 484 : }
6254 :
6255 : /*
6256 : * Print progress report.
6257 : *
6258 : * On entry, *last and *last_report contain the statistics and time of last
6259 : * progress report. On exit, they are updated with the new stats.
6260 : */
6261 : static void
6262 0 : printProgressReport(TState *threads, int64 test_start, pg_time_usec_t now,
6263 : StatsData *last, int64 *last_report)
6264 : {
6265 : /* generate and show report */
6266 0 : pg_time_usec_t run = now - *last_report;
6267 : int64 cnt,
6268 : failures,
6269 : retried;
6270 : double tps,
6271 : total_run,
6272 : latency,
6273 : sqlat,
6274 : lag,
6275 : stdev;
6276 : char tbuf[315];
6277 : StatsData cur;
6278 :
6279 : /*
6280 : * Add up the statistics of all threads.
6281 : *
6282 : * XXX: No locking. There is no guarantee that we get an atomic snapshot
6283 : * of the transaction count and latencies, so these figures can well be
6284 : * off by a small amount. The progress report's purpose is to give a
6285 : * quick overview of how the test is going, so that shouldn't matter too
6286 : * much. (If a read from a 64-bit integer is not atomic, you might get a
6287 : * "torn" read and completely bogus latencies though!)
6288 : */
6289 0 : initStats(&cur, 0);
6290 0 : for (int i = 0; i < nthreads; i++)
6291 : {
6292 0 : mergeSimpleStats(&cur.latency, &threads[i].stats.latency);
6293 0 : mergeSimpleStats(&cur.lag, &threads[i].stats.lag);
6294 0 : cur.cnt += threads[i].stats.cnt;
6295 0 : cur.skipped += threads[i].stats.skipped;
6296 0 : cur.retries += threads[i].stats.retries;
6297 0 : cur.retried += threads[i].stats.retried;
6298 0 : cur.serialization_failures +=
6299 0 : threads[i].stats.serialization_failures;
6300 0 : cur.deadlock_failures += threads[i].stats.deadlock_failures;
6301 : }
6302 :
6303 : /* we count only actually executed transactions */
6304 0 : cnt = cur.cnt - last->cnt;
6305 0 : total_run = (now - test_start) / 1000000.0;
6306 0 : tps = 1000000.0 * cnt / run;
6307 0 : if (cnt > 0)
6308 : {
6309 0 : latency = 0.001 * (cur.latency.sum - last->latency.sum) / cnt;
6310 0 : sqlat = 1.0 * (cur.latency.sum2 - last->latency.sum2) / cnt;
6311 0 : stdev = 0.001 * sqrt(sqlat - 1000000.0 * latency * latency);
6312 0 : lag = 0.001 * (cur.lag.sum - last->lag.sum) / cnt;
6313 : }
6314 : else
6315 : {
6316 0 : latency = sqlat = stdev = lag = 0;
6317 : }
6318 0 : failures = getFailures(&cur) - getFailures(last);
6319 0 : retried = cur.retried - last->retried;
6320 :
6321 0 : if (progress_timestamp)
6322 : {
6323 0 : snprintf(tbuf, sizeof(tbuf), "%.3f s",
6324 0 : PG_TIME_GET_DOUBLE(now + epoch_shift));
6325 : }
6326 : else
6327 : {
6328 : /* round seconds are expected, but the thread may be late */
6329 0 : snprintf(tbuf, sizeof(tbuf), "%.1f s", total_run);
6330 : }
6331 :
6332 0 : fprintf(stderr,
6333 : "progress: %s, %.1f tps, lat %.3f ms stddev %.3f, " INT64_FORMAT " failed",
6334 : tbuf, tps, latency, stdev, failures);
6335 :
6336 0 : if (throttle_delay)
6337 : {
6338 0 : fprintf(stderr, ", lag %.3f ms", lag);
6339 0 : if (latency_limit)
6340 0 : fprintf(stderr, ", " INT64_FORMAT " skipped",
6341 0 : cur.skipped - last->skipped);
6342 : }
6343 :
6344 : /* it can be non-zero only if max_tries is not equal to one */
6345 0 : if (max_tries != 1)
6346 0 : fprintf(stderr,
6347 : ", " INT64_FORMAT " retried, " INT64_FORMAT " retries",
6348 0 : retried, cur.retries - last->retries);
6349 0 : fprintf(stderr, "\n");
6350 :
6351 0 : *last = cur;
6352 0 : *last_report = now;
6353 0 : }
6354 :
6355 : static void
6356 30 : printSimpleStats(const char *prefix, SimpleStats *ss)
6357 : {
6358 30 : if (ss->count > 0)
6359 : {
6360 30 : double latency = ss->sum / ss->count;
6361 30 : double stddev = sqrt(ss->sum2 / ss->count - latency * latency);
6362 :
6363 30 : printf("%s average = %.3f ms\n", prefix, 0.001 * latency);
6364 30 : printf("%s stddev = %.3f ms\n", prefix, 0.001 * stddev);
6365 : }
6366 30 : }
6367 :
6368 : /* print version banner */
6369 : static void
6370 174 : printVersion(PGconn *con)
6371 : {
6372 174 : int server_ver = PQserverVersion(con);
6373 174 : int client_ver = PG_VERSION_NUM;
6374 :
6375 174 : if (server_ver != client_ver)
6376 : {
6377 : const char *server_version;
6378 : char sverbuf[32];
6379 :
6380 : /* Try to get full text form, might include "devel" etc */
6381 0 : server_version = PQparameterStatus(con, "server_version");
6382 : /* Otherwise fall back on server_ver */
6383 0 : if (!server_version)
6384 : {
6385 0 : formatPGVersionNumber(server_ver, true,
6386 : sverbuf, sizeof(sverbuf));
6387 0 : server_version = sverbuf;
6388 : }
6389 :
6390 0 : printf(_("%s (%s, server %s)\n"),
6391 : "pgbench", PG_VERSION, server_version);
6392 : }
6393 : /* For version match, only print pgbench version */
6394 : else
6395 174 : printf("%s (%s)\n", "pgbench", PG_VERSION);
6396 174 : fflush(stdout);
6397 174 : }
6398 :
6399 : /* print out results */
6400 : static void
6401 170 : printResults(StatsData *total,
6402 : pg_time_usec_t total_duration, /* benchmarking time */
6403 : pg_time_usec_t conn_total_duration, /* is_connect */
6404 : pg_time_usec_t conn_elapsed_duration, /* !is_connect */
6405 : int64 latency_late)
6406 : {
6407 : /* tps is about actually executed transactions during benchmarking */
6408 170 : int64 failures = getFailures(total);
6409 170 : int64 total_cnt = total->cnt + total->skipped + failures;
6410 170 : double bench_duration = PG_TIME_GET_DOUBLE(total_duration);
6411 170 : double tps = total->cnt / bench_duration;
6412 :
6413 : /* Report test parameters. */
6414 170 : printf("transaction type: %s\n",
6415 : num_scripts == 1 ? sql_script[0].desc : "multiple scripts");
6416 170 : printf("scaling factor: %d\n", scale);
6417 : /* only print partitioning information if some partitioning was detected */
6418 170 : if (partition_method != PART_NONE)
6419 12 : printf("partition method: %s\npartitions: %d\n",
6420 : PARTITION_METHOD[partition_method], partitions);
6421 170 : printf("query mode: %s\n", QUERYMODE[querymode]);
6422 170 : printf("number of clients: %d\n", nclients);
6423 170 : printf("number of threads: %d\n", nthreads);
6424 :
6425 170 : if (max_tries)
6426 170 : printf("maximum number of tries: %u\n", max_tries);
6427 :
6428 170 : if (duration <= 0)
6429 : {
6430 170 : printf("number of transactions per client: %d\n", nxacts);
6431 170 : printf("number of transactions actually processed: " INT64_FORMAT "/%d\n",
6432 : total->cnt, nxacts * nclients);
6433 : }
6434 : else
6435 : {
6436 0 : printf("duration: %d s\n", duration);
6437 0 : printf("number of transactions actually processed: " INT64_FORMAT "\n",
6438 : total->cnt);
6439 : }
6440 :
6441 : /*
6442 : * Remaining stats are nonsensical if we failed to execute any xacts due
6443 : * to others than serialization or deadlock errors
6444 : */
6445 170 : if (total_cnt <= 0)
6446 100 : return;
6447 :
6448 70 : printf("number of failed transactions: " INT64_FORMAT " (%.3f%%)\n",
6449 : failures, 100.0 * failures / total_cnt);
6450 :
6451 70 : if (failures_detailed)
6452 : {
6453 0 : printf("number of serialization failures: " INT64_FORMAT " (%.3f%%)\n",
6454 : total->serialization_failures,
6455 : 100.0 * total->serialization_failures / total_cnt);
6456 0 : printf("number of deadlock failures: " INT64_FORMAT " (%.3f%%)\n",
6457 : total->deadlock_failures,
6458 : 100.0 * total->deadlock_failures / total_cnt);
6459 : }
6460 :
6461 : /* it can be non-zero only if max_tries is not equal to one */
6462 70 : if (max_tries != 1)
6463 : {
6464 4 : printf("number of transactions retried: " INT64_FORMAT " (%.3f%%)\n",
6465 : total->retried, 100.0 * total->retried / total_cnt);
6466 4 : printf("total number of retries: " INT64_FORMAT "\n", total->retries);
6467 : }
6468 :
6469 70 : if (throttle_delay && latency_limit)
6470 4 : printf("number of transactions skipped: " INT64_FORMAT " (%.3f%%)\n",
6471 : total->skipped, 100.0 * total->skipped / total_cnt);
6472 :
6473 70 : if (latency_limit)
6474 4 : printf("number of transactions above the %.1f ms latency limit: " INT64_FORMAT "/" INT64_FORMAT " (%.3f%%)\n",
6475 : latency_limit / 1000.0, latency_late, total->cnt,
6476 : (total->cnt > 0) ? 100.0 * latency_late / total->cnt : 0.0);
6477 :
6478 70 : if (throttle_delay || progress || latency_limit)
6479 4 : printSimpleStats("latency", &total->latency);
6480 : else
6481 : {
6482 : /* no measurement, show average latency computed from run time */
6483 66 : printf("latency average = %.3f ms%s\n",
6484 : 0.001 * total_duration * nclients / total_cnt,
6485 : failures > 0 ? " (including failures)" : "");
6486 : }
6487 :
6488 70 : if (throttle_delay)
6489 : {
6490 : /*
6491 : * Report average transaction lag under rate limit throttling. This
6492 : * is the delay between scheduled and actual start times for the
6493 : * transaction. The measured lag may be caused by thread/client load,
6494 : * the database load, or the Poisson throttling process.
6495 : */
6496 4 : printf("rate limit schedule lag: avg %.3f (max %.3f) ms\n",
6497 : 0.001 * total->lag.sum / total->cnt, 0.001 * total->lag.max);
6498 : }
6499 :
6500 : /*
6501 : * Under -C/--connect, each transaction incurs a significant connection
6502 : * cost, it would not make much sense to ignore it in tps, and it would
6503 : * not be tps anyway.
6504 : *
6505 : * Otherwise connections are made just once at the beginning of the run
6506 : * and should not impact performance but for very short run, so they are
6507 : * (right)fully ignored in tps.
6508 : */
6509 70 : if (is_connect)
6510 : {
6511 4 : printf("average connection time = %.3f ms\n", 0.001 * conn_total_duration / (total->cnt + failures));
6512 4 : printf("tps = %f (including reconnection times)\n", tps);
6513 : }
6514 : else
6515 : {
6516 66 : printf("initial connection time = %.3f ms\n", 0.001 * conn_elapsed_duration);
6517 66 : printf("tps = %f (without initial connection time)\n", tps);
6518 : }
6519 :
6520 : /* Report per-script/command statistics */
6521 70 : if (per_script_stats || report_per_command)
6522 : {
6523 : int i;
6524 :
6525 42 : for (i = 0; i < num_scripts; i++)
6526 : {
6527 30 : if (per_script_stats)
6528 : {
6529 26 : StatsData *sstats = &sql_script[i].stats;
6530 26 : int64 script_failures = getFailures(sstats);
6531 26 : int64 script_total_cnt =
6532 26 : sstats->cnt + sstats->skipped + script_failures;
6533 :
6534 26 : printf("SQL script %d: %s\n"
6535 : " - weight: %d (targets %.1f%% of total)\n"
6536 : " - " INT64_FORMAT " transactions (%.1f%% of total)\n",
6537 : i + 1, sql_script[i].desc,
6538 : sql_script[i].weight,
6539 : 100.0 * sql_script[i].weight / total_weight,
6540 : script_total_cnt,
6541 : 100.0 * script_total_cnt / total_cnt);
6542 :
6543 26 : if (script_total_cnt > 0)
6544 : {
6545 26 : printf(" - number of transactions actually processed: " INT64_FORMAT " (tps = %f)\n",
6546 : sstats->cnt, sstats->cnt / bench_duration);
6547 :
6548 26 : printf(" - number of failed transactions: " INT64_FORMAT " (%.3f%%)\n",
6549 : script_failures,
6550 : 100.0 * script_failures / script_total_cnt);
6551 :
6552 26 : if (failures_detailed)
6553 : {
6554 0 : printf(" - number of serialization failures: " INT64_FORMAT " (%.3f%%)\n",
6555 : sstats->serialization_failures,
6556 : (100.0 * sstats->serialization_failures /
6557 : script_total_cnt));
6558 0 : printf(" - number of deadlock failures: " INT64_FORMAT " (%.3f%%)\n",
6559 : sstats->deadlock_failures,
6560 : (100.0 * sstats->deadlock_failures /
6561 : script_total_cnt));
6562 : }
6563 :
6564 : /*
6565 : * it can be non-zero only if max_tries is not equal to
6566 : * one
6567 : */
6568 26 : if (max_tries != 1)
6569 : {
6570 0 : printf(" - number of transactions retried: " INT64_FORMAT " (%.3f%%)\n",
6571 : sstats->retried,
6572 : 100.0 * sstats->retried / script_total_cnt);
6573 0 : printf(" - total number of retries: " INT64_FORMAT "\n",
6574 : sstats->retries);
6575 : }
6576 :
6577 26 : if (throttle_delay && latency_limit)
6578 0 : printf(" - number of transactions skipped: " INT64_FORMAT " (%.3f%%)\n",
6579 : sstats->skipped,
6580 : 100.0 * sstats->skipped / script_total_cnt);
6581 :
6582 : }
6583 26 : printSimpleStats(" - latency", &sstats->latency);
6584 : }
6585 :
6586 : /*
6587 : * Report per-command statistics: latencies, retries after errors,
6588 : * failures (errors without retrying).
6589 : */
6590 30 : if (report_per_command)
6591 : {
6592 : Command **commands;
6593 :
6594 4 : printf("%sstatement latencies in milliseconds%s:\n",
6595 : per_script_stats ? " - " : "",
6596 : (max_tries == 1 ?
6597 : " and failures" :
6598 : ", failures and retries"));
6599 :
6600 4 : for (commands = sql_script[i].commands;
6601 10 : *commands != NULL;
6602 6 : commands++)
6603 : {
6604 6 : SimpleStats *cstats = &(*commands)->stats;
6605 :
6606 6 : if (max_tries == 1)
6607 6 : printf(" %11.3f %10" PRId64 " %s\n",
6608 : (cstats->count > 0) ?
6609 : 1000.0 * cstats->sum / cstats->count : 0.0,
6610 : (*commands)->failures,
6611 : (*commands)->first_line);
6612 : else
6613 0 : printf(" %11.3f %10" PRId64 " %10" PRId64 " %s\n",
6614 : (cstats->count > 0) ?
6615 : 1000.0 * cstats->sum / cstats->count : 0.0,
6616 : (*commands)->failures,
6617 : (*commands)->retries,
6618 : (*commands)->first_line);
6619 : }
6620 : }
6621 : }
6622 : }
6623 : }
6624 :
6625 : /*
6626 : * Set up a random seed according to seed parameter (NULL means default),
6627 : * and initialize base_random_sequence for use in initializing other sequences.
6628 : */
6629 : static bool
6630 360 : set_random_seed(const char *seed)
6631 : {
6632 : uint64 iseed;
6633 :
6634 360 : if (seed == NULL || strcmp(seed, "time") == 0)
6635 : {
6636 : /* rely on current time */
6637 352 : iseed = pg_time_now();
6638 : }
6639 8 : else if (strcmp(seed, "rand") == 0)
6640 : {
6641 : /* use some "strong" random source */
6642 0 : if (!pg_strong_random(&iseed, sizeof(iseed)))
6643 : {
6644 0 : pg_log_error("could not generate random seed");
6645 0 : return false;
6646 : }
6647 : }
6648 : else
6649 : {
6650 : char garbage;
6651 :
6652 8 : if (sscanf(seed, "%" SCNu64 "%c", &iseed, &garbage) != 1)
6653 : {
6654 2 : pg_log_error("unrecognized random seed option \"%s\"", seed);
6655 2 : pg_log_error_detail("Expecting an unsigned integer, \"time\" or \"rand\".");
6656 2 : return false;
6657 : }
6658 : }
6659 :
6660 358 : if (seed != NULL)
6661 6 : pg_log_info("setting random seed to %" PRIu64, iseed);
6662 :
6663 358 : random_seed = iseed;
6664 :
6665 : /* Initialize base_random_sequence using seed */
6666 358 : pg_prng_seed(&base_random_sequence, iseed);
6667 :
6668 358 : return true;
6669 : }
6670 :
6671 : int
6672 356 : main(int argc, char **argv)
6673 : {
6674 : static struct option long_options[] = {
6675 : /* systematic long/short named options */
6676 : {"builtin", required_argument, NULL, 'b'},
6677 : {"client", required_argument, NULL, 'c'},
6678 : {"connect", no_argument, NULL, 'C'},
6679 : {"dbname", required_argument, NULL, 'd'},
6680 : {"define", required_argument, NULL, 'D'},
6681 : {"file", required_argument, NULL, 'f'},
6682 : {"fillfactor", required_argument, NULL, 'F'},
6683 : {"host", required_argument, NULL, 'h'},
6684 : {"initialize", no_argument, NULL, 'i'},
6685 : {"init-steps", required_argument, NULL, 'I'},
6686 : {"jobs", required_argument, NULL, 'j'},
6687 : {"log", no_argument, NULL, 'l'},
6688 : {"latency-limit", required_argument, NULL, 'L'},
6689 : {"no-vacuum", no_argument, NULL, 'n'},
6690 : {"port", required_argument, NULL, 'p'},
6691 : {"progress", required_argument, NULL, 'P'},
6692 : {"protocol", required_argument, NULL, 'M'},
6693 : {"quiet", no_argument, NULL, 'q'},
6694 : {"report-per-command", no_argument, NULL, 'r'},
6695 : {"rate", required_argument, NULL, 'R'},
6696 : {"scale", required_argument, NULL, 's'},
6697 : {"select-only", no_argument, NULL, 'S'},
6698 : {"skip-some-updates", no_argument, NULL, 'N'},
6699 : {"time", required_argument, NULL, 'T'},
6700 : {"transactions", required_argument, NULL, 't'},
6701 : {"username", required_argument, NULL, 'U'},
6702 : {"vacuum-all", no_argument, NULL, 'v'},
6703 : /* long-named only options */
6704 : {"unlogged-tables", no_argument, NULL, 1},
6705 : {"tablespace", required_argument, NULL, 2},
6706 : {"index-tablespace", required_argument, NULL, 3},
6707 : {"sampling-rate", required_argument, NULL, 4},
6708 : {"aggregate-interval", required_argument, NULL, 5},
6709 : {"progress-timestamp", no_argument, NULL, 6},
6710 : {"log-prefix", required_argument, NULL, 7},
6711 : {"foreign-keys", no_argument, NULL, 8},
6712 : {"random-seed", required_argument, NULL, 9},
6713 : {"show-script", required_argument, NULL, 10},
6714 : {"partitions", required_argument, NULL, 11},
6715 : {"partition-method", required_argument, NULL, 12},
6716 : {"failures-detailed", no_argument, NULL, 13},
6717 : {"max-tries", required_argument, NULL, 14},
6718 : {"verbose-errors", no_argument, NULL, 15},
6719 : {"exit-on-abort", no_argument, NULL, 16},
6720 : {"debug", no_argument, NULL, 17},
6721 : {NULL, 0, NULL, 0}
6722 : };
6723 :
6724 : int c;
6725 356 : bool is_init_mode = false; /* initialize mode? */
6726 356 : char *initialize_steps = NULL;
6727 356 : bool foreign_keys = false;
6728 356 : bool is_no_vacuum = false;
6729 356 : bool do_vacuum_accounts = false; /* vacuum accounts table? */
6730 : int optindex;
6731 356 : bool scale_given = false;
6732 :
6733 356 : bool benchmarking_option_set = false;
6734 356 : bool initialization_option_set = false;
6735 356 : bool internal_script_used = false;
6736 :
6737 : CState *state; /* status of clients */
6738 : TState *threads; /* array of thread */
6739 :
6740 : pg_time_usec_t
6741 : start_time, /* start up time */
6742 356 : bench_start = 0, /* first recorded benchmarking time */
6743 : conn_total_duration; /* cumulated connection time in
6744 : * threads */
6745 356 : int64 latency_late = 0;
6746 : StatsData stats;
6747 : int weight;
6748 :
6749 : int i;
6750 : int nclients_dealt;
6751 :
6752 : #ifdef HAVE_GETRLIMIT
6753 : struct rlimit rlim;
6754 : #endif
6755 :
6756 : PGconn *con;
6757 : char *env;
6758 :
6759 356 : int exit_code = 0;
6760 : struct timeval tv;
6761 :
6762 : /*
6763 : * Record difference between Unix time and instr_time time. We'll use
6764 : * this for logging and aggregation.
6765 : */
6766 356 : gettimeofday(&tv, NULL);
6767 356 : epoch_shift = tv.tv_sec * INT64CONST(1000000) + tv.tv_usec - pg_time_now();
6768 :
6769 356 : pg_logging_init(argv[0]);
6770 356 : progname = get_progname(argv[0]);
6771 :
6772 356 : if (argc > 1)
6773 : {
6774 356 : if (strcmp(argv[1], "--help") == 0 || strcmp(argv[1], "-?") == 0)
6775 : {
6776 2 : usage();
6777 2 : exit(0);
6778 : }
6779 354 : if (strcmp(argv[1], "--version") == 0 || strcmp(argv[1], "-V") == 0)
6780 : {
6781 2 : puts("pgbench (PostgreSQL) " PG_VERSION);
6782 2 : exit(0);
6783 : }
6784 : }
6785 :
6786 352 : state = (CState *) pg_malloc0(sizeof(CState));
6787 :
6788 : /* set random seed early, because it may be used while parsing scripts. */
6789 352 : if (!set_random_seed(getenv("PGBENCH_RANDOM_SEED")))
6790 0 : pg_fatal("error while setting random seed from PGBENCH_RANDOM_SEED environment variable");
6791 :
6792 2478 : while ((c = getopt_long(argc, argv, "b:c:Cd:D:f:F:h:iI:j:lL:M:nNp:P:qrR:s:St:T:U:v", long_options, &optindex)) != -1)
6793 : {
6794 : char *script;
6795 :
6796 2264 : switch (c)
6797 : {
6798 24 : case 'b':
6799 24 : if (strcmp(optarg, "list") == 0)
6800 : {
6801 2 : listAvailableScripts();
6802 2 : exit(0);
6803 : }
6804 22 : weight = parseScriptWeight(optarg, &script);
6805 18 : process_builtin(findBuiltin(script), weight);
6806 14 : benchmarking_option_set = true;
6807 14 : internal_script_used = true;
6808 14 : break;
6809 50 : case 'c':
6810 50 : benchmarking_option_set = true;
6811 50 : if (!option_parse_int(optarg, "-c/--clients", 1, INT_MAX,
6812 : &nclients))
6813 : {
6814 2 : exit(1);
6815 : }
6816 : #ifdef HAVE_GETRLIMIT
6817 48 : if (getrlimit(RLIMIT_NOFILE, &rlim) == -1)
6818 0 : pg_fatal("getrlimit failed: %m");
6819 :
6820 48 : if (rlim.rlim_max < nclients + 3)
6821 : {
6822 0 : pg_log_error("need at least %d open files, but system limit is %ld",
6823 : nclients + 3, (long) rlim.rlim_max);
6824 0 : pg_log_error_hint("Reduce number of clients, or use limit/ulimit to increase the system limit.");
6825 0 : exit(1);
6826 : }
6827 :
6828 48 : if (rlim.rlim_cur < nclients + 3)
6829 : {
6830 0 : rlim.rlim_cur = nclients + 3;
6831 0 : if (setrlimit(RLIMIT_NOFILE, &rlim) == -1)
6832 : {
6833 0 : pg_log_error("need at least %d open files, but couldn't raise the limit: %m",
6834 : nclients + 3);
6835 0 : pg_log_error_hint("Reduce number of clients, or use limit/ulimit to increase the system limit.");
6836 0 : exit(1);
6837 : }
6838 : }
6839 : #endif /* HAVE_GETRLIMIT */
6840 48 : break;
6841 4 : case 'C':
6842 4 : benchmarking_option_set = true;
6843 4 : is_connect = true;
6844 4 : break;
6845 0 : case 'd':
6846 0 : dbName = pg_strdup(optarg);
6847 0 : break;
6848 866 : case 'D':
6849 : {
6850 : char *p;
6851 :
6852 866 : benchmarking_option_set = true;
6853 :
6854 866 : if ((p = strchr(optarg, '=')) == NULL || p == optarg || *(p + 1) == '\0')
6855 2 : pg_fatal("invalid variable definition: \"%s\"", optarg);
6856 :
6857 864 : *p++ = '\0';
6858 864 : if (!putVariable(&state[0].variables, "option", optarg, p))
6859 0 : exit(1);
6860 : }
6861 864 : break;
6862 262 : case 'f':
6863 262 : weight = parseScriptWeight(optarg, &script);
6864 262 : process_file(script, weight);
6865 180 : benchmarking_option_set = true;
6866 180 : break;
6867 6 : case 'F':
6868 6 : initialization_option_set = true;
6869 6 : if (!option_parse_int(optarg, "-F/--fillfactor", 10, 100,
6870 : &fillfactor))
6871 2 : exit(1);
6872 4 : break;
6873 2 : case 'h':
6874 2 : pghost = pg_strdup(optarg);
6875 2 : break;
6876 18 : case 'i':
6877 18 : is_init_mode = true;
6878 18 : break;
6879 8 : case 'I':
6880 8 : pg_free(initialize_steps);
6881 8 : initialize_steps = pg_strdup(optarg);
6882 8 : checkInitSteps(initialize_steps);
6883 6 : initialization_option_set = true;
6884 6 : break;
6885 8 : case 'j': /* jobs */
6886 8 : benchmarking_option_set = true;
6887 8 : if (!option_parse_int(optarg, "-j/--jobs", 1, INT_MAX,
6888 : &nthreads))
6889 : {
6890 2 : exit(1);
6891 : }
6892 6 : break;
6893 14 : case 'l':
6894 14 : benchmarking_option_set = true;
6895 14 : use_log = true;
6896 14 : break;
6897 6 : case 'L':
6898 : {
6899 6 : double limit_ms = atof(optarg);
6900 :
6901 6 : if (limit_ms <= 0.0)
6902 2 : pg_fatal("invalid latency limit: \"%s\"", optarg);
6903 4 : benchmarking_option_set = true;
6904 4 : latency_limit = (int64) (limit_ms * 1000);
6905 : }
6906 4 : break;
6907 176 : case 'M':
6908 176 : benchmarking_option_set = true;
6909 482 : for (querymode = 0; querymode < NUM_QUERYMODE; querymode++)
6910 480 : if (strcmp(optarg, QUERYMODE[querymode]) == 0)
6911 174 : break;
6912 176 : if (querymode >= NUM_QUERYMODE)
6913 2 : pg_fatal("invalid query mode (-M): \"%s\"", optarg);
6914 174 : break;
6915 198 : case 'n':
6916 198 : is_no_vacuum = true;
6917 198 : break;
6918 2 : case 'N':
6919 2 : process_builtin(findBuiltin("simple-update"), 1);
6920 2 : benchmarking_option_set = true;
6921 2 : internal_script_used = true;
6922 2 : break;
6923 2 : case 'p':
6924 2 : pgport = pg_strdup(optarg);
6925 2 : break;
6926 4 : case 'P':
6927 4 : benchmarking_option_set = true;
6928 4 : if (!option_parse_int(optarg, "-P/--progress", 1, INT_MAX,
6929 : &progress))
6930 2 : exit(1);
6931 2 : break;
6932 2 : case 'q':
6933 2 : initialization_option_set = true;
6934 2 : use_quiet = true;
6935 2 : break;
6936 4 : case 'r':
6937 4 : benchmarking_option_set = true;
6938 4 : report_per_command = true;
6939 4 : break;
6940 6 : case 'R':
6941 : {
6942 : /* get a double from the beginning of option value */
6943 6 : double throttle_value = atof(optarg);
6944 :
6945 6 : benchmarking_option_set = true;
6946 :
6947 6 : if (throttle_value <= 0.0)
6948 2 : pg_fatal("invalid rate limit: \"%s\"", optarg);
6949 : /* Invert rate limit into per-transaction delay in usec */
6950 4 : throttle_delay = 1000000.0 / throttle_value;
6951 : }
6952 4 : break;
6953 6 : case 's':
6954 6 : scale_given = true;
6955 6 : if (!option_parse_int(optarg, "-s/--scale", 1, INT_MAX,
6956 : &scale))
6957 2 : exit(1);
6958 4 : break;
6959 268 : case 'S':
6960 268 : process_builtin(findBuiltin("select-only"), 1);
6961 266 : benchmarking_option_set = true;
6962 266 : internal_script_used = true;
6963 266 : break;
6964 220 : case 't':
6965 220 : benchmarking_option_set = true;
6966 220 : if (!option_parse_int(optarg, "-t/--transactions", 1, INT_MAX,
6967 : &nxacts))
6968 2 : exit(1);
6969 218 : break;
6970 10 : case 'T':
6971 10 : benchmarking_option_set = true;
6972 10 : if (!option_parse_int(optarg, "-T/--time", 1, INT_MAX,
6973 : &duration))
6974 2 : exit(1);
6975 8 : break;
6976 2 : case 'U':
6977 2 : username = pg_strdup(optarg);
6978 2 : break;
6979 2 : case 'v':
6980 2 : benchmarking_option_set = true;
6981 2 : do_vacuum_accounts = true;
6982 2 : break;
6983 4 : case 1: /* unlogged-tables */
6984 4 : initialization_option_set = true;
6985 4 : unlogged_tables = true;
6986 4 : break;
6987 2 : case 2: /* tablespace */
6988 2 : initialization_option_set = true;
6989 2 : tablespace = pg_strdup(optarg);
6990 2 : break;
6991 2 : case 3: /* index-tablespace */
6992 2 : initialization_option_set = true;
6993 2 : index_tablespace = pg_strdup(optarg);
6994 2 : break;
6995 10 : case 4: /* sampling-rate */
6996 10 : benchmarking_option_set = true;
6997 10 : sample_rate = atof(optarg);
6998 10 : if (sample_rate <= 0.0 || sample_rate > 1.0)
6999 2 : pg_fatal("invalid sampling rate: \"%s\"", optarg);
7000 8 : break;
7001 12 : case 5: /* aggregate-interval */
7002 12 : benchmarking_option_set = true;
7003 12 : if (!option_parse_int(optarg, "--aggregate-interval", 1, INT_MAX,
7004 : &agg_interval))
7005 2 : exit(1);
7006 10 : break;
7007 4 : case 6: /* progress-timestamp */
7008 4 : progress_timestamp = true;
7009 4 : benchmarking_option_set = true;
7010 4 : break;
7011 8 : case 7: /* log-prefix */
7012 8 : benchmarking_option_set = true;
7013 8 : logfile_prefix = pg_strdup(optarg);
7014 8 : break;
7015 4 : case 8: /* foreign-keys */
7016 4 : initialization_option_set = true;
7017 4 : foreign_keys = true;
7018 4 : break;
7019 8 : case 9: /* random-seed */
7020 8 : benchmarking_option_set = true;
7021 8 : if (!set_random_seed(optarg))
7022 2 : pg_fatal("error while setting random seed from --random-seed option");
7023 6 : break;
7024 2 : case 10: /* list */
7025 : {
7026 2 : const BuiltinScript *s = findBuiltin(optarg);
7027 :
7028 2 : fprintf(stderr, "-- %s: %s\n%s\n", s->name, s->desc, s->script);
7029 2 : exit(0);
7030 : }
7031 : break;
7032 6 : case 11: /* partitions */
7033 6 : initialization_option_set = true;
7034 6 : if (!option_parse_int(optarg, "--partitions", 0, INT_MAX,
7035 : &partitions))
7036 2 : exit(1);
7037 4 : break;
7038 6 : case 12: /* partition-method */
7039 6 : initialization_option_set = true;
7040 6 : if (pg_strcasecmp(optarg, "range") == 0)
7041 0 : partition_method = PART_RANGE;
7042 6 : else if (pg_strcasecmp(optarg, "hash") == 0)
7043 4 : partition_method = PART_HASH;
7044 : else
7045 2 : pg_fatal("invalid partition method, expecting \"range\" or \"hash\", got: \"%s\"",
7046 : optarg);
7047 4 : break;
7048 0 : case 13: /* failures-detailed */
7049 0 : benchmarking_option_set = true;
7050 0 : failures_detailed = true;
7051 0 : break;
7052 8 : case 14: /* max-tries */
7053 : {
7054 8 : int32 max_tries_arg = atoi(optarg);
7055 :
7056 8 : if (max_tries_arg < 0)
7057 2 : pg_fatal("invalid number of maximum tries: \"%s\"", optarg);
7058 :
7059 6 : benchmarking_option_set = true;
7060 6 : max_tries = (uint32) max_tries_arg;
7061 : }
7062 6 : break;
7063 4 : case 15: /* verbose-errors */
7064 4 : benchmarking_option_set = true;
7065 4 : verbose_errors = true;
7066 4 : break;
7067 4 : case 16: /* exit-on-abort */
7068 4 : benchmarking_option_set = true;
7069 4 : exit_on_abort = true;
7070 4 : break;
7071 4 : case 17: /* debug */
7072 4 : pg_logging_increase_verbosity();
7073 4 : break;
7074 6 : default:
7075 : /* getopt_long already emitted a complaint */
7076 6 : pg_log_error_hint("Try \"%s --help\" for more information.", progname);
7077 6 : exit(1);
7078 : }
7079 : }
7080 :
7081 : /* set default script if none */
7082 214 : if (num_scripts == 0 && !is_init_mode)
7083 : {
7084 22 : process_builtin(findBuiltin("tpcb-like"), 1);
7085 22 : benchmarking_option_set = true;
7086 22 : internal_script_used = true;
7087 : }
7088 :
7089 : /* complete SQL command initialization and compute total weight */
7090 440 : for (i = 0; i < num_scripts; i++)
7091 : {
7092 228 : Command **commands = sql_script[i].commands;
7093 :
7094 1456 : for (int j = 0; commands[j] != NULL; j++)
7095 1230 : if (commands[j]->type == SQL_COMMAND)
7096 584 : postprocess_sql_command(commands[j]);
7097 :
7098 : /* cannot overflow: weight is 32b, total_weight 64b */
7099 226 : total_weight += sql_script[i].weight;
7100 : }
7101 :
7102 212 : if (total_weight == 0 && !is_init_mode)
7103 2 : pg_fatal("total script weight must not be zero");
7104 :
7105 : /* show per script stats if several scripts are used */
7106 210 : if (num_scripts > 1)
7107 8 : per_script_stats = true;
7108 :
7109 : /*
7110 : * Don't need more threads than there are clients. (This is not merely an
7111 : * optimization; throttle_delay is calculated incorrectly below if some
7112 : * threads have no clients assigned to them.)
7113 : */
7114 210 : if (nthreads > nclients)
7115 2 : nthreads = nclients;
7116 :
7117 : /*
7118 : * Convert throttle_delay to a per-thread delay time. Note that this
7119 : * might be a fractional number of usec, but that's OK, since it's just
7120 : * the center of a Poisson distribution of delays.
7121 : */
7122 210 : throttle_delay *= nthreads;
7123 :
7124 210 : if (dbName == NULL)
7125 : {
7126 210 : if (argc > optind)
7127 2 : dbName = argv[optind++];
7128 : else
7129 : {
7130 208 : if ((env = getenv("PGDATABASE")) != NULL && *env != '\0')
7131 180 : dbName = env;
7132 28 : else if ((env = getenv("PGUSER")) != NULL && *env != '\0')
7133 0 : dbName = env;
7134 : else
7135 28 : dbName = get_user_name_or_exit(progname);
7136 : }
7137 : }
7138 :
7139 210 : if (optind < argc)
7140 : {
7141 0 : pg_log_error("too many command-line arguments (first is \"%s\")",
7142 : argv[optind]);
7143 0 : pg_log_error_hint("Try \"%s --help\" for more information.", progname);
7144 0 : exit(1);
7145 : }
7146 :
7147 210 : if (is_init_mode)
7148 : {
7149 10 : if (benchmarking_option_set)
7150 2 : pg_fatal("some of the specified options cannot be used in initialization (-i) mode");
7151 :
7152 8 : if (partitions == 0 && partition_method != PART_NONE)
7153 2 : pg_fatal("--partition-method requires greater than zero --partitions");
7154 :
7155 : /* set default method */
7156 6 : if (partitions > 0 && partition_method == PART_NONE)
7157 2 : partition_method = PART_RANGE;
7158 :
7159 6 : if (initialize_steps == NULL)
7160 2 : initialize_steps = pg_strdup(DEFAULT_INIT_STEPS);
7161 :
7162 6 : if (is_no_vacuum)
7163 : {
7164 : /* Remove any vacuum step in initialize_steps */
7165 : char *p;
7166 :
7167 8 : while ((p = strchr(initialize_steps, 'v')) != NULL)
7168 6 : *p = ' ';
7169 : }
7170 :
7171 6 : if (foreign_keys)
7172 : {
7173 : /* Add 'f' to end of initialize_steps, if not already there */
7174 4 : if (strchr(initialize_steps, 'f') == NULL)
7175 : {
7176 : initialize_steps = (char *)
7177 4 : pg_realloc(initialize_steps,
7178 4 : strlen(initialize_steps) + 2);
7179 4 : strcat(initialize_steps, "f");
7180 : }
7181 : }
7182 :
7183 6 : runInitSteps(initialize_steps);
7184 6 : exit(0);
7185 : }
7186 : else
7187 : {
7188 200 : if (initialization_option_set)
7189 4 : pg_fatal("some of the specified options cannot be used in benchmarking mode");
7190 : }
7191 :
7192 196 : if (nxacts > 0 && duration > 0)
7193 4 : pg_fatal("specify either a number of transactions (-t) or a duration (-T), not both");
7194 :
7195 : /* Use DEFAULT_NXACTS if neither nxacts nor duration is specified. */
7196 192 : if (nxacts <= 0 && duration <= 0)
7197 16 : nxacts = DEFAULT_NXACTS;
7198 :
7199 : /* --sampling-rate may be used only with -l */
7200 192 : if (sample_rate > 0.0 && !use_log)
7201 2 : pg_fatal("log sampling (--sampling-rate) is allowed only when logging transactions (-l)");
7202 :
7203 : /* --sampling-rate may not be used with --aggregate-interval */
7204 190 : if (sample_rate > 0.0 && agg_interval > 0)
7205 2 : pg_fatal("log sampling (--sampling-rate) and aggregation (--aggregate-interval) cannot be used at the same time");
7206 :
7207 188 : if (agg_interval > 0 && !use_log)
7208 2 : pg_fatal("log aggregation is allowed only when actually logging transactions");
7209 :
7210 186 : if (!use_log && logfile_prefix)
7211 2 : pg_fatal("log file prefix (--log-prefix) is allowed only when logging transactions (-l)");
7212 :
7213 184 : if (duration > 0 && agg_interval > duration)
7214 2 : pg_fatal("number of seconds for aggregation (%d) must not be higher than test duration (%d)", agg_interval, duration);
7215 :
7216 182 : if (duration > 0 && agg_interval > 0 && duration % agg_interval != 0)
7217 2 : pg_fatal("duration (%d) must be a multiple of aggregation interval (%d)", duration, agg_interval);
7218 :
7219 180 : if (progress_timestamp && progress == 0)
7220 2 : pg_fatal("--progress-timestamp is allowed only under --progress");
7221 :
7222 178 : if (!max_tries)
7223 : {
7224 2 : if (!latency_limit && duration <= 0)
7225 2 : pg_fatal("an unlimited number of transaction tries can only be used with --latency-limit or a duration (-T)");
7226 : }
7227 :
7228 : /*
7229 : * save main process id in the global variable because process id will be
7230 : * changed after fork.
7231 : */
7232 176 : main_pid = (int) getpid();
7233 :
7234 176 : if (nclients > 1)
7235 : {
7236 30 : state = (CState *) pg_realloc(state, sizeof(CState) * nclients);
7237 30 : memset(state + 1, 0, sizeof(CState) * (nclients - 1));
7238 :
7239 : /* copy any -D switch values to all clients */
7240 110 : for (i = 1; i < nclients; i++)
7241 : {
7242 : int j;
7243 :
7244 80 : state[i].id = i;
7245 82 : for (j = 0; j < state[0].variables.nvars; j++)
7246 : {
7247 2 : Variable *var = &state[0].variables.vars[j];
7248 :
7249 2 : if (var->value.type != PGBT_NO_VALUE)
7250 : {
7251 0 : if (!putVariableValue(&state[i].variables, "startup",
7252 0 : var->name, &var->value))
7253 0 : exit(1);
7254 : }
7255 : else
7256 : {
7257 2 : if (!putVariable(&state[i].variables, "startup",
7258 2 : var->name, var->svalue))
7259 0 : exit(1);
7260 : }
7261 : }
7262 : }
7263 : }
7264 :
7265 : /* other CState initializations */
7266 432 : for (i = 0; i < nclients; i++)
7267 : {
7268 256 : state[i].cstack = conditional_stack_create();
7269 256 : initRandomState(&state[i].cs_func_rs);
7270 : }
7271 :
7272 : /* opening connection... */
7273 176 : con = doConnect();
7274 176 : if (con == NULL)
7275 2 : pg_fatal("could not create connection for setup");
7276 :
7277 : /* report pgbench and server versions */
7278 174 : printVersion(con);
7279 :
7280 174 : pg_log_debug("pghost: %s pgport: %s nclients: %d %s: %d dbName: %s",
7281 : PQhost(con), PQport(con), nclients,
7282 : duration <= 0 ? "nxacts" : "duration",
7283 : duration <= 0 ? nxacts : duration, PQdb(con));
7284 :
7285 174 : if (internal_script_used)
7286 14 : GetTableInfo(con, scale_given);
7287 :
7288 : /*
7289 : * :scale variables normally get -s or database scale, but don't override
7290 : * an explicit -D switch
7291 : */
7292 172 : if (lookupVariable(&state[0].variables, "scale") == NULL)
7293 : {
7294 424 : for (i = 0; i < nclients; i++)
7295 : {
7296 252 : if (!putVariableInt(&state[i].variables, "startup", "scale", scale))
7297 0 : exit(1);
7298 : }
7299 : }
7300 :
7301 : /*
7302 : * Define a :client_id variable that is unique per connection. But don't
7303 : * override an explicit -D switch.
7304 : */
7305 172 : if (lookupVariable(&state[0].variables, "client_id") == NULL)
7306 : {
7307 424 : for (i = 0; i < nclients; i++)
7308 252 : if (!putVariableInt(&state[i].variables, "startup", "client_id", i))
7309 0 : exit(1);
7310 : }
7311 :
7312 : /* set default seed for hash functions */
7313 172 : if (lookupVariable(&state[0].variables, "default_seed") == NULL)
7314 : {
7315 172 : uint64 seed = pg_prng_uint64(&base_random_sequence);
7316 :
7317 424 : for (i = 0; i < nclients; i++)
7318 252 : if (!putVariableInt(&state[i].variables, "startup", "default_seed",
7319 : (int64) seed))
7320 0 : exit(1);
7321 : }
7322 :
7323 : /* set random seed unless overwritten */
7324 172 : if (lookupVariable(&state[0].variables, "random_seed") == NULL)
7325 : {
7326 424 : for (i = 0; i < nclients; i++)
7327 252 : if (!putVariableInt(&state[i].variables, "startup", "random_seed",
7328 : random_seed))
7329 0 : exit(1);
7330 : }
7331 :
7332 172 : if (!is_no_vacuum)
7333 : {
7334 20 : fprintf(stderr, "starting vacuum...");
7335 20 : tryExecuteStatement(con, "vacuum pgbench_branches");
7336 20 : tryExecuteStatement(con, "vacuum pgbench_tellers");
7337 20 : tryExecuteStatement(con, "truncate pgbench_history");
7338 20 : fprintf(stderr, "end.\n");
7339 :
7340 20 : if (do_vacuum_accounts)
7341 : {
7342 0 : fprintf(stderr, "starting vacuum pgbench_accounts...");
7343 0 : tryExecuteStatement(con, "vacuum analyze pgbench_accounts");
7344 0 : fprintf(stderr, "end.\n");
7345 : }
7346 : }
7347 172 : PQfinish(con);
7348 :
7349 : /* set up thread data structures */
7350 172 : threads = (TState *) pg_malloc(sizeof(TState) * nthreads);
7351 172 : nclients_dealt = 0;
7352 :
7353 346 : for (i = 0; i < nthreads; i++)
7354 : {
7355 174 : TState *thread = &threads[i];
7356 :
7357 174 : thread->tid = i;
7358 174 : thread->state = &state[nclients_dealt];
7359 174 : thread->nstate =
7360 174 : (nclients - nclients_dealt + nthreads - i - 1) / (nthreads - i);
7361 174 : initRandomState(&thread->ts_choose_rs);
7362 174 : initRandomState(&thread->ts_throttle_rs);
7363 174 : initRandomState(&thread->ts_sample_rs);
7364 174 : thread->logfile = NULL; /* filled in later */
7365 174 : thread->latency_late = 0;
7366 174 : initStats(&thread->stats, 0);
7367 :
7368 174 : nclients_dealt += thread->nstate;
7369 : }
7370 :
7371 : /* all clients must be assigned to a thread */
7372 : Assert(nclients_dealt == nclients);
7373 :
7374 : /* get start up time for the whole computation */
7375 172 : start_time = pg_time_now();
7376 :
7377 : /* set alarm if duration is specified. */
7378 172 : if (duration > 0)
7379 0 : setalarm(duration);
7380 :
7381 172 : errno = THREAD_BARRIER_INIT(&barrier, nthreads);
7382 172 : if (errno != 0)
7383 0 : pg_fatal("could not initialize barrier: %m");
7384 :
7385 : /* start all threads but thread 0 which is executed directly later */
7386 174 : for (i = 1; i < nthreads; i++)
7387 : {
7388 2 : TState *thread = &threads[i];
7389 :
7390 2 : thread->create_time = pg_time_now();
7391 2 : errno = THREAD_CREATE(&thread->thread, threadRun, thread);
7392 :
7393 2 : if (errno != 0)
7394 0 : pg_fatal("could not create thread: %m");
7395 : }
7396 :
7397 : /* compute when to stop */
7398 172 : threads[0].create_time = pg_time_now();
7399 172 : if (duration > 0)
7400 0 : end_time = threads[0].create_time + (int64) 1000000 * duration;
7401 :
7402 : /* run thread 0 directly */
7403 172 : (void) threadRun(&threads[0]);
7404 :
7405 : /* wait for other threads and accumulate results */
7406 170 : initStats(&stats, 0);
7407 170 : conn_total_duration = 0;
7408 :
7409 340 : for (i = 0; i < nthreads; i++)
7410 : {
7411 170 : TState *thread = &threads[i];
7412 :
7413 170 : if (i > 0)
7414 0 : THREAD_JOIN(thread->thread);
7415 :
7416 418 : for (int j = 0; j < thread->nstate; j++)
7417 248 : if (thread->state[j].state != CSTATE_FINISHED)
7418 102 : exit_code = 2;
7419 :
7420 : /* aggregate thread level stats */
7421 170 : mergeSimpleStats(&stats.latency, &thread->stats.latency);
7422 170 : mergeSimpleStats(&stats.lag, &thread->stats.lag);
7423 170 : stats.cnt += thread->stats.cnt;
7424 170 : stats.skipped += thread->stats.skipped;
7425 170 : stats.retries += thread->stats.retries;
7426 170 : stats.retried += thread->stats.retried;
7427 170 : stats.serialization_failures += thread->stats.serialization_failures;
7428 170 : stats.deadlock_failures += thread->stats.deadlock_failures;
7429 170 : latency_late += thread->latency_late;
7430 170 : conn_total_duration += thread->conn_duration;
7431 :
7432 : /* first recorded benchmarking start time */
7433 170 : if (bench_start == 0 || thread->bench_start < bench_start)
7434 170 : bench_start = thread->bench_start;
7435 : }
7436 :
7437 : /*
7438 : * All connections should be already closed in threadRun(), so this
7439 : * disconnect_all() will be a no-op, but clean up the connections just to
7440 : * be sure. We don't need to measure the disconnection delays here.
7441 : */
7442 170 : disconnect_all(state, nclients);
7443 :
7444 : /*
7445 : * Beware that performance of short benchmarks with many threads and
7446 : * possibly long transactions can be deceptive because threads do not
7447 : * start and finish at the exact same time. The total duration computed
7448 : * here encompasses all transactions so that tps shown is somehow slightly
7449 : * underestimated.
7450 : */
7451 170 : printResults(&stats, pg_time_now() - bench_start, conn_total_duration,
7452 : bench_start - start_time, latency_late);
7453 :
7454 170 : THREAD_BARRIER_DESTROY(&barrier);
7455 :
7456 170 : if (exit_code != 0)
7457 102 : pg_log_error("Run was aborted; the above results are incomplete.");
7458 :
7459 170 : return exit_code;
7460 : }
7461 :
7462 : static THREAD_FUNC_RETURN_TYPE THREAD_FUNC_CC
7463 174 : threadRun(void *arg)
7464 : {
7465 174 : TState *thread = (TState *) arg;
7466 174 : CState *state = thread->state;
7467 : pg_time_usec_t start;
7468 174 : int nstate = thread->nstate;
7469 174 : int remains = nstate; /* number of remaining clients */
7470 174 : socket_set *sockets = alloc_socket_set(nstate);
7471 : int64 thread_start,
7472 : last_report,
7473 : next_report;
7474 : StatsData last,
7475 : aggs;
7476 :
7477 : /* open log file if requested */
7478 174 : if (use_log)
7479 : {
7480 : char logpath[MAXPGPATH];
7481 4 : char *prefix = logfile_prefix ? logfile_prefix : "pgbench_log";
7482 :
7483 4 : if (thread->tid == 0)
7484 4 : snprintf(logpath, sizeof(logpath), "%s.%d", prefix, main_pid);
7485 : else
7486 0 : snprintf(logpath, sizeof(logpath), "%s.%d.%d", prefix, main_pid, thread->tid);
7487 :
7488 4 : thread->logfile = fopen(logpath, "w");
7489 :
7490 4 : if (thread->logfile == NULL)
7491 0 : pg_fatal("could not open logfile \"%s\": %m", logpath);
7492 : }
7493 :
7494 : /* explicitly initialize the state machines */
7495 426 : for (int i = 0; i < nstate; i++)
7496 252 : state[i].state = CSTATE_CHOOSE_SCRIPT;
7497 :
7498 : /* READY */
7499 174 : THREAD_BARRIER_WAIT(&barrier);
7500 :
7501 174 : thread_start = pg_time_now();
7502 174 : thread->started_time = thread_start;
7503 174 : thread->conn_duration = 0;
7504 174 : last_report = thread_start;
7505 174 : next_report = last_report + (int64) 1000000 * progress;
7506 :
7507 : /* STEADY */
7508 174 : if (!is_connect)
7509 : {
7510 : /* make connections to the database before starting */
7511 408 : for (int i = 0; i < nstate; i++)
7512 : {
7513 238 : if ((state[i].con = doConnect()) == NULL)
7514 : {
7515 : /* coldly abort on initial connection failure */
7516 0 : pg_fatal("could not create connection for client %d",
7517 : state[i].id);
7518 : }
7519 : }
7520 : }
7521 :
7522 : /* GO */
7523 174 : THREAD_BARRIER_WAIT(&barrier);
7524 :
7525 174 : start = pg_time_now();
7526 174 : thread->bench_start = start;
7527 174 : thread->throttle_trigger = start;
7528 :
7529 : /*
7530 : * The log format currently has Unix epoch timestamps with whole numbers
7531 : * of seconds. Round the first aggregate's start time down to the nearest
7532 : * Unix epoch second (the very first aggregate might really have started a
7533 : * fraction of a second later, but later aggregates are measured from the
7534 : * whole number time that is actually logged).
7535 : */
7536 174 : initStats(&aggs, (start + epoch_shift) / 1000000 * 1000000);
7537 174 : last = aggs;
7538 :
7539 : /* loop till all clients have terminated */
7540 32866 : while (remains > 0)
7541 : {
7542 : int nsocks; /* number of sockets to be waited for */
7543 : pg_time_usec_t min_usec;
7544 32696 : pg_time_usec_t now = 0; /* set this only if needed */
7545 :
7546 : /*
7547 : * identify which client sockets should be checked for input, and
7548 : * compute the nearest time (if any) at which we need to wake up.
7549 : */
7550 32696 : clear_socket_set(sockets);
7551 32696 : nsocks = 0;
7552 32696 : min_usec = PG_INT64_MAX;
7553 147220 : for (int i = 0; i < nstate; i++)
7554 : {
7555 128858 : CState *st = &state[i];
7556 :
7557 128858 : if (st->state == CSTATE_SLEEP || st->state == CSTATE_THROTTLE)
7558 6 : {
7559 : /* a nap from the script, or under throttling */
7560 : pg_time_usec_t this_usec;
7561 :
7562 : /* get current time if needed */
7563 6 : pg_time_now_lazy(&now);
7564 :
7565 : /* min_usec should be the minimum delay across all clients */
7566 12 : this_usec = (st->state == CSTATE_SLEEP ?
7567 6 : st->sleep_until : st->txn_scheduled) - now;
7568 6 : if (min_usec > this_usec)
7569 6 : min_usec = this_usec;
7570 : }
7571 128852 : else if (st->state == CSTATE_WAIT_RESULT ||
7572 22154 : st->state == CSTATE_WAIT_ROLLBACK_RESULT)
7573 106700 : {
7574 : /*
7575 : * waiting for result from server - nothing to do unless the
7576 : * socket is readable
7577 : */
7578 106700 : int sock = PQsocket(st->con);
7579 :
7580 106700 : if (sock < 0)
7581 : {
7582 0 : pg_log_error("invalid socket: %s", PQerrorMessage(st->con));
7583 2 : goto done;
7584 : }
7585 :
7586 106700 : add_socket_to_set(sockets, sock, nsocks++);
7587 : }
7588 22152 : else if (st->state != CSTATE_ABORTED &&
7589 22152 : st->state != CSTATE_FINISHED)
7590 : {
7591 : /*
7592 : * This client thread is ready to do something, so we don't
7593 : * want to wait. No need to examine additional clients.
7594 : */
7595 14334 : min_usec = 0;
7596 14334 : break;
7597 : }
7598 : }
7599 :
7600 : /* also wake up to print the next progress report on time */
7601 32696 : if (progress && min_usec > 0 && thread->tid == 0)
7602 : {
7603 0 : pg_time_now_lazy(&now);
7604 :
7605 0 : if (now >= next_report)
7606 0 : min_usec = 0;
7607 0 : else if ((next_report - now) < min_usec)
7608 0 : min_usec = next_report - now;
7609 : }
7610 :
7611 : /*
7612 : * If no clients are ready to execute actions, sleep until we receive
7613 : * data on some client socket or the timeout (if any) elapses.
7614 : */
7615 32696 : if (min_usec > 0)
7616 : {
7617 18362 : int rc = 0;
7618 :
7619 18362 : if (min_usec != PG_INT64_MAX)
7620 : {
7621 6 : if (nsocks > 0)
7622 : {
7623 0 : rc = wait_on_socket_set(sockets, min_usec);
7624 : }
7625 : else /* nothing active, simple sleep */
7626 : {
7627 6 : pg_usleep(min_usec);
7628 : }
7629 : }
7630 : else /* no explicit delay, wait without timeout */
7631 : {
7632 18356 : rc = wait_on_socket_set(sockets, 0);
7633 : }
7634 :
7635 18360 : if (rc < 0)
7636 : {
7637 0 : if (errno == EINTR)
7638 : {
7639 : /* On EINTR, go back to top of loop */
7640 0 : continue;
7641 : }
7642 : /* must be something wrong */
7643 0 : pg_log_error("%s() failed: %m", SOCKET_WAIT_METHOD);
7644 0 : goto done;
7645 : }
7646 : }
7647 : else
7648 : {
7649 : /* min_usec <= 0, i.e. something needs to be executed now */
7650 :
7651 : /* If we didn't wait, don't try to read any data */
7652 14334 : clear_socket_set(sockets);
7653 : }
7654 :
7655 : /* ok, advance the state machine of each connection */
7656 32694 : nsocks = 0;
7657 190290 : for (int i = 0; i < nstate; i++)
7658 : {
7659 157598 : CState *st = &state[i];
7660 :
7661 157598 : if (st->state == CSTATE_WAIT_RESULT ||
7662 24554 : st->state == CSTATE_WAIT_ROLLBACK_RESULT)
7663 19962 : {
7664 : /* don't call advanceConnectionState unless data is available */
7665 133046 : int sock = PQsocket(st->con);
7666 :
7667 133046 : if (sock < 0)
7668 : {
7669 0 : pg_log_error("invalid socket: %s", PQerrorMessage(st->con));
7670 0 : goto done;
7671 : }
7672 :
7673 133046 : if (!socket_has_input(sockets, sock, nsocks++))
7674 113084 : continue;
7675 : }
7676 24552 : else if (st->state == CSTATE_FINISHED ||
7677 15494 : st->state == CSTATE_ABORTED)
7678 : {
7679 : /* this client is done, no need to consider it anymore */
7680 9058 : continue;
7681 : }
7682 :
7683 35456 : advanceConnectionState(thread, st, &aggs);
7684 :
7685 : /*
7686 : * If --exit-on-abort is used, the program is going to exit when
7687 : * any client is aborted.
7688 : */
7689 35456 : if (exit_on_abort && st->state == CSTATE_ABORTED)
7690 2 : goto done;
7691 :
7692 : /*
7693 : * If advanceConnectionState changed client to finished state,
7694 : * that's one fewer client that remains.
7695 : */
7696 35454 : else if (st->state == CSTATE_FINISHED ||
7697 35308 : st->state == CSTATE_ABORTED)
7698 248 : remains--;
7699 : }
7700 :
7701 : /* progress report is made by thread 0 for all threads */
7702 32692 : if (progress && thread->tid == 0)
7703 : {
7704 0 : pg_time_usec_t now2 = pg_time_now();
7705 :
7706 0 : if (now2 >= next_report)
7707 : {
7708 : /*
7709 : * Horrible hack: this relies on the thread pointer we are
7710 : * passed to be equivalent to threads[0], that is the first
7711 : * entry of the threads array. That is why this MUST be done
7712 : * by thread 0 and not any other.
7713 : */
7714 0 : printProgressReport(thread, thread_start, now2,
7715 : &last, &last_report);
7716 :
7717 : /*
7718 : * Ensure that the next report is in the future, in case
7719 : * pgbench/postgres got stuck somewhere.
7720 : */
7721 : do
7722 : {
7723 0 : next_report += (int64) 1000000 * progress;
7724 0 : } while (now2 >= next_report);
7725 : }
7726 : }
7727 : }
7728 :
7729 170 : done:
7730 172 : if (exit_on_abort)
7731 : {
7732 : /*
7733 : * Abort if any client is not finished, meaning some error occurred.
7734 : */
7735 6 : for (int i = 0; i < nstate; i++)
7736 : {
7737 4 : if (state[i].state != CSTATE_FINISHED)
7738 : {
7739 2 : pg_log_error("Run was aborted due to an error in thread %d",
7740 : thread->tid);
7741 2 : exit(2);
7742 : }
7743 : }
7744 : }
7745 :
7746 170 : disconnect_all(state, nstate);
7747 :
7748 170 : if (thread->logfile)
7749 : {
7750 4 : if (agg_interval > 0)
7751 : {
7752 : /* log aggregated but not yet reported transactions */
7753 0 : doLog(thread, state, &aggs, false, 0, 0);
7754 : }
7755 4 : fclose(thread->logfile);
7756 4 : thread->logfile = NULL;
7757 : }
7758 170 : free_socket_set(sockets);
7759 170 : THREAD_FUNC_RETURN;
7760 : }
7761 :
7762 : static void
7763 966 : finishCon(CState *st)
7764 : {
7765 966 : if (st->con != NULL)
7766 : {
7767 456 : PQfinish(st->con);
7768 456 : st->con = NULL;
7769 : }
7770 966 : }
7771 :
7772 : /*
7773 : * Support for duration option: set timer_exceeded after so many seconds.
7774 : */
7775 :
7776 : #ifndef WIN32
7777 :
7778 : static void
7779 0 : handle_sig_alarm(SIGNAL_ARGS)
7780 : {
7781 0 : timer_exceeded = true;
7782 0 : }
7783 :
7784 : static void
7785 0 : setalarm(int seconds)
7786 : {
7787 0 : pqsignal(SIGALRM, handle_sig_alarm);
7788 0 : alarm(seconds);
7789 0 : }
7790 :
7791 : #else /* WIN32 */
7792 :
7793 : static VOID CALLBACK
7794 : win32_timer_callback(PVOID lpParameter, BOOLEAN TimerOrWaitFired)
7795 : {
7796 : timer_exceeded = true;
7797 : }
7798 :
7799 : static void
7800 : setalarm(int seconds)
7801 : {
7802 : HANDLE queue;
7803 : HANDLE timer;
7804 :
7805 : /* This function will be called at most once, so we can cheat a bit. */
7806 : queue = CreateTimerQueue();
7807 : if (seconds > ((DWORD) -1) / 1000 ||
7808 : !CreateTimerQueueTimer(&timer, queue,
7809 : win32_timer_callback, NULL, seconds * 1000, 0,
7810 : WT_EXECUTEINTIMERTHREAD | WT_EXECUTEONLYONCE))
7811 : pg_fatal("failed to set timer");
7812 : }
7813 :
7814 : #endif /* WIN32 */
7815 :
7816 :
7817 : /*
7818 : * These functions provide an abstraction layer that hides the syscall
7819 : * we use to wait for input on a set of sockets.
7820 : *
7821 : * Currently there are two implementations, based on ppoll(2) and select(2).
7822 : * ppoll() is preferred where available due to its typically higher ceiling
7823 : * on the number of usable sockets. We do not use the more-widely-available
7824 : * poll(2) because it only offers millisecond timeout resolution, which could
7825 : * be problematic with high --rate settings.
7826 : *
7827 : * Function APIs:
7828 : *
7829 : * alloc_socket_set: allocate an empty socket set with room for up to
7830 : * "count" sockets.
7831 : *
7832 : * free_socket_set: deallocate a socket set.
7833 : *
7834 : * clear_socket_set: reset a socket set to empty.
7835 : *
7836 : * add_socket_to_set: add socket with indicated FD to slot "idx" in the
7837 : * socket set. Slots must be filled in order, starting with 0.
7838 : *
7839 : * wait_on_socket_set: wait for input on any socket in set, or for timeout
7840 : * to expire. timeout is measured in microseconds; 0 means wait forever.
7841 : * Returns result code of underlying syscall (>=0 if OK, else see errno).
7842 : *
7843 : * socket_has_input: after waiting, call this to see if given socket has
7844 : * input. fd and idx parameters should match some previous call to
7845 : * add_socket_to_set.
7846 : *
7847 : * Note that wait_on_socket_set destructively modifies the state of the
7848 : * socket set. After checking for input, caller must apply clear_socket_set
7849 : * and add_socket_to_set again before waiting again.
7850 : */
7851 :
7852 : #ifdef POLL_USING_PPOLL
7853 :
7854 : static socket_set *
7855 174 : alloc_socket_set(int count)
7856 : {
7857 : socket_set *sa;
7858 :
7859 174 : sa = (socket_set *) pg_malloc0(offsetof(socket_set, pollfds) +
7860 : sizeof(struct pollfd) * count);
7861 174 : sa->maxfds = count;
7862 174 : sa->curfds = 0;
7863 174 : return sa;
7864 : }
7865 :
7866 : static void
7867 170 : free_socket_set(socket_set *sa)
7868 : {
7869 170 : pg_free(sa);
7870 170 : }
7871 :
7872 : static void
7873 47030 : clear_socket_set(socket_set *sa)
7874 : {
7875 47030 : sa->curfds = 0;
7876 47030 : }
7877 :
7878 : static void
7879 106700 : add_socket_to_set(socket_set *sa, int fd, int idx)
7880 : {
7881 : Assert(idx < sa->maxfds && idx == sa->curfds);
7882 106700 : sa->pollfds[idx].fd = fd;
7883 106700 : sa->pollfds[idx].events = POLLIN;
7884 106700 : sa->pollfds[idx].revents = 0;
7885 106700 : sa->curfds++;
7886 106700 : }
7887 :
7888 : static int
7889 18356 : wait_on_socket_set(socket_set *sa, int64 usecs)
7890 : {
7891 18356 : if (usecs > 0)
7892 : {
7893 : struct timespec timeout;
7894 :
7895 0 : timeout.tv_sec = usecs / 1000000;
7896 0 : timeout.tv_nsec = (usecs % 1000000) * 1000;
7897 0 : return ppoll(sa->pollfds, sa->curfds, &timeout, NULL);
7898 : }
7899 : else
7900 : {
7901 18356 : return ppoll(sa->pollfds, sa->curfds, NULL, NULL);
7902 : }
7903 : }
7904 :
7905 : static bool
7906 133046 : socket_has_input(socket_set *sa, int fd, int idx)
7907 : {
7908 : /*
7909 : * In some cases, threadRun will apply clear_socket_set and then try to
7910 : * apply socket_has_input anyway with arguments that it used before that,
7911 : * or might've used before that except that it exited its setup loop
7912 : * early. Hence, if the socket set is empty, silently return false
7913 : * regardless of the parameters. If it's not empty, we can Assert that
7914 : * the parameters match a previous call.
7915 : */
7916 133046 : if (sa->curfds == 0)
7917 51500 : return false;
7918 :
7919 : Assert(idx < sa->curfds && sa->pollfds[idx].fd == fd);
7920 81546 : return (sa->pollfds[idx].revents & POLLIN) != 0;
7921 : }
7922 :
7923 : #endif /* POLL_USING_PPOLL */
7924 :
7925 : #ifdef POLL_USING_SELECT
7926 :
7927 : static socket_set *
7928 : alloc_socket_set(int count)
7929 : {
7930 : return (socket_set *) pg_malloc0(sizeof(socket_set));
7931 : }
7932 :
7933 : static void
7934 : free_socket_set(socket_set *sa)
7935 : {
7936 : pg_free(sa);
7937 : }
7938 :
7939 : static void
7940 : clear_socket_set(socket_set *sa)
7941 : {
7942 : FD_ZERO(&sa->fds);
7943 : sa->maxfd = -1;
7944 : }
7945 :
7946 : static void
7947 : add_socket_to_set(socket_set *sa, int fd, int idx)
7948 : {
7949 : /* See connect_slot() for background on this code. */
7950 : #ifdef WIN32
7951 : if (sa->fds.fd_count + 1 >= FD_SETSIZE)
7952 : {
7953 : pg_log_error("too many concurrent database clients for this platform: %d",
7954 : sa->fds.fd_count + 1);
7955 : exit(1);
7956 : }
7957 : #else
7958 : if (fd < 0 || fd >= FD_SETSIZE)
7959 : {
7960 : pg_log_error("socket file descriptor out of range for select(): %d",
7961 : fd);
7962 : pg_log_error_hint("Try fewer concurrent database clients.");
7963 : exit(1);
7964 : }
7965 : #endif
7966 : FD_SET(fd, &sa->fds);
7967 : if (fd > sa->maxfd)
7968 : sa->maxfd = fd;
7969 : }
7970 :
7971 : static int
7972 : wait_on_socket_set(socket_set *sa, int64 usecs)
7973 : {
7974 : if (usecs > 0)
7975 : {
7976 : struct timeval timeout;
7977 :
7978 : timeout.tv_sec = usecs / 1000000;
7979 : timeout.tv_usec = usecs % 1000000;
7980 : return select(sa->maxfd + 1, &sa->fds, NULL, NULL, &timeout);
7981 : }
7982 : else
7983 : {
7984 : return select(sa->maxfd + 1, &sa->fds, NULL, NULL, NULL);
7985 : }
7986 : }
7987 :
7988 : static bool
7989 : socket_has_input(socket_set *sa, int fd, int idx)
7990 : {
7991 : return (FD_ISSET(fd, &sa->fds) != 0);
7992 : }
7993 :
7994 : #endif /* POLL_USING_SELECT */
|