LCOV - code coverage report
Current view: top level - src/bin/pg_archivecleanup - pg_archivecleanup.c (source / functions) Hit Total Coverage
Test: PostgreSQL 18devel Lines: 129 133 97.0 %
Date: 2025-01-18 04:15:08 Functions: 6 6 100.0 %
Legend: Lines: hit not hit

          Line data    Source code
       1             : /*
       2             :  * pg_archivecleanup.c
       3             :  *
       4             :  * To be used as archive_cleanup_command to clean an archive when using
       5             :  * standby mode.
       6             :  *
       7             :  * src/bin/pg_archivecleanup/pg_archivecleanup.c
       8             :  */
       9             : #include "postgres_fe.h"
      10             : 
      11             : #include <ctype.h>
      12             : #include <dirent.h>
      13             : #include <sys/stat.h>
      14             : #include <fcntl.h>
      15             : #include <signal.h>
      16             : #include <sys/time.h>
      17             : 
      18             : #include "access/xlog_internal.h"
      19             : #include "common/logging.h"
      20             : #include "getopt_long.h"
      21             : 
      22             : static const char *progname;
      23             : 
      24             : /* Options and defaults */
      25             : static bool dryrun = false;     /* are we performing a dry-run operation? */
      26             : static bool cleanBackupHistory = false; /* remove files including backup
      27             :                                          * history files */
      28             : static char *additional_ext = NULL; /* Extension to remove from filenames */
      29             : 
      30             : static char *archiveLocation;   /* where to find the archive? */
      31             : static char *restartWALFileName;    /* the file from which we can restart
      32             :                                      * restore */
      33             : static char exclusiveCleanupFileName[MAXFNAMELEN];  /* the oldest file we want
      34             :                                                      * to remain in archive */
      35             : 
      36             : 
      37             : /* =====================================================================
      38             :  *
      39             :  *        Customizable section
      40             :  *
      41             :  * =====================================================================
      42             :  *
      43             :  *  Currently, this section assumes that the Archive is a locally
      44             :  *  accessible directory. If you want to make other assumptions,
      45             :  *  such as using a vendor-specific archive and access API, these
      46             :  *  routines are the ones you'll need to change. You're
      47             :  *  encouraged to submit any changes to pgsql-hackers@lists.postgresql.org
      48             :  *  or personally to the current maintainer. Those changes may be
      49             :  *  folded in to later versions of this program.
      50             :  */
      51             : 
      52             : /*
      53             :  *  Initialize allows customized commands to be added to the archive cleanup program.
      54             :  *
      55             :  *  You may wish to add code to check for tape libraries, etc.
      56             :  */
      57             : static void
      58          14 : Initialize(void)
      59             : {
      60             :     /*
      61             :      * This code assumes that archiveLocation is a directory, so we use stat
      62             :      * to test if it's accessible.
      63             :      */
      64             :     struct stat stat_buf;
      65             : 
      66          14 :     if (stat(archiveLocation, &stat_buf) != 0 ||
      67          12 :         !S_ISDIR(stat_buf.st_mode))
      68             :     {
      69           2 :         pg_log_error("archive location \"%s\" does not exist",
      70             :                      archiveLocation);
      71           2 :         exit(2);
      72             :     }
      73          12 : }
      74             : 
      75             : static void
      76          82 : TrimExtension(char *filename, char *extension)
      77             : {
      78             :     int         flen;
      79             :     int         elen;
      80             : 
      81          82 :     if (extension == NULL)
      82          28 :         return;
      83             : 
      84          54 :     elen = strlen(extension);
      85          54 :     flen = strlen(filename);
      86             : 
      87          54 :     if (flen > elen && strcmp(filename + flen - elen, extension) == 0)
      88           6 :         filename[flen - elen] = '\0';
      89             : }
      90             : 
      91             : static void
      92          10 : CleanupPriorWALFiles(void)
      93             : {
      94             :     int         rc;
      95             :     DIR        *xldir;
      96             :     struct dirent *xlde;
      97             :     char        walfile[MAXPGPATH];
      98             : 
      99          10 :     xldir = opendir(archiveLocation);
     100          10 :     if (xldir == NULL)
     101           0 :         pg_fatal("could not open archive location \"%s\": %m",
     102             :                  archiveLocation);
     103             : 
     104          80 :     while (errno = 0, (xlde = readdir(xldir)) != NULL)
     105             :     {
     106             :         char        WALFilePath[MAXPGPATH * 2]; /* the file path including
     107             :                                                  * archive */
     108             : 
     109             :         /*
     110             :          * Truncation is essentially harmless, because we skip files whose
     111             :          * format is different from WAL files and backup history files. (In
     112             :          * principle, one could use a 1000-character additional_ext and get
     113             :          * trouble.)
     114             :          */
     115          70 :         strlcpy(walfile, xlde->d_name, MAXPGPATH);
     116          70 :         TrimExtension(walfile, additional_ext);
     117             : 
     118             :         /*
     119             :          * Ignore anything that does not look like a WAL segment, a .partial
     120             :          * WAL segment or a backup history file (if requested).
     121             :          */
     122          70 :         if (!IsXLogFileName(walfile) && !IsPartialXLogFileName(walfile) &&
     123          36 :             !(cleanBackupHistory && IsBackupHistoryFileName(walfile)))
     124          54 :             continue;
     125             : 
     126             :         /*
     127             :          * We ignore the timeline part of the XLOG segment identifiers in
     128             :          * deciding whether a segment is still needed.  This ensures that we
     129             :          * won't prematurely remove a segment from a parent timeline. We could
     130             :          * probably be a little more proactive about removing segments of
     131             :          * non-parent timelines, but that would be a whole lot more
     132             :          * complicated.
     133             :          *
     134             :          * We use the alphanumeric sorting property of the filenames to decide
     135             :          * which ones are earlier than the exclusiveCleanupFileName file. Note
     136             :          * that this means files are not removed in the order they were
     137             :          * originally written, in case this worries you.
     138             :          */
     139          36 :         if (strcmp(walfile + 8, exclusiveCleanupFileName + 8) >= 0)
     140          18 :             continue;
     141             : 
     142             :         /*
     143             :          * Use the original file name again now, including any extension that
     144             :          * might have been chopped off before testing the sequence.
     145             :          */
     146          18 :         snprintf(WALFilePath, sizeof(WALFilePath), "%s/%s",
     147          18 :                  archiveLocation, xlde->d_name);
     148             : 
     149          18 :         if (dryrun)
     150             :         {
     151             :             /*
     152             :              * Prints the name of the file to be removed and skips the actual
     153             :              * removal.  The regular printout is so that the user can pipe the
     154             :              * output into some other program.
     155             :              */
     156           2 :             printf("%s\n", WALFilePath);
     157           2 :             pg_log_debug("file \"%s\" would be removed", WALFilePath);
     158           2 :             continue;
     159             :         }
     160             : 
     161          16 :         pg_log_debug("removing file \"%s\"", WALFilePath);
     162             : 
     163          16 :         rc = unlink(WALFilePath);
     164          16 :         if (rc != 0)
     165           0 :             pg_fatal("could not remove file \"%s\": %m",
     166             :                      WALFilePath);
     167             :     }
     168             : 
     169          10 :     if (errno)
     170           0 :         pg_fatal("could not read archive location \"%s\": %m",
     171             :                  archiveLocation);
     172          10 :     if (closedir(xldir))
     173           0 :         pg_fatal("could not close archive location \"%s\": %m",
     174             :                  archiveLocation);
     175          10 : }
     176             : 
     177             : /*
     178             :  * SetWALFileNameForCleanup()
     179             :  *
     180             :  *    Set the earliest WAL filename that we want to keep on the archive
     181             :  *    and decide whether we need cleanup
     182             :  */
     183             : static void
     184          12 : SetWALFileNameForCleanup(void)
     185             : {
     186          12 :     bool        fnameOK = false;
     187             : 
     188          12 :     TrimExtension(restartWALFileName, additional_ext);
     189             : 
     190             :     /*
     191             :      * If restartWALFileName is a WAL file name then just use it directly. If
     192             :      * restartWALFileName is a .partial or .backup filename, make sure we use
     193             :      * the prefix of the filename, otherwise we will remove wrong files since
     194             :      * 000000010000000000000010.partial and
     195             :      * 000000010000000000000010.00000020.backup are after
     196             :      * 000000010000000000000010.
     197             :      */
     198          12 :     if (IsXLogFileName(restartWALFileName))
     199             :     {
     200           6 :         strcpy(exclusiveCleanupFileName, restartWALFileName);
     201           6 :         fnameOK = true;
     202             :     }
     203           6 :     else if (IsPartialXLogFileName(restartWALFileName))
     204             :     {
     205             :         int         args;
     206           2 :         uint32      tli = 1,
     207           2 :                     log = 0,
     208           2 :                     seg = 0;
     209             : 
     210           2 :         args = sscanf(restartWALFileName, "%08X%08X%08X.partial",
     211             :                       &tli, &log, &seg);
     212           2 :         if (args == 3)
     213             :         {
     214           2 :             fnameOK = true;
     215             : 
     216             :             /*
     217             :              * Use just the prefix of the filename, ignore everything after
     218             :              * first period
     219             :              */
     220           2 :             XLogFileNameById(exclusiveCleanupFileName, tli, log, seg);
     221             :         }
     222             :     }
     223           4 :     else if (IsBackupHistoryFileName(restartWALFileName))
     224             :     {
     225             :         int         args;
     226           2 :         uint32      tli = 1,
     227           2 :                     log = 0,
     228           2 :                     seg = 0,
     229           2 :                     offset = 0;
     230             : 
     231           2 :         args = sscanf(restartWALFileName, "%08X%08X%08X.%08X.backup", &tli, &log, &seg, &offset);
     232           2 :         if (args == 4)
     233             :         {
     234           2 :             fnameOK = true;
     235             : 
     236             :             /*
     237             :              * Use just the prefix of the filename, ignore everything after
     238             :              * first period
     239             :              */
     240           2 :             XLogFileNameById(exclusiveCleanupFileName, tli, log, seg);
     241             :         }
     242             :     }
     243             : 
     244          12 :     if (!fnameOK)
     245             :     {
     246           2 :         pg_log_error("invalid file name argument");
     247           2 :         pg_log_error_hint("Try \"%s --help\" for more information.", progname);
     248           2 :         exit(2);
     249             :     }
     250          10 : }
     251             : 
     252             : /* =====================================================================
     253             :  *        End of Customizable section
     254             :  * =====================================================================
     255             :  */
     256             : 
     257             : static void
     258           2 : usage(void)
     259             : {
     260           2 :     printf(_("%s removes older WAL files from PostgreSQL archives.\n\n"), progname);
     261           2 :     printf(_("Usage:\n"));
     262           2 :     printf(_("  %s [OPTION]... ARCHIVELOCATION OLDESTKEPTWALFILE\n"), progname);
     263           2 :     printf(_("\nOptions:\n"));
     264           2 :     printf(_("  -b, --clean-backup-history  clean up files including backup history files\n"));
     265           2 :     printf(_("  -d, --debug                 generate debug output (verbose mode)\n"));
     266           2 :     printf(_("  -n, --dry-run               dry run, show the names of the files that would be\n"
     267             :              "                              removed\n"));
     268           2 :     printf(_("  -V, --version               output version information, then exit\n"));
     269           2 :     printf(_("  -x, --strip-extension=EXT   strip this extension before identifying files for\n"
     270             :              "                              clean up\n"));
     271           2 :     printf(_("  -?, --help                  show this help, then exit\n"));
     272           2 :     printf(_("\n"
     273             :              "For use as \"archive_cleanup_command\" in postgresql.conf:\n"
     274             :              "  archive_cleanup_command = 'pg_archivecleanup [OPTION]... ARCHIVELOCATION %%r'\n"
     275             :              "e.g.\n"
     276             :              "  archive_cleanup_command = 'pg_archivecleanup /mnt/server/archiverdir %%r'\n"));
     277           2 :     printf(_("\n"
     278             :              "Or for use as a standalone archive cleaner:\n"
     279             :              "e.g.\n"
     280             :              "  pg_archivecleanup /mnt/server/archiverdir 000000010000000000000010.00000020.backup\n"));
     281           2 :     printf(_("\nReport bugs to <%s>.\n"), PACKAGE_BUGREPORT);
     282           2 :     printf(_("%s home page: <%s>\n"), PACKAGE_NAME, PACKAGE_URL);
     283           2 : }
     284             : 
     285             : /*------------ MAIN ----------------------------------------*/
     286             : int
     287          26 : main(int argc, char **argv)
     288             : {
     289             :     static struct option long_options[] = {
     290             :         {"clean-backup-history", no_argument, NULL, 'b'},
     291             :         {"debug", no_argument, NULL, 'd'},
     292             :         {"dry-run", no_argument, NULL, 'n'},
     293             :         {"strip-extension", required_argument, NULL, 'x'},
     294             :         {NULL, 0, NULL, 0}
     295             :     };
     296             :     int         c;
     297             : 
     298          26 :     pg_logging_init(argv[0]);
     299          26 :     set_pglocale_pgservice(argv[0], PG_TEXTDOMAIN("pg_archivecleanup"));
     300          26 :     progname = get_progname(argv[0]);
     301             : 
     302          26 :     if (argc > 1)
     303             :     {
     304          24 :         if (strcmp(argv[1], "--help") == 0 || strcmp(argv[1], "-?") == 0)
     305             :         {
     306           2 :             usage();
     307           2 :             exit(0);
     308             :         }
     309          22 :         if (strcmp(argv[1], "--version") == 0 || strcmp(argv[1], "-V") == 0)
     310             :         {
     311           2 :             puts("pg_archivecleanup (PostgreSQL) " PG_VERSION);
     312           2 :             exit(0);
     313             :         }
     314             :     }
     315             : 
     316          34 :     while ((c = getopt_long(argc, argv, "bdnx:", long_options, NULL)) != -1)
     317             :     {
     318          14 :         switch (c)
     319             :         {
     320           2 :             case 'b':           /* Remove backup history files as well */
     321           2 :                 cleanBackupHistory = true;
     322           2 :                 break;
     323           2 :             case 'd':           /* Debug mode */
     324           2 :                 pg_logging_increase_verbosity();
     325           2 :                 break;
     326           2 :             case 'n':           /* Dry-Run mode */
     327           2 :                 dryrun = true;
     328           2 :                 break;
     329           6 :             case 'x':
     330           6 :                 additional_ext = pg_strdup(optarg); /* Extension to remove
     331             :                                                      * from xlogfile names */
     332           6 :                 break;
     333           2 :             default:
     334             :                 /* getopt already emitted a complaint */
     335           2 :                 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
     336           2 :                 exit(2);
     337             :         }
     338             :     }
     339             : 
     340             :     /*
     341             :      * We will go to the archiveLocation to check restartWALFileName.
     342             :      * restartWALFileName may not exist anymore, which would not be an error,
     343             :      * so we separate the archiveLocation and restartWALFileName so we can
     344             :      * check separately whether archiveLocation exists, if not that is an
     345             :      * error
     346             :      */
     347          20 :     if (optind < argc)
     348             :     {
     349          18 :         archiveLocation = argv[optind];
     350          18 :         optind++;
     351             :     }
     352             :     else
     353             :     {
     354           2 :         pg_log_error("must specify archive location");
     355           2 :         pg_log_error_hint("Try \"%s --help\" for more information.", progname);
     356           2 :         exit(2);
     357             :     }
     358             : 
     359          18 :     if (optind < argc)
     360             :     {
     361          16 :         restartWALFileName = argv[optind];
     362          16 :         optind++;
     363             :     }
     364             :     else
     365             :     {
     366           2 :         pg_log_error("must specify oldest kept WAL file");
     367           2 :         pg_log_error_hint("Try \"%s --help\" for more information.", progname);
     368           2 :         exit(2);
     369             :     }
     370             : 
     371          16 :     if (optind < argc)
     372             :     {
     373           2 :         pg_log_error("too many command-line arguments");
     374           2 :         pg_log_error_hint("Try \"%s --help\" for more information.", progname);
     375           2 :         exit(2);
     376             :     }
     377             : 
     378             :     /*
     379             :      * Check archive exists and other initialization if required.
     380             :      */
     381          14 :     Initialize();
     382             : 
     383             :     /*
     384             :      * Check filename is a valid name, then process to find cut-off
     385             :      */
     386          12 :     SetWALFileNameForCleanup();
     387             : 
     388          10 :     pg_log_debug("keeping WAL file \"%s/%s\" and later",
     389             :                  archiveLocation, exclusiveCleanupFileName);
     390             : 
     391             :     /*
     392             :      * Remove WAL files older than cut-off
     393             :      */
     394          10 :     CleanupPriorWALFiles();
     395             : 
     396          10 :     exit(0);
     397             : }

Generated by: LCOV version 1.14