LCOV - code coverage report
Current view: top level - src/bin/pg_dump - pg_backup_directory.c (source / functions) Hit Total Coverage
Test: PostgreSQL 18devel Lines: 241 294 82.0 %
Date: 2025-01-18 04:15:08 Functions: 27 27 100.0 %
Legend: Lines: hit not hit

          Line data    Source code
       1             : /*-------------------------------------------------------------------------
       2             :  *
       3             :  * pg_backup_directory.c
       4             :  *
       5             :  *  A directory format dump is a directory, which contains a "toc.dat" file
       6             :  *  for the TOC, and a separate file for each data entry, named "<oid>.dat".
       7             :  *  Large objects are stored in separate files named "blob_<oid>.dat",
       8             :  *  and there's a plain-text TOC file for each BLOBS TOC entry named
       9             :  *  "blobs_<dumpID>.toc" (or just "blobs.toc" in archive versions before 16).
      10             :  *
      11             :  *  If compression is used, each data file is individually compressed and the
      12             :  *  ".gz" suffix is added to the filenames. The TOC files are never
      13             :  *  compressed by pg_dump, however they are accepted with the .gz suffix too,
      14             :  *  in case the user has manually compressed them with 'gzip'.
      15             :  *
      16             :  *  NOTE: This format is identical to the files written in the tar file in
      17             :  *  the 'tar' format, except that we don't write the restore.sql file (TODO),
      18             :  *  and the tar format doesn't support compression. Please keep the formats in
      19             :  *  sync.
      20             :  *
      21             :  *
      22             :  *  Portions Copyright (c) 1996-2025, PostgreSQL Global Development Group
      23             :  *  Portions Copyright (c) 1994, Regents of the University of California
      24             :  *  Portions Copyright (c) 2000, Philip Warner
      25             :  *
      26             :  *  Rights are granted to use this software in any way so long
      27             :  *  as this notice is not removed.
      28             :  *
      29             :  *  The author is not responsible for loss or damages that may
      30             :  *  result from its use.
      31             :  *
      32             :  * IDENTIFICATION
      33             :  *      src/bin/pg_dump/pg_backup_directory.c
      34             :  *
      35             :  *-------------------------------------------------------------------------
      36             :  */
      37             : #include "postgres_fe.h"
      38             : 
      39             : #include <dirent.h>
      40             : #include <sys/stat.h>
      41             : 
      42             : #include "common/file_utils.h"
      43             : #include "compress_io.h"
      44             : #include "parallel.h"
      45             : #include "pg_backup_utils.h"
      46             : 
      47             : typedef struct
      48             : {
      49             :     /*
      50             :      * Our archive location. This is basically what the user specified as his
      51             :      * backup file but of course here it is a directory.
      52             :      */
      53             :     char       *directory;
      54             : 
      55             :     CompressFileHandle *dataFH; /* currently open data file */
      56             :     CompressFileHandle *LOsTocFH;   /* file handle for blobs_NNN.toc */
      57             :     ParallelState *pstate;      /* for parallel backup / restore */
      58             : } lclContext;
      59             : 
      60             : typedef struct
      61             : {
      62             :     char       *filename;       /* filename excluding the directory (basename) */
      63             : } lclTocEntry;
      64             : 
      65             : /* prototypes for private functions */
      66             : static void _ArchiveEntry(ArchiveHandle *AH, TocEntry *te);
      67             : static void _StartData(ArchiveHandle *AH, TocEntry *te);
      68             : static void _EndData(ArchiveHandle *AH, TocEntry *te);
      69             : static void _WriteData(ArchiveHandle *AH, const void *data, size_t dLen);
      70             : static int  _WriteByte(ArchiveHandle *AH, const int i);
      71             : static int  _ReadByte(ArchiveHandle *AH);
      72             : static void _WriteBuf(ArchiveHandle *AH, const void *buf, size_t len);
      73             : static void _ReadBuf(ArchiveHandle *AH, void *buf, size_t len);
      74             : static void _CloseArchive(ArchiveHandle *AH);
      75             : static void _ReopenArchive(ArchiveHandle *AH);
      76             : static void _PrintTocData(ArchiveHandle *AH, TocEntry *te);
      77             : 
      78             : static void _WriteExtraToc(ArchiveHandle *AH, TocEntry *te);
      79             : static void _ReadExtraToc(ArchiveHandle *AH, TocEntry *te);
      80             : static void _PrintExtraToc(ArchiveHandle *AH, TocEntry *te);
      81             : 
      82             : static void _StartLOs(ArchiveHandle *AH, TocEntry *te);
      83             : static void _StartLO(ArchiveHandle *AH, TocEntry *te, Oid oid);
      84             : static void _EndLO(ArchiveHandle *AH, TocEntry *te, Oid oid);
      85             : static void _EndLOs(ArchiveHandle *AH, TocEntry *te);
      86             : static void _LoadLOs(ArchiveHandle *AH, TocEntry *te);
      87             : 
      88             : static void _PrepParallelRestore(ArchiveHandle *AH);
      89             : static void _Clone(ArchiveHandle *AH);
      90             : static void _DeClone(ArchiveHandle *AH);
      91             : 
      92             : static int  _WorkerJobRestoreDirectory(ArchiveHandle *AH, TocEntry *te);
      93             : static int  _WorkerJobDumpDirectory(ArchiveHandle *AH, TocEntry *te);
      94             : 
      95             : static void setFilePath(ArchiveHandle *AH, char *buf,
      96             :                         const char *relativeFilename);
      97             : 
      98             : /*
      99             :  *  Init routine required by ALL formats. This is a global routine
     100             :  *  and should be declared in pg_backup_archiver.h
     101             :  *
     102             :  *  Its task is to create any extra archive context (using AH->formatData),
     103             :  *  and to initialize the supported function pointers.
     104             :  *
     105             :  *  It should also prepare whatever its input source is for reading/writing,
     106             :  *  and in the case of a read mode connection, it should load the Header & TOC.
     107             :  */
     108             : void
     109          44 : InitArchiveFmt_Directory(ArchiveHandle *AH)
     110             : {
     111             :     lclContext *ctx;
     112             : 
     113             :     /* Assuming static functions, this can be copied for each format. */
     114          44 :     AH->ArchiveEntryPtr = _ArchiveEntry;
     115          44 :     AH->StartDataPtr = _StartData;
     116          44 :     AH->WriteDataPtr = _WriteData;
     117          44 :     AH->EndDataPtr = _EndData;
     118          44 :     AH->WriteBytePtr = _WriteByte;
     119          44 :     AH->ReadBytePtr = _ReadByte;
     120          44 :     AH->WriteBufPtr = _WriteBuf;
     121          44 :     AH->ReadBufPtr = _ReadBuf;
     122          44 :     AH->ClosePtr = _CloseArchive;
     123          44 :     AH->ReopenPtr = _ReopenArchive;
     124          44 :     AH->PrintTocDataPtr = _PrintTocData;
     125          44 :     AH->ReadExtraTocPtr = _ReadExtraToc;
     126          44 :     AH->WriteExtraTocPtr = _WriteExtraToc;
     127          44 :     AH->PrintExtraTocPtr = _PrintExtraToc;
     128             : 
     129          44 :     AH->StartLOsPtr = _StartLOs;
     130          44 :     AH->StartLOPtr = _StartLO;
     131          44 :     AH->EndLOPtr = _EndLO;
     132          44 :     AH->EndLOsPtr = _EndLOs;
     133             : 
     134          44 :     AH->PrepParallelRestorePtr = _PrepParallelRestore;
     135          44 :     AH->ClonePtr = _Clone;
     136          44 :     AH->DeClonePtr = _DeClone;
     137             : 
     138          44 :     AH->WorkerJobRestorePtr = _WorkerJobRestoreDirectory;
     139          44 :     AH->WorkerJobDumpPtr = _WorkerJobDumpDirectory;
     140             : 
     141             :     /* Set up our private context */
     142          44 :     ctx = (lclContext *) pg_malloc0(sizeof(lclContext));
     143          44 :     AH->formatData = ctx;
     144             : 
     145          44 :     ctx->dataFH = NULL;
     146          44 :     ctx->LOsTocFH = NULL;
     147             : 
     148             :     /*
     149             :      * Now open the TOC file
     150             :      */
     151             : 
     152          44 :     if (!AH->fSpec || strcmp(AH->fSpec, "") == 0)
     153           0 :         pg_fatal("no output directory specified");
     154             : 
     155          44 :     ctx->directory = AH->fSpec;
     156             : 
     157          44 :     if (AH->mode == archModeWrite)
     158             :     {
     159             :         struct stat st;
     160          20 :         bool        is_empty = false;
     161             : 
     162             :         /* we accept an empty existing directory */
     163          20 :         if (stat(ctx->directory, &st) == 0 && S_ISDIR(st.st_mode))
     164             :         {
     165           0 :             DIR        *dir = opendir(ctx->directory);
     166             : 
     167           0 :             if (dir)
     168             :             {
     169             :                 struct dirent *d;
     170             : 
     171           0 :                 is_empty = true;
     172           0 :                 while (errno = 0, (d = readdir(dir)))
     173             :                 {
     174           0 :                     if (strcmp(d->d_name, ".") != 0 && strcmp(d->d_name, "..") != 0)
     175             :                     {
     176           0 :                         is_empty = false;
     177           0 :                         break;
     178             :                     }
     179             :                 }
     180             : 
     181           0 :                 if (errno)
     182           0 :                     pg_fatal("could not read directory \"%s\": %m",
     183             :                              ctx->directory);
     184             : 
     185           0 :                 if (closedir(dir))
     186           0 :                     pg_fatal("could not close directory \"%s\": %m",
     187             :                              ctx->directory);
     188             :             }
     189             :         }
     190             : 
     191          20 :         if (!is_empty && mkdir(ctx->directory, 0700) < 0)
     192           0 :             pg_fatal("could not create directory \"%s\": %m",
     193             :                      ctx->directory);
     194             :     }
     195             :     else
     196             :     {                           /* Read Mode */
     197             :         char        fname[MAXPGPATH];
     198             :         CompressFileHandle *tocFH;
     199             : 
     200          24 :         setFilePath(AH, fname, "toc.dat");
     201             : 
     202          24 :         tocFH = InitDiscoverCompressFileHandle(fname, PG_BINARY_R);
     203          24 :         if (tocFH == NULL)
     204           0 :             pg_fatal("could not open input file \"%s\": %m", fname);
     205             : 
     206          24 :         ctx->dataFH = tocFH;
     207             : 
     208             :         /*
     209             :          * The TOC of a directory format dump shares the format code of the
     210             :          * tar format.
     211             :          */
     212          24 :         AH->format = archTar;
     213          24 :         ReadHead(AH);
     214          24 :         AH->format = archDirectory;
     215          24 :         ReadToc(AH);
     216             : 
     217             :         /* Nothing else in the file, so close it again... */
     218          24 :         if (!EndCompressFileHandle(tocFH))
     219           0 :             pg_fatal("could not close TOC file: %m");
     220          24 :         ctx->dataFH = NULL;
     221             :     }
     222          44 : }
     223             : 
     224             : /*
     225             :  * Called by the Archiver when the dumper creates a new TOC entry.
     226             :  *
     227             :  * We determine the filename for this entry.
     228             : */
     229             : static void
     230        2630 : _ArchiveEntry(ArchiveHandle *AH, TocEntry *te)
     231             : {
     232             :     lclTocEntry *tctx;
     233             :     char        fn[MAXPGPATH];
     234             : 
     235        2630 :     tctx = (lclTocEntry *) pg_malloc0(sizeof(lclTocEntry));
     236        2630 :     if (strcmp(te->desc, "BLOBS") == 0)
     237             :     {
     238          16 :         snprintf(fn, MAXPGPATH, "blobs_%d.toc", te->dumpId);
     239          16 :         tctx->filename = pg_strdup(fn);
     240             :     }
     241        2614 :     else if (te->dataDumper)
     242             :     {
     243         290 :         snprintf(fn, MAXPGPATH, "%d.dat", te->dumpId);
     244         290 :         tctx->filename = pg_strdup(fn);
     245             :     }
     246             :     else
     247        2324 :         tctx->filename = NULL;
     248             : 
     249        2630 :     te->formatData = tctx;
     250        2630 : }
     251             : 
     252             : /*
     253             :  * Called by the Archiver to save any extra format-related TOC entry
     254             :  * data.
     255             :  *
     256             :  * Use the Archiver routines to write data - they are non-endian, and
     257             :  * maintain other important file information.
     258             :  */
     259             : static void
     260        2630 : _WriteExtraToc(ArchiveHandle *AH, TocEntry *te)
     261             : {
     262        2630 :     lclTocEntry *tctx = (lclTocEntry *) te->formatData;
     263             : 
     264             :     /*
     265             :      * A dumpable object has set tctx->filename, any other object has not.
     266             :      * (see _ArchiveEntry).
     267             :      */
     268        2630 :     if (tctx->filename)
     269         306 :         WriteStr(AH, tctx->filename);
     270             :     else
     271        2324 :         WriteStr(AH, "");
     272        2630 : }
     273             : 
     274             : /*
     275             :  * Called by the Archiver to read any extra format-related TOC data.
     276             :  *
     277             :  * Needs to match the order defined in _WriteExtraToc, and should also
     278             :  * use the Archiver input routines.
     279             :  */
     280             : static void
     281        3212 : _ReadExtraToc(ArchiveHandle *AH, TocEntry *te)
     282             : {
     283        3212 :     lclTocEntry *tctx = (lclTocEntry *) te->formatData;
     284             : 
     285        3212 :     if (tctx == NULL)
     286             :     {
     287        3212 :         tctx = (lclTocEntry *) pg_malloc0(sizeof(lclTocEntry));
     288        3212 :         te->formatData = tctx;
     289             :     }
     290             : 
     291        3212 :     tctx->filename = ReadStr(AH);
     292        3212 :     if (strlen(tctx->filename) == 0)
     293             :     {
     294        2840 :         free(tctx->filename);
     295        2840 :         tctx->filename = NULL;
     296             :     }
     297        3212 : }
     298             : 
     299             : /*
     300             :  * Called by the Archiver when restoring an archive to output a comment
     301             :  * that includes useful information about the TOC entry.
     302             :  */
     303             : static void
     304        2380 : _PrintExtraToc(ArchiveHandle *AH, TocEntry *te)
     305             : {
     306        2380 :     lclTocEntry *tctx = (lclTocEntry *) te->formatData;
     307             : 
     308        2380 :     if (AH->public.verbose && tctx->filename)
     309           0 :         ahprintf(AH, "-- File: %s\n", tctx->filename);
     310        2380 : }
     311             : 
     312             : /*
     313             :  * Called by the archiver when saving TABLE DATA (not schema). This routine
     314             :  * should save whatever format-specific information is needed to read
     315             :  * the archive back.
     316             :  *
     317             :  * It is called just prior to the dumper's 'DataDumper' routine being called.
     318             :  *
     319             :  * We create the data file for writing.
     320             :  */
     321             : static void
     322         290 : _StartData(ArchiveHandle *AH, TocEntry *te)
     323             : {
     324         290 :     lclTocEntry *tctx = (lclTocEntry *) te->formatData;
     325         290 :     lclContext *ctx = (lclContext *) AH->formatData;
     326             :     char        fname[MAXPGPATH];
     327             : 
     328         290 :     setFilePath(AH, fname, tctx->filename);
     329             : 
     330         290 :     ctx->dataFH = InitCompressFileHandle(AH->compression_spec);
     331             : 
     332         290 :     if (!ctx->dataFH->open_write_func(fname, PG_BINARY_W, ctx->dataFH))
     333           0 :         pg_fatal("could not open output file \"%s\": %m", fname);
     334         290 : }
     335             : 
     336             : /*
     337             :  * Called by archiver when dumper calls WriteData. This routine is
     338             :  * called for both LO and table data; it is the responsibility of
     339             :  * the format to manage each kind of data using StartLO/StartData.
     340             :  *
     341             :  * It should only be called from within a DataDumper routine.
     342             :  *
     343             :  * We write the data to the open data file.
     344             :  */
     345             : static void
     346       48556 : _WriteData(ArchiveHandle *AH, const void *data, size_t dLen)
     347             : {
     348       48556 :     lclContext *ctx = (lclContext *) AH->formatData;
     349       48556 :     CompressFileHandle *CFH = ctx->dataFH;
     350             : 
     351       48556 :     errno = 0;
     352       48556 :     if (dLen > 0 && !CFH->write_func(data, dLen, CFH))
     353             :     {
     354             :         /* if write didn't set errno, assume problem is no disk space */
     355           0 :         if (errno == 0)
     356           0 :             errno = ENOSPC;
     357           0 :         pg_fatal("could not write to output file: %s",
     358             :                  CFH->get_error_func(CFH));
     359             :     }
     360       48556 : }
     361             : 
     362             : /*
     363             :  * Called by the archiver when a dumper's 'DataDumper' routine has
     364             :  * finished.
     365             :  *
     366             :  * We close the data file.
     367             :  */
     368             : static void
     369         290 : _EndData(ArchiveHandle *AH, TocEntry *te)
     370             : {
     371         290 :     lclContext *ctx = (lclContext *) AH->formatData;
     372             : 
     373             :     /* Close the file */
     374         290 :     if (!EndCompressFileHandle(ctx->dataFH))
     375           0 :         pg_fatal("could not close data file: %m");
     376             : 
     377         290 :     ctx->dataFH = NULL;
     378         290 : }
     379             : 
     380             : /*
     381             :  * Print data for a given file (can be a LO as well)
     382             :  */
     383             : static void
     384         308 : _PrintFileData(ArchiveHandle *AH, char *filename)
     385             : {
     386         308 :     size_t      cnt = 0;
     387             :     char       *buf;
     388             :     size_t      buflen;
     389             :     CompressFileHandle *CFH;
     390             : 
     391         308 :     if (!filename)
     392           0 :         return;
     393             : 
     394         308 :     CFH = InitDiscoverCompressFileHandle(filename, PG_BINARY_R);
     395         308 :     if (!CFH)
     396           0 :         pg_fatal("could not open input file \"%s\": %m", filename);
     397             : 
     398         308 :     buflen = DEFAULT_IO_BUFFER_SIZE;
     399         308 :     buf = pg_malloc(buflen);
     400             : 
     401         694 :     while (CFH->read_func(buf, buflen, &cnt, CFH) && cnt > 0)
     402             :     {
     403         386 :         ahwrite(buf, 1, cnt, AH);
     404             :     }
     405             : 
     406         308 :     free(buf);
     407         308 :     if (!EndCompressFileHandle(CFH))
     408           0 :         pg_fatal("could not close data file \"%s\": %m", filename);
     409             : }
     410             : 
     411             : /*
     412             :  * Print data for a given TOC entry
     413             : */
     414             : static void
     415         308 : _PrintTocData(ArchiveHandle *AH, TocEntry *te)
     416             : {
     417         308 :     lclTocEntry *tctx = (lclTocEntry *) te->formatData;
     418             : 
     419         308 :     if (!tctx->filename)
     420           0 :         return;
     421             : 
     422         308 :     if (strcmp(te->desc, "BLOBS") == 0)
     423          16 :         _LoadLOs(AH, te);
     424             :     else
     425             :     {
     426             :         char        fname[MAXPGPATH];
     427             : 
     428         292 :         setFilePath(AH, fname, tctx->filename);
     429         292 :         _PrintFileData(AH, fname);
     430             :     }
     431             : }
     432             : 
     433             : static void
     434          16 : _LoadLOs(ArchiveHandle *AH, TocEntry *te)
     435             : {
     436             :     Oid         oid;
     437          16 :     lclContext *ctx = (lclContext *) AH->formatData;
     438          16 :     lclTocEntry *tctx = (lclTocEntry *) te->formatData;
     439             :     CompressFileHandle *CFH;
     440             :     char        tocfname[MAXPGPATH];
     441             :     char        line[MAXPGPATH];
     442             : 
     443          16 :     StartRestoreLOs(AH);
     444             : 
     445             :     /*
     446             :      * Note: before archive v16, there was always only one BLOBS TOC entry,
     447             :      * now there can be multiple.  We don't need to worry what version we are
     448             :      * reading though, because tctx->filename should be correct either way.
     449             :      */
     450          16 :     setFilePath(AH, tocfname, tctx->filename);
     451             : 
     452          16 :     CFH = ctx->LOsTocFH = InitDiscoverCompressFileHandle(tocfname, PG_BINARY_R);
     453             : 
     454          16 :     if (ctx->LOsTocFH == NULL)
     455           0 :         pg_fatal("could not open large object TOC file \"%s\" for input: %m",
     456             :                  tocfname);
     457             : 
     458             :     /* Read the LOs TOC file line-by-line, and process each LO */
     459          32 :     while ((CFH->gets_func(line, MAXPGPATH, CFH)) != NULL)
     460             :     {
     461             :         char        lofname[MAXPGPATH + 1];
     462             :         char        path[MAXPGPATH];
     463             : 
     464             :         /* Can't overflow because line and lofname are the same length */
     465          16 :         if (sscanf(line, "%u %" CppAsString2(MAXPGPATH) "s\n", &oid, lofname) != 2)
     466           0 :             pg_fatal("invalid line in large object TOC file \"%s\": \"%s\"",
     467             :                      tocfname, line);
     468             : 
     469          16 :         StartRestoreLO(AH, oid, AH->public.ropt->dropSchema);
     470          16 :         snprintf(path, MAXPGPATH, "%s/%s", ctx->directory, lofname);
     471          16 :         _PrintFileData(AH, path);
     472          16 :         EndRestoreLO(AH, oid);
     473             :     }
     474          16 :     if (!CFH->eof_func(CFH))
     475           0 :         pg_fatal("error reading large object TOC file \"%s\"",
     476             :                  tocfname);
     477             : 
     478          16 :     if (!EndCompressFileHandle(ctx->LOsTocFH))
     479           0 :         pg_fatal("could not close large object TOC file \"%s\": %m",
     480             :                  tocfname);
     481             : 
     482          16 :     ctx->LOsTocFH = NULL;
     483             : 
     484          16 :     EndRestoreLOs(AH);
     485          16 : }
     486             : 
     487             : 
     488             : /*
     489             :  * Write a byte of data to the archive.
     490             :  * Called by the archiver to do integer & byte output to the archive.
     491             :  * These routines are only used to read & write the headers & TOC.
     492             :  */
     493             : static int
     494      259240 : _WriteByte(ArchiveHandle *AH, const int i)
     495             : {
     496      259240 :     unsigned char c = (unsigned char) i;
     497      259240 :     lclContext *ctx = (lclContext *) AH->formatData;
     498      259240 :     CompressFileHandle *CFH = ctx->dataFH;
     499             : 
     500      259240 :     errno = 0;
     501      259240 :     if (!CFH->write_func(&c, 1, CFH))
     502             :     {
     503             :         /* if write didn't set errno, assume problem is no disk space */
     504           0 :         if (errno == 0)
     505           0 :             errno = ENOSPC;
     506           0 :         pg_fatal("could not write to output file: %s",
     507             :                  CFH->get_error_func(CFH));
     508             :     }
     509             : 
     510      259240 :     return 1;
     511             : }
     512             : 
     513             : /*
     514             :  * Read a byte of data from the archive.
     515             :  * Called by the archiver to read bytes & integers from the archive.
     516             :  * These routines are only used to read & write headers & TOC.
     517             :  * EOF should be treated as a fatal error.
     518             :  */
     519             : static int
     520      316468 : _ReadByte(ArchiveHandle *AH)
     521             : {
     522      316468 :     lclContext *ctx = (lclContext *) AH->formatData;
     523      316468 :     CompressFileHandle *CFH = ctx->dataFH;
     524             : 
     525      316468 :     return CFH->getc_func(CFH);
     526             : }
     527             : 
     528             : /*
     529             :  * Write a buffer of data to the archive.
     530             :  * Called by the archiver to write a block of bytes to the TOC or a data file.
     531             :  */
     532             : static void
     533       29682 : _WriteBuf(ArchiveHandle *AH, const void *buf, size_t len)
     534             : {
     535       29682 :     lclContext *ctx = (lclContext *) AH->formatData;
     536       29682 :     CompressFileHandle *CFH = ctx->dataFH;
     537             : 
     538       29682 :     errno = 0;
     539       29682 :     if (!CFH->write_func(buf, len, CFH))
     540             :     {
     541             :         /* if write didn't set errno, assume problem is no disk space */
     542           0 :         if (errno == 0)
     543           0 :             errno = ENOSPC;
     544           0 :         pg_fatal("could not write to output file: %s",
     545             :                  CFH->get_error_func(CFH));
     546             :     }
     547       29682 : }
     548             : 
     549             : /*
     550             :  * Read a block of bytes from the archive.
     551             :  *
     552             :  * Called by the archiver to read a block of bytes from the archive
     553             :  */
     554             : static void
     555       36220 : _ReadBuf(ArchiveHandle *AH, void *buf, size_t len)
     556             : {
     557       36220 :     lclContext *ctx = (lclContext *) AH->formatData;
     558       36220 :     CompressFileHandle *CFH = ctx->dataFH;
     559             : 
     560             :     /*
     561             :      * If there was an I/O error, we already exited in readF(), so here we
     562             :      * exit on short reads.
     563             :      */
     564       36220 :     if (!CFH->read_func(buf, len, NULL, CFH))
     565           0 :         pg_fatal("could not read from input file: end of file");
     566       36220 : }
     567             : 
     568             : /*
     569             :  * Close the archive.
     570             :  *
     571             :  * When writing the archive, this is the routine that actually starts
     572             :  * the process of saving it to files. No data should be written prior
     573             :  * to this point, since the user could sort the TOC after creating it.
     574             :  *
     575             :  * If an archive is to be written, this routine must call:
     576             :  *      WriteHead           to save the archive header
     577             :  *      WriteToc            to save the TOC entries
     578             :  *      WriteDataChunks     to save all data & LOs.
     579             :  */
     580             : static void
     581          44 : _CloseArchive(ArchiveHandle *AH)
     582             : {
     583          44 :     lclContext *ctx = (lclContext *) AH->formatData;
     584             : 
     585          44 :     if (AH->mode == archModeWrite)
     586             :     {
     587             :         CompressFileHandle *tocFH;
     588          20 :         pg_compress_specification compression_spec = {0};
     589             :         char        fname[MAXPGPATH];
     590             : 
     591          20 :         setFilePath(AH, fname, "toc.dat");
     592             : 
     593             :         /* this will actually fork the processes for a parallel backup */
     594          20 :         ctx->pstate = ParallelBackupStart(AH);
     595             : 
     596             :         /* The TOC is always created uncompressed */
     597          20 :         compression_spec.algorithm = PG_COMPRESSION_NONE;
     598          20 :         tocFH = InitCompressFileHandle(compression_spec);
     599          20 :         if (!tocFH->open_write_func(fname, PG_BINARY_W, tocFH))
     600           0 :             pg_fatal("could not open output file \"%s\": %m", fname);
     601          20 :         ctx->dataFH = tocFH;
     602             : 
     603             :         /*
     604             :          * Write 'tar' in the format field of the toc.dat file. The directory
     605             :          * is compatible with 'tar', so there's no point having a different
     606             :          * format code for it.
     607             :          */
     608          20 :         AH->format = archTar;
     609          20 :         WriteHead(AH);
     610          20 :         AH->format = archDirectory;
     611          20 :         WriteToc(AH);
     612          20 :         if (!EndCompressFileHandle(tocFH))
     613           0 :             pg_fatal("could not close TOC file: %m");
     614          20 :         WriteDataChunks(AH, ctx->pstate);
     615             : 
     616          20 :         ParallelBackupEnd(AH, ctx->pstate);
     617             : 
     618             :         /*
     619             :          * In directory mode, there is no need to sync all the entries
     620             :          * individually. Just recurse once through all the files generated.
     621             :          */
     622          20 :         if (AH->dosync)
     623           8 :             sync_dir_recurse(ctx->directory, AH->sync_method);
     624             :     }
     625          44 :     AH->FH = NULL;
     626          44 : }
     627             : 
     628             : /*
     629             :  * Reopen the archive's file handle.
     630             :  */
     631             : static void
     632          28 : _ReopenArchive(ArchiveHandle *AH)
     633             : {
     634             :     /*
     635             :      * Our TOC is in memory, our data files are opened by each child anyway as
     636             :      * they are separate. We support reopening the archive by just doing
     637             :      * nothing.
     638             :      */
     639          28 : }
     640             : 
     641             : /*
     642             :  * LO support
     643             :  */
     644             : 
     645             : /*
     646             :  * Called by the archiver when starting to save BLOB DATA (not schema).
     647             :  * It is called just prior to the dumper's DataDumper routine.
     648             :  *
     649             :  * We open the large object TOC file here, so that we can append a line to
     650             :  * it for each LO.
     651             :  */
     652             : static void
     653          16 : _StartLOs(ArchiveHandle *AH, TocEntry *te)
     654             : {
     655          16 :     lclContext *ctx = (lclContext *) AH->formatData;
     656          16 :     lclTocEntry *tctx = (lclTocEntry *) te->formatData;
     657          16 :     pg_compress_specification compression_spec = {0};
     658             :     char        fname[MAXPGPATH];
     659             : 
     660          16 :     setFilePath(AH, fname, tctx->filename);
     661             : 
     662             :     /* The LO TOC file is never compressed */
     663          16 :     compression_spec.algorithm = PG_COMPRESSION_NONE;
     664          16 :     ctx->LOsTocFH = InitCompressFileHandle(compression_spec);
     665          16 :     if (!ctx->LOsTocFH->open_write_func(fname, "ab", ctx->LOsTocFH))
     666           0 :         pg_fatal("could not open output file \"%s\": %m", fname);
     667          16 : }
     668             : 
     669             : /*
     670             :  * Called by the archiver when we're about to start dumping a LO.
     671             :  *
     672             :  * We create a file to write the LO to.
     673             :  */
     674             : static void
     675          16 : _StartLO(ArchiveHandle *AH, TocEntry *te, Oid oid)
     676             : {
     677          16 :     lclContext *ctx = (lclContext *) AH->formatData;
     678             :     char        fname[MAXPGPATH];
     679             : 
     680          16 :     snprintf(fname, MAXPGPATH, "%s/blob_%u.dat", ctx->directory, oid);
     681             : 
     682          16 :     ctx->dataFH = InitCompressFileHandle(AH->compression_spec);
     683          16 :     if (!ctx->dataFH->open_write_func(fname, PG_BINARY_W, ctx->dataFH))
     684           0 :         pg_fatal("could not open output file \"%s\": %m", fname);
     685          16 : }
     686             : 
     687             : /*
     688             :  * Called by the archiver when the dumper is finished writing a LO.
     689             :  *
     690             :  * We close the LO file and write an entry to the LO TOC file for it.
     691             :  */
     692             : static void
     693          16 : _EndLO(ArchiveHandle *AH, TocEntry *te, Oid oid)
     694             : {
     695          16 :     lclContext *ctx = (lclContext *) AH->formatData;
     696          16 :     CompressFileHandle *CFH = ctx->LOsTocFH;
     697             :     char        buf[50];
     698             :     int         len;
     699             : 
     700             :     /* Close the BLOB data file itself */
     701          16 :     if (!EndCompressFileHandle(ctx->dataFH))
     702           0 :         pg_fatal("could not close LO data file: %m");
     703          16 :     ctx->dataFH = NULL;
     704             : 
     705             :     /* register the LO in blobs_NNN.toc */
     706          16 :     len = snprintf(buf, sizeof(buf), "%u blob_%u.dat\n", oid, oid);
     707          16 :     if (!CFH->write_func(buf, len, CFH))
     708             :     {
     709             :         /* if write didn't set errno, assume problem is no disk space */
     710           0 :         if (errno == 0)
     711           0 :             errno = ENOSPC;
     712           0 :         pg_fatal("could not write to LOs TOC file: %s",
     713             :                  CFH->get_error_func(CFH));
     714             :     }
     715          16 : }
     716             : 
     717             : /*
     718             :  * Called by the archiver when finishing saving BLOB DATA.
     719             :  *
     720             :  * We close the LOs TOC file.
     721             :  */
     722             : static void
     723          16 : _EndLOs(ArchiveHandle *AH, TocEntry *te)
     724             : {
     725          16 :     lclContext *ctx = (lclContext *) AH->formatData;
     726             : 
     727          16 :     if (!EndCompressFileHandle(ctx->LOsTocFH))
     728           0 :         pg_fatal("could not close LOs TOC file: %m");
     729          16 :     ctx->LOsTocFH = NULL;
     730          16 : }
     731             : 
     732             : /*
     733             :  * Gets a relative file name and prepends the output directory, writing the
     734             :  * result to buf. The caller needs to make sure that buf is MAXPGPATH bytes
     735             :  * big. Can't use a static char[MAXPGPATH] inside the function because we run
     736             :  * multithreaded on Windows.
     737             :  */
     738             : static void
     739         690 : setFilePath(ArchiveHandle *AH, char *buf, const char *relativeFilename)
     740             : {
     741         690 :     lclContext *ctx = (lclContext *) AH->formatData;
     742             :     char       *dname;
     743             : 
     744         690 :     dname = ctx->directory;
     745             : 
     746         690 :     if (strlen(dname) + 1 + strlen(relativeFilename) + 1 > MAXPGPATH)
     747           0 :         pg_fatal("file name too long: \"%s\"", dname);
     748             : 
     749         690 :     strcpy(buf, dname);
     750         690 :     strcat(buf, "/");
     751         690 :     strcat(buf, relativeFilename);
     752         690 : }
     753             : 
     754             : /*
     755             :  * Prepare for parallel restore.
     756             :  *
     757             :  * The main thing that needs to happen here is to fill in TABLE DATA and BLOBS
     758             :  * TOC entries' dataLength fields with appropriate values to guide the
     759             :  * ordering of restore jobs.  The source of said data is format-dependent,
     760             :  * as is the exact meaning of the values.
     761             :  *
     762             :  * A format module might also choose to do other setup here.
     763             :  */
     764             : static void
     765           8 : _PrepParallelRestore(ArchiveHandle *AH)
     766             : {
     767             :     TocEntry   *te;
     768             : 
     769         200 :     for (te = AH->toc->next; te != AH->toc; te = te->next)
     770             :     {
     771         192 :         lclTocEntry *tctx = (lclTocEntry *) te->formatData;
     772             :         char        fname[MAXPGPATH];
     773             :         struct stat st;
     774             : 
     775             :         /*
     776             :          * A dumpable object has set tctx->filename, any other object has not.
     777             :          * (see _ArchiveEntry).
     778             :          */
     779         192 :         if (tctx->filename == NULL)
     780         160 :             continue;
     781             : 
     782             :         /* We may ignore items not due to be restored */
     783          32 :         if ((te->reqs & REQ_DATA) == 0)
     784           0 :             continue;
     785             : 
     786             :         /*
     787             :          * Stat the file and, if successful, put its size in dataLength.  When
     788             :          * using compression, the physical file size might not be a very good
     789             :          * guide to the amount of work involved in restoring the file, but we
     790             :          * only need an approximate indicator of that.
     791             :          */
     792          32 :         setFilePath(AH, fname, tctx->filename);
     793             : 
     794          32 :         if (stat(fname, &st) == 0)
     795           0 :             te->dataLength = st.st_size;
     796          32 :         else if (AH->compression_spec.algorithm != PG_COMPRESSION_NONE)
     797             :         {
     798          32 :             if (AH->compression_spec.algorithm == PG_COMPRESSION_GZIP)
     799          32 :                 strlcat(fname, ".gz", sizeof(fname));
     800           0 :             else if (AH->compression_spec.algorithm == PG_COMPRESSION_LZ4)
     801           0 :                 strlcat(fname, ".lz4", sizeof(fname));
     802           0 :             else if (AH->compression_spec.algorithm == PG_COMPRESSION_ZSTD)
     803           0 :                 strlcat(fname, ".zst", sizeof(fname));
     804             : 
     805          32 :             if (stat(fname, &st) == 0)
     806          32 :                 te->dataLength = st.st_size;
     807             :         }
     808             : 
     809             :         /*
     810             :          * If this is a BLOBS entry, what we stat'd was blobs_NNN.toc, which
     811             :          * most likely is a lot smaller than the actual blob data.  We don't
     812             :          * have a cheap way to estimate how much smaller, but fortunately it
     813             :          * doesn't matter too much as long as we get the LOs processed
     814             :          * reasonably early.  Arbitrarily scale up by a factor of 1K.
     815             :          */
     816          32 :         if (strcmp(te->desc, "BLOBS") == 0)
     817           0 :             te->dataLength *= 1024;
     818             :     }
     819           8 : }
     820             : 
     821             : /*
     822             :  * Clone format-specific fields during parallel restoration.
     823             :  */
     824             : static void
     825          52 : _Clone(ArchiveHandle *AH)
     826             : {
     827          52 :     lclContext *ctx = (lclContext *) AH->formatData;
     828             : 
     829          52 :     AH->formatData = (lclContext *) pg_malloc(sizeof(lclContext));
     830          52 :     memcpy(AH->formatData, ctx, sizeof(lclContext));
     831          52 :     ctx = (lclContext *) AH->formatData;
     832             : 
     833             :     /*
     834             :      * TOC-entry-local state isn't an issue because any one TOC entry is
     835             :      * touched by just one worker child.
     836             :      */
     837             : 
     838             :     /*
     839             :      * We also don't copy the ParallelState pointer (pstate), only the leader
     840             :      * process ever writes to it.
     841             :      */
     842          52 : }
     843             : 
     844             : static void
     845          52 : _DeClone(ArchiveHandle *AH)
     846             : {
     847          52 :     lclContext *ctx = (lclContext *) AH->formatData;
     848             : 
     849          52 :     free(ctx);
     850          52 : }
     851             : 
     852             : /*
     853             :  * This function is executed in the child of a parallel backup for a
     854             :  * directory-format archive and dumps the actual data for one TOC entry.
     855             :  */
     856             : static int
     857         236 : _WorkerJobDumpDirectory(ArchiveHandle *AH, TocEntry *te)
     858             : {
     859             :     /*
     860             :      * This function returns void. We either fail and die horribly or
     861             :      * succeed... A failure will be detected by the parent when the child dies
     862             :      * unexpectedly.
     863             :      */
     864         236 :     WriteDataChunksForTocEntry(AH, te);
     865             : 
     866         236 :     return 0;
     867             : }
     868             : 
     869             : /*
     870             :  * This function is executed in the child of a parallel restore from a
     871             :  * directory-format archive and restores the actual data for one TOC entry.
     872             :  */
     873             : static int
     874          92 : _WorkerJobRestoreDirectory(ArchiveHandle *AH, TocEntry *te)
     875             : {
     876          92 :     return parallel_restore(AH, te);
     877             : }

Generated by: LCOV version 1.14