Skip to content

Commit 6ee78a3

Browse files
knizhnikKonstantin Knizhnik
authored andcommitted
On demand downloading of SLRU segments (#332)
* On demand downloading of SLRU segments * Fix smgr_read_slru_segment * Determine SLRU kind in extension * Use ctl->PagePrecedes for SLRU page comparison in SimpleLruDownloadSegment to address wraparround --------- Co-authored-by: Konstantin Knizhnik <[email protected]>
1 parent 0ff55c5 commit 6ee78a3

File tree

3 files changed

+112
-14
lines changed

3 files changed

+112
-14
lines changed

src/backend/access/transam/slru.c

+92-13
Original file line numberDiff line numberDiff line change
@@ -59,6 +59,7 @@
5959
#include "pgstat.h"
6060
#include "storage/fd.h"
6161
#include "storage/shmem.h"
62+
#include "storage/smgr.h"
6263

6364
#define SlruFileName(ctl, path, seg) \
6465
snprintf(path, MAXPGPATH, "%s/%04X", (ctl)->Dir, seg)
@@ -617,6 +618,66 @@ SimpleLruWritePage(SlruCtl ctl, int slotno)
617618
SlruInternalWritePage(ctl, slotno, NULL);
618619
}
619620

621+
622+
/*
623+
* NEON: we do not want to include large pg_xact/multixact files in basebackup and prefer
624+
* to download them on demand to reduce startup time.
625+
* If SLRU segment is not found, we try to download it from page server
626+
*/
627+
static int
628+
SimpleLruDownloadSegment(SlruCtl ctl, int pageno, char const* path)
629+
{
630+
int segno;
631+
int fd = -1;
632+
int n_blocks;
633+
char* buffer;
634+
635+
static SMgrRelationData dummy_smgr_rel = {0};
636+
637+
/* If page is greater than latest written page, then do not try to download segment from server */
638+
if (ctl->PagePrecedes(ctl->shared->latest_page_number, pageno))
639+
return -1;
640+
641+
if (!dummy_smgr_rel.smgr)
642+
{
643+
RelFileNode rnode = {0};
644+
dummy_smgr_rel.smgr = smgr(InvalidBackendId, rnode);
645+
}
646+
segno = pageno / SLRU_PAGES_PER_SEGMENT;
647+
648+
buffer = palloc(BLCKSZ * SLRU_PAGES_PER_SEGMENT);
649+
n_blocks = smgr_read_slru_segment(&dummy_smgr_rel, path, segno, buffer);
650+
if (n_blocks > 0)
651+
{
652+
fd = OpenTransientFile(path, O_RDWR | O_CREAT | PG_BINARY);
653+
if (fd < 0)
654+
{
655+
slru_errcause = SLRU_OPEN_FAILED;
656+
slru_errno = errno;
657+
pfree(buffer);
658+
return -1;
659+
}
660+
errno = 0;
661+
pgstat_report_wait_start(WAIT_EVENT_SLRU_WRITE);
662+
if (pg_pwrite(fd, buffer, n_blocks*BLCKSZ, 0) != n_blocks*BLCKSZ)
663+
{
664+
pgstat_report_wait_end();
665+
/* if write didn't set errno, assume problem is no disk space */
666+
if (errno == 0)
667+
errno = ENOSPC;
668+
slru_errcause = SLRU_WRITE_FAILED;
669+
slru_errno = errno;
670+
671+
CloseTransientFile(fd);
672+
pfree(buffer);
673+
return -1;
674+
}
675+
pgstat_report_wait_end();
676+
}
677+
pfree(buffer);
678+
return fd;
679+
}
680+
620681
/*
621682
* Return whether the given page exists on disk.
622683
*
@@ -644,12 +705,18 @@ SimpleLruDoesPhysicalPageExist(SlruCtl ctl, int pageno)
644705
{
645706
/* expected: file doesn't exist */
646707
if (errno == ENOENT)
647-
return false;
648-
649-
/* report error normally */
650-
slru_errcause = SLRU_OPEN_FAILED;
651-
slru_errno = errno;
652-
SlruReportIOError(ctl, pageno, 0);
708+
{
709+
fd = SimpleLruDownloadSegment(ctl, pageno, path);
710+
if (fd < 0)
711+
return false;
712+
}
713+
else
714+
{
715+
/* report error normally */
716+
slru_errcause = SLRU_OPEN_FAILED;
717+
slru_errno = errno;
718+
SlruReportIOError(ctl, pageno, 0);
719+
}
653720
}
654721

655722
if ((endpos = lseek(fd, 0, SEEK_END)) < 0)
@@ -703,18 +770,30 @@ SlruPhysicalReadPage(SlruCtl ctl, int pageno, int slotno)
703770
fd = OpenTransientFile(path, O_RDONLY | PG_BINARY);
704771
if (fd < 0)
705772
{
706-
if (errno != ENOENT || !InRecovery)
773+
if (errno != ENOENT)
707774
{
708775
slru_errcause = SLRU_OPEN_FAILED;
709776
slru_errno = errno;
710777
return false;
711778
}
712-
713-
ereport(LOG,
714-
(errmsg("file \"%s\" doesn't exist, reading as zeroes",
715-
path)));
716-
MemSet(shared->page_buffer[slotno], 0, BLCKSZ);
717-
return true;
779+
fd = SimpleLruDownloadSegment(ctl, pageno, path);
780+
if (fd < 0)
781+
{
782+
if (!InRecovery)
783+
{
784+
slru_errcause = SLRU_OPEN_FAILED;
785+
slru_errno = errno;
786+
return false;
787+
}
788+
else
789+
{
790+
ereport(LOG,
791+
(errmsg("file \"%s\" doesn't exist, reading as zeroes",
792+
path)));
793+
MemSet(shared->page_buffer[slotno], 0, BLCKSZ);
794+
return true;
795+
}
796+
}
718797
}
719798

720799
errno = 0;

src/backend/storage/smgr/smgr.c

+16
Original file line numberDiff line numberDiff line change
@@ -570,6 +570,22 @@ smgrwrite(SMgrRelation reln, ForkNumber forknum, BlockNumber blocknum,
570570
buffer, skipFsync);
571571
}
572572

573+
/*
574+
* NEON: we do not want to include large pg_xact/multixact files in basebackup and prefer
575+
* to download them on demand to reduce startup time.
576+
* If SLRU segment is not found, we try to download it from page server
577+
*
578+
* This function returns number of blocks in segment. Usually it should be SLRU_PAGES_PER_SEGMENT but in case
579+
* of partial segment, it can be smaller. Zero value means that segment doesn't exist.
580+
* From Postgres point of view empty segment is the same as absent segment.
581+
*/
582+
int
583+
smgr_read_slru_segment(SMgrRelation reln, const char* path, int segno, void* buffer)
584+
{
585+
return (*reln->smgr).smgr_read_slru_segment ? (*reln->smgr).smgr_read_slru_segment(reln, path, segno, buffer) : 0;
586+
}
587+
588+
573589

574590
/*
575591
* smgrwriteback() -- Trigger kernel writeback for the supplied range of

src/include/storage/smgr.h

+4-1
Original file line numberDiff line numberDiff line change
@@ -88,7 +88,6 @@ typedef SMgrRelationData *SMgrRelation;
8888
#define SmgrIsTemp(smgr) \
8989
RelFileNodeBackendIsTemp((smgr)->smgr_rnode)
9090

91-
9291
/*
9392
* This struct of function pointers defines the API between smgr.c and
9493
* any individual storage manager module. Note that smgr subfunctions are
@@ -129,6 +128,8 @@ typedef struct f_smgr
129128
void (*smgr_start_unlogged_build) (SMgrRelation reln);
130129
void (*smgr_finish_unlogged_build_phase_1) (SMgrRelation reln);
131130
void (*smgr_end_unlogged_build) (SMgrRelation reln);
131+
132+
int (*smgr_read_slru_segment) (SMgrRelation reln, const char *path, int segno, void* buffer);
132133
} f_smgr;
133134

134135
typedef void (*smgr_init_hook_type) (void);
@@ -183,4 +184,6 @@ extern void smgr_start_unlogged_build(SMgrRelation reln);
183184
extern void smgr_finish_unlogged_build_phase_1(SMgrRelation reln);
184185
extern void smgr_end_unlogged_build(SMgrRelation reln);
185186

187+
extern int smgr_read_slru_segment(SMgrRelation reln, const char *path, int segno, void* buffer);
188+
186189
#endif /* SMGR_H */

0 commit comments

Comments
 (0)