/*------------------------------------------------------------------------- * * catalog.c: backup catalog opration * * Portions Copyright (c) 2009-2011, NIPPON TELEGRAPH AND TELEPHONE CORPORATION * Portions Copyright (c) 2015-2017, Postgres Professional * *------------------------------------------------------------------------- */ #include "pg_probackup.h" #include #include #include #include #include #include #include #include #include #include #include "pgut/pgut-port.h" static pgBackup *read_backup_from_file(const char *path); #define BOOL_TO_STR(val) ((val) ? "true" : "false") static bool exit_hook_registered = false; static char lock_file[MAXPGPATH]; static void unlink_lock_atexit(void) { int res; res = unlink(lock_file); if (res != 0 && res != ENOENT) elog(WARNING, "%s: %s", lock_file, strerror(errno)); } /* * Create a lockfile. */ void catalog_lock(bool check_catalog) { int fd; char buffer[MAXPGPATH * 2 + 256]; int ntries; int len; int encoded_pid; pid_t my_pid, my_p_pid; join_path_components(lock_file, backup_path, BACKUP_CATALOG_PID); /* * If the PID in the lockfile is our own PID or our parent's or * grandparent's PID, then the file must be stale (probably left over from * a previous system boot cycle). We need to check this because of the * likelihood that a reboot will assign exactly the same PID as we had in * the previous reboot, or one that's only one or two counts larger and * hence the lockfile's PID now refers to an ancestor shell process. We * allow pg_ctl to pass down its parent shell PID (our grandparent PID) * via the environment variable PG_GRANDPARENT_PID; this is so that * launching the postmaster via pg_ctl can be just as reliable as * launching it directly. There is no provision for detecting * further-removed ancestor processes, but if the init script is written * carefully then all but the immediate parent shell will be root-owned * processes and so the kill test will fail with EPERM. Note that we * cannot get a false negative this way, because an existing postmaster * would surely never launch a competing postmaster or pg_ctl process * directly. */ my_pid = getpid(); #ifndef WIN32 my_p_pid = getppid(); #else /* * Windows hasn't got getppid(), but doesn't need it since it's not using * real kill() either... */ my_p_pid = 0; #endif /* * We need a loop here because of race conditions. But don't loop forever * (for example, a non-writable $backup_path directory might cause a failure * that won't go away). 100 tries seems like plenty. */ for (ntries = 0;; ntries++) { /* * Try to create the lock file --- O_EXCL makes this atomic. * * Think not to make the file protection weaker than 0600. See * comments below. */ fd = open(lock_file, O_RDWR | O_CREAT | O_EXCL, 0600); if (fd >= 0) break; /* Success; exit the retry loop */ /* * Couldn't create the pid file. Probably it already exists. */ if ((errno != EEXIST && errno != EACCES) || ntries > 100) elog(ERROR, "could not create lock file \"%s\": %s", lock_file, strerror(errno)); /* * Read the file to get the old owner's PID. Note race condition * here: file might have been deleted since we tried to create it. */ fd = open(lock_file, O_RDONLY, 0600); if (fd < 0) { if (errno == ENOENT) continue; /* race condition; try again */ elog(ERROR, "could not open lock file \"%s\": %s", lock_file, strerror(errno)); } if ((len = read(fd, buffer, sizeof(buffer) - 1)) < 0) elog(ERROR, "could not read lock file \"%s\": %s", lock_file, strerror(errno)); close(fd); if (len == 0) elog(ERROR, "lock file \"%s\" is empty", lock_file); buffer[len] = '\0'; encoded_pid = atoi(buffer); if (encoded_pid <= 0) elog(ERROR, "bogus data in lock file \"%s\": \"%s\"", lock_file, buffer); /* * Check to see if the other process still exists * * Per discussion above, my_pid, my_p_pid can be * ignored as false matches. * * Normally kill() will fail with ESRCH if the given PID doesn't * exist. */ if (encoded_pid != my_pid && encoded_pid != my_p_pid) { if (kill(encoded_pid, 0) == 0 || (errno != ESRCH && errno != EPERM)) elog(ERROR, "lock file \"%s\" already exists", lock_file); } /* * Looks like nobody's home. Unlink the file and try again to create * it. Need a loop because of possible race condition against other * would-be creators. */ if (unlink(lock_file) < 0) elog(ERROR, "could not remove old lock file \"%s\": %s", lock_file, strerror(errno)); } /* * Successfully created the file, now fill it. */ snprintf(buffer, sizeof(buffer), "%d\n", my_pid); errno = 0; if (write(fd, buffer, strlen(buffer)) != strlen(buffer)) { int save_errno = errno; close(fd); unlink(lock_file); /* if write didn't set errno, assume problem is no disk space */ errno = save_errno ? save_errno : ENOSPC; elog(ERROR, "could not write lock file \"%s\": %s", lock_file, strerror(errno)); } if (fsync(fd) != 0) { int save_errno = errno; close(fd); unlink(lock_file); errno = save_errno; elog(ERROR, "could not write lock file \"%s\": %s", lock_file, strerror(errno)); } if (close(fd) != 0) { int save_errno = errno; unlink(lock_file); errno = save_errno; elog(ERROR, "could not write lock file \"%s\": %s", lock_file, strerror(errno)); } /* * Arrange to unlink the lock file(s) at proc_exit. */ if (!exit_hook_registered) { atexit(unlink_lock_atexit); exit_hook_registered = true; } if (check_catalog) { uint64 id; Assert(pgdata); /* Check system-identifier */ id = get_system_identifier(true); if (id != system_identifier) elog(ERROR, "Backup directory was initialized for system id = %ld, but target system id = %ld", system_identifier, id); } } /* * Create a pgBackup which taken at timestamp. * If no backup matches, return NULL. */ pgBackup * read_backup(time_t timestamp) { pgBackup tmp; char conf_path[MAXPGPATH]; tmp.start_time = timestamp; pgBackupGetPath(&tmp, conf_path, lengthof(conf_path), BACKUP_CONF_FILE); return read_backup_from_file(conf_path); } static bool IsDir(const char *dirpath, const char *entry) { char path[MAXPGPATH]; struct stat st; snprintf(path, MAXPGPATH, "%s/%s", dirpath, entry); return stat(path, &st) == 0 && S_ISDIR(st.st_mode); } /* * Create list fo backups started between begin and end from backup catalog. * If range was NULL, all of backup are listed. * The list is sorted in order of descending start time. */ parray * catalog_get_backup_list(time_t backup_id) { DIR *date_dir = NULL; struct dirent *date_ent = NULL; DIR *time_dir = NULL; char backups_path[MAXPGPATH]; char date_path[MAXPGPATH]; parray *backups = NULL; pgBackup *backup = NULL; /* open backup root directory */ join_path_components(backups_path, backup_path, BACKUPS_DIR); date_dir = opendir(backups_path); if (date_dir == NULL) { elog(WARNING, "cannot open directory \"%s\": %s", backups_path, strerror(errno)); goto err_proc; } /* scan date/time directories and list backups in the range */ backups = parray_new(); for (; (date_ent = readdir(date_dir)) != NULL; errno = 0) { char ini_path[MAXPGPATH]; /* skip not-directory entries and hidden entries */ if (!IsDir(backups_path, date_ent->d_name) || date_ent->d_name[0] == '.') continue; /* open subdirectory (date directory) and search time directory */ join_path_components(date_path, backups_path, date_ent->d_name); /* read backup information from backup.ini */ snprintf(ini_path, MAXPGPATH, "%s/%s", date_path, BACKUP_CONF_FILE); backup = read_backup_from_file(ini_path); /* ignore corrupted backup */ if (backup) { if (backup_id != 0 && backup_id != backup->start_time) { pgBackupFree(backup); continue; } parray_append(backups, backup); backup = NULL; } if (errno && errno != ENOENT) { elog(WARNING, "cannot read date directory \"%s\": %s", date_ent->d_name, strerror(errno)); goto err_proc; } } if (errno) { elog(WARNING, "cannot read backup root directory \"%s\": %s", backups_path, strerror(errno)); goto err_proc; } closedir(date_dir); date_dir = NULL; parray_qsort(backups, pgBackupCompareIdDesc); return backups; err_proc: if (time_dir) closedir(time_dir); if (date_dir) closedir(date_dir); if (backup) pgBackupFree(backup); if (backups) parray_walk(backups, pgBackupFree); parray_free(backups); return NULL; } /* * Find the last completed database backup from the backup list. */ pgBackup * catalog_get_last_data_backup(parray *backup_list, TimeLineID tli) { int i; pgBackup *backup = NULL; /* backup_list is sorted in order of descending ID */ for (i = 0; i < parray_num(backup_list); i++) { backup = (pgBackup *) parray_get(backup_list, i); /* * We need completed database backup in the case of a full or * differential backup on current timeline. */ if (backup->status == BACKUP_STATUS_OK && backup->tli == tli && (backup->backup_mode == BACKUP_MODE_DIFF_PAGE || backup->backup_mode == BACKUP_MODE_DIFF_PTRACK || backup->backup_mode == BACKUP_MODE_FULL)) return backup; } return NULL; } /* create backup directory in $BACKUP_PATH */ int pgBackupCreateDir(pgBackup *backup) { int i; char path[MAXPGPATH]; char *subdirs[] = { DATABASE_DIR, NULL }; pgBackupGetPath(backup, path, lengthof(path), NULL); if (!dir_is_empty(path)) elog(ERROR, "backup destination is not empty \"%s\"", path); dir_create_dir(path, DIR_PERMISSION); /* create directories for actual backup files */ for (i = 0; subdirs[i]; i++) { pgBackupGetPath(backup, path, lengthof(path), subdirs[i]); dir_create_dir(path, DIR_PERMISSION); } return 0; } /* * Write configuration section of backup.in to stream "out". */ void pgBackupWriteConfigSection(FILE *out, pgBackup *backup) { static const char *modes[] = { "", "PAGE", "PTRACK", "FULL"}; fprintf(out, "# configuration\n"); fprintf(out, "BACKUP_MODE=%s\n", modes[backup->backup_mode]); } /* * Write result section of backup.in to stream "out". */ void pgBackupWriteResultSection(FILE *out, pgBackup *backup) { char timestamp[20]; fprintf(out, "# result\n"); fprintf(out, "TIMELINEID=%d\n", backup->tli); fprintf(out, "START_LSN=%x/%08x\n", (uint32) (backup->start_lsn >> 32), (uint32) backup->start_lsn); fprintf(out, "STOP_LSN=%x/%08x\n", (uint32) (backup->stop_lsn >> 32), (uint32) backup->stop_lsn); time2iso(timestamp, lengthof(timestamp), backup->start_time); fprintf(out, "START_TIME='%s'\n", timestamp); if (backup->end_time > 0) { time2iso(timestamp, lengthof(timestamp), backup->end_time); fprintf(out, "END_TIME='%s'\n", timestamp); } fprintf(out, "RECOVERY_XID=" XID_FMT "\n", backup->recovery_xid); if (backup->recovery_time > 0) { time2iso(timestamp, lengthof(timestamp), backup->recovery_time); fprintf(out, "RECOVERY_TIME='%s'\n", timestamp); } if (backup->data_bytes != BYTES_INVALID) fprintf(out, "DATA_BYTES=" INT64_FORMAT "\n", backup->data_bytes); fprintf(out, "BLOCK_SIZE=%u\n", backup->block_size); fprintf(out, "XLOG_BLOCK_SIZE=%u\n", backup->wal_block_size); fprintf(out, "CHECKSUM_VERSION=%u\n", backup->checksum_version); fprintf(out, "STREAM=%u\n", backup->stream); fprintf(out, "STATUS=%s\n", status2str(backup->status)); if (backup->parent_backup != 0) { char *parent_backup = base36enc(backup->parent_backup); fprintf(out, "PARENT_BACKUP='%s'\n", parent_backup); free(parent_backup); } } /* create backup.conf */ void pgBackupWriteIni(pgBackup *backup) { FILE *fp = NULL; char ini_path[MAXPGPATH]; pgBackupGetPath(backup, ini_path, lengthof(ini_path), BACKUP_CONF_FILE); fp = fopen(ini_path, "wt"); if (fp == NULL) elog(ERROR, "cannot open configuration file \"%s\": %s", ini_path, strerror(errno)); /* configuration section */ pgBackupWriteConfigSection(fp, backup); /* result section */ pgBackupWriteResultSection(fp, backup); fclose(fp); } /* * Read backup.ini and create pgBackup. * - Comment starts with ';'. * - Do not care section. */ static pgBackup * read_backup_from_file(const char *path) { pgBackup *backup; char *backup_mode = NULL; char *start_lsn = NULL; char *stop_lsn = NULL; char *status = NULL; char *parent_backup = NULL; int i; pgut_option options[] = { {'s', 0, "backup-mode", NULL, SOURCE_FILE_STRICT}, {'u', 0, "timelineid", NULL, SOURCE_FILE_STRICT}, {'s', 0, "start-lsn", NULL, SOURCE_FILE_STRICT}, {'s', 0, "stop-lsn", NULL, SOURCE_FILE_STRICT}, {'t', 0, "start-time", NULL, SOURCE_FILE_STRICT}, {'t', 0, "end-time", NULL, SOURCE_FILE_STRICT}, {'U', 0, "recovery-xid", NULL, SOURCE_FILE_STRICT}, {'t', 0, "recovery-time", NULL, SOURCE_FILE_STRICT}, {'I', 0, "data-bytes", NULL, SOURCE_FILE_STRICT}, {'u', 0, "block-size", NULL, SOURCE_FILE_STRICT}, {'u', 0, "xlog-block-size", NULL, SOURCE_FILE_STRICT}, {'u', 0, "checksum_version", NULL, SOURCE_FILE_STRICT}, {'u', 0, "stream", NULL, SOURCE_FILE_STRICT}, {'s', 0, "status", NULL, SOURCE_FILE_STRICT}, {'s', 0, "parent_backup", NULL, SOURCE_FILE_STRICT}, {0} }; if (access(path, F_OK) != 0) return NULL; backup = pgut_new(pgBackup); init_backup(backup); i = 0; options[i++].var = &backup_mode; options[i++].var = &backup->tli; options[i++].var = &start_lsn; options[i++].var = &stop_lsn; options[i++].var = &backup->start_time; options[i++].var = &backup->end_time; options[i++].var = &backup->recovery_xid; options[i++].var = &backup->recovery_time; options[i++].var = &backup->data_bytes; options[i++].var = &backup->block_size; options[i++].var = &backup->wal_block_size; options[i++].var = &backup->checksum_version; options[i++].var = &backup->stream; options[i++].var = &status; options[i++].var = &parent_backup; Assert(i == lengthof(options) - 1); pgut_readopt(path, options, ERROR); if (backup_mode) { backup->backup_mode = parse_backup_mode(backup_mode); free(backup_mode); } if (start_lsn) { uint32 xlogid; uint32 xrecoff; if (sscanf(start_lsn, "%X/%X", &xlogid, &xrecoff) == 2) backup->start_lsn = (XLogRecPtr) ((uint64) xlogid << 32) | xrecoff; else elog(WARNING, "invalid START_LSN \"%s\"", start_lsn); free(start_lsn); } if (stop_lsn) { uint32 xlogid; uint32 xrecoff; if (sscanf(stop_lsn, "%X/%X", &xlogid, &xrecoff) == 2) backup->stop_lsn = (XLogRecPtr) ((uint64) xlogid << 32) | xrecoff; else elog(WARNING, "invalid STOP_LSN \"%s\"", stop_lsn); free(stop_lsn); } if (status) { if (strcmp(status, "OK") == 0) backup->status = BACKUP_STATUS_OK; else if (strcmp(status, "RUNNING") == 0) backup->status = BACKUP_STATUS_RUNNING; else if (strcmp(status, "ERROR") == 0) backup->status = BACKUP_STATUS_ERROR; else if (strcmp(status, "DELETING") == 0) backup->status = BACKUP_STATUS_DELETING; else if (strcmp(status, "DELETED") == 0) backup->status = BACKUP_STATUS_DELETED; else if (strcmp(status, "DONE") == 0) backup->status = BACKUP_STATUS_DONE; else if (strcmp(status, "CORRUPT") == 0) backup->status = BACKUP_STATUS_CORRUPT; else elog(WARNING, "invalid STATUS \"%s\"", status); free(status); } if (parent_backup) { backup->parent_backup = base36dec(parent_backup); free(parent_backup); } return backup; } BackupMode parse_backup_mode(const char *value) { const char *v = value; size_t len; /* Skip all spaces detected */ while (IsSpace(*v)) v++; len = strlen(v); if (len > 0 && pg_strncasecmp("full", v, strlen("full")) == 0) return BACKUP_MODE_FULL; else if (len > 0 && pg_strncasecmp("page", v, strlen("page")) == 0) return BACKUP_MODE_DIFF_PAGE; else if (len > 0 && pg_strncasecmp("ptrack", v, strlen("ptrack")) == 0) return BACKUP_MODE_DIFF_PTRACK; /* Backup mode is invalid, so leave with an error */ elog(ERROR, "invalid backup-mode \"%s\"", value); return BACKUP_MODE_INVALID; } /* free pgBackup object */ void pgBackupFree(void *backup) { free(backup); } /* Compare two pgBackup with their IDs (start time) in ascending order */ int pgBackupCompareId(const void *l, const void *r) { pgBackup *lp = *(pgBackup **)l; pgBackup *rp = *(pgBackup **)r; if (lp->start_time > rp->start_time) return 1; else if (lp->start_time < rp->start_time) return -1; else return 0; } /* Compare two pgBackup with their IDs in descending order */ int pgBackupCompareIdDesc(const void *l, const void *r) { return -pgBackupCompareId(l, r); } /* * Construct absolute path of the backup directory. * If subdir is not NULL, it will be appended after the path. */ void pgBackupGetPath(const pgBackup *backup, char *path, size_t len, const char *subdir) { char *datetime; datetime = base36enc(backup->start_time); if (subdir) snprintf(path, len, "%s/%s/%s/%s", backup_path, BACKUPS_DIR, datetime, subdir); else snprintf(path, len, "%s/%s/%s", backup_path, BACKUPS_DIR, datetime); free(datetime); make_native_path(path); } void init_backup(pgBackup *backup) { backup->backup_mode = BACKUP_MODE_INVALID; backup->status = BACKUP_STATUS_INVALID; backup->tli = 0; backup->start_lsn = 0; backup->stop_lsn = 0; backup->start_time = (time_t) 0; backup->end_time = (time_t) 0; backup->recovery_xid = 0; backup->recovery_time = (time_t) 0; backup->data_bytes = BYTES_INVALID; backup->stream = false; backup->parent_backup = 0; }