1
0
mirror of https://github.com/postgrespro/pg_probackup.git synced 2025-01-25 11:53:32 +02:00
pg_probackup/tests/archive.py

1697 lines
57 KiB
Python
Raw Normal View History

2017-07-12 17:28:28 +03:00
import os
import shutil
2018-10-18 15:05:51 +03:00
import gzip
2017-07-12 17:28:28 +03:00
import unittest
2018-11-24 22:57:27 +03:00
from .helpers.ptrack_helpers import ProbackupTest, ProbackupException, GdbException
2017-07-12 17:28:28 +03:00
from datetime import datetime, timedelta
import subprocess
from sys import exit
from time import sleep
2019-09-17 17:35:27 +03:00
from distutils.dir_util import copy_tree
2017-07-12 17:28:28 +03:00
module_name = 'archive'
class ArchiveTest(ProbackupTest, unittest.TestCase):
# @unittest.expectedFailure
# @unittest.skip("skip")
def test_pgpro434_1(self):
    """
    Scenario described in jira issue PGPRO-434.

    Back up and restore an archiving node, then drop and re-create the
    backup catalog, back up and restore again, and verify that t_heap
    still holds the rows captured before the very first backup.
    """
    test_name = self.id().split('.')[3]
    catalog = os.path.join(self.tmp_path, module_name, test_name, 'backup')
    node_dir = os.path.join(module_name, test_name, 'node')
    node = self.make_simple_node(
        base_dir=node_dir,
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={'checkpoint_timeout': '30s'})

    self.init_pb(catalog)
    self.add_instance(catalog, 'node', node)
    self.set_archiving(catalog, 'node', node)
    node.slow_start()

    node.safe_psql(
        "postgres",
        "create table t_heap as select 1 as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector from "
        "generate_series(0,100) i")
    # Reference content every later restore is compared against.
    expected = node.safe_psql("postgres", "SELECT * FROM t_heap")

    # First round: backup, clean the node, restore, start.
    self.backup_node(catalog, 'node', node)
    node.cleanup()
    self.restore_node(catalog, 'node', node)
    node.slow_start()

    # Recreate backup catalog
    self.clean_pb(catalog)
    self.init_pb(catalog)
    self.add_instance(catalog, 'node', node)

    # Second round against the fresh catalog.
    self.backup_node(catalog, 'node', node)
    node.cleanup()
    self.restore_node(catalog, 'node', node)
    node.slow_start()

    restored = node.safe_psql("postgres", "SELECT * FROM t_heap")
    self.assertEqual(
        expected, restored,
        'data after restore not equal to original data')

    # Clean after yourself
    self.del_test_dir(module_name, test_name)
# @unittest.skip("skip")
# @unittest.expectedFailure
2017-07-12 17:28:28 +03:00
def test_pgpro434_2(self):
    """
    Check that timelines are correct.
    WAITING PGPRO-1053 for --immediate

    The node is restored with '--immediate' and promoted five times in a
    row. Rows with id > 100500 are always inserted after a backup, so they
    must never be visible after a restore.
    """
    test_name = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, test_name, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, test_name, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={'checkpoint_timeout': '30s'})

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node)
    node.slow_start()

    def start_new_timeline():
        # Clean the node, restore it with --immediate and promote it.
        node.cleanup()
        self.restore_node(
            backup_dir, 'node', node,
            options=['--immediate', '--recovery-target-action=promote'])
        node.slow_start()

    def print_redo_wal_file():
        # Debug output only; callers guard it with self.verbose.
        print(node.safe_psql(
            "postgres",
            "select redo_wal_file from pg_control_checkpoint()"))

    # FIRST TIMELINE
    node.safe_psql(
        "postgres",
        "create table t_heap as select 1 as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,100) i")
    self.backup_node(backup_dir, 'node', node)
    node.safe_psql(
        "postgres",
        "insert into t_heap select 100501 as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,1) i")

    # SECOND TIMELINE
    start_new_timeline()
    if self.verbose:
        print_redo_wal_file()

    row_100501_present = node.execute(
        "postgres",
        "select exists(select 1 "
        "from t_heap where id = 100501)")[0][0]
    self.assertFalse(
        row_100501_present,
        'data after restore not equal to original data')

    node.safe_psql(
        "postgres",
        "insert into t_heap select 2 as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(100,200) i")
    self.backup_node(backup_dir, 'node', node)
    node.safe_psql(
        "postgres",
        "insert into t_heap select 100502 as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,256) i")

    # THIRD TIMELINE
    start_new_timeline()
    if self.verbose:
        print_redo_wal_file()

    node.safe_psql(
        "postgres",
        "insert into t_heap select 3 as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(200,300) i")
    self.backup_node(backup_dir, 'node', node)

    # Content as of the last backup; the final restore must match it.
    expected = node.safe_psql("postgres", "SELECT * FROM t_heap")

    node.safe_psql(
        "postgres",
        "insert into t_heap select 100503 as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,256) i")

    # FOURTH, FIFTH and SIXTH TIMELINE: restore and promote, no new data
    for label in ('Fourth timeline', 'Fifth timeline', 'Sixth timeline'):
        start_new_timeline()
        if self.verbose:
            print(label)
            print_redo_wal_file()

    late_rows_present = node.execute(
        "postgres",
        "select exists(select 1 from t_heap where id > 100500)")[0][0]
    self.assertFalse(
        late_rows_present,
        'data after restore not equal to original data')

    self.assertEqual(
        expected,
        node.safe_psql(
            "postgres",
            "SELECT * FROM t_heap"),
        'data after restore not equal to original data')

    # Clean after yourself
    self.del_test_dir(module_name, test_name)
2017-07-12 17:28:28 +03:00
# @unittest.skip("skip")
def test_pgpro434_3(self):
    """
    Check pg_stop_backup_timeout, needed backup_timeout
    Fixed in commit d84d79668b0c139 and assert fixed by ptrack 1.7

    The backup is paused under gdb at pg_stop_backup, archive_command is
    replaced with a failing one, and the backup is then expected to end
    with a timeout error after 60 seconds without a failed assertion
    showing up in the PostgreSQL log.
    """
    test_name = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, test_name, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, test_name, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'])

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node)
    node.slow_start()

    backup_options = ["--archive-timeout=60", "--log-level-file=info"]
    gdb = self.backup_node(
        backup_dir, 'node', node,
        options=backup_options,
        gdb=True)

    gdb.set_breakpoint('pg_stop_backup')
    gdb.run_until_break()

    # Break archiving while the backup is stopped at the breakpoint.
    self.set_auto_conf(node, {'archive_command': "'exit 1'"})
    node.reload()

    gdb.continue_execution_until_exit()

    probackup_log = os.path.join(backup_dir, 'log', 'pg_probackup.log')
    with open(probackup_log, 'r') as f:
        probackup_output = f.read()

    # in PG =< 9.6 pg_stop_backup always wait
    if self.get_version(node) < 100000:
        expected_error = (
            "ERROR: pg_stop_backup doesn't answer in 60 seconds, cancel it")
    else:
        expected_error = (
            "ERROR: WAL segment 000000010000000000000002 could not be archived in 60 seconds")
    self.assertIn(expected_error, probackup_output)

    postgres_log = os.path.join(node.logs_dir, 'postgresql.log')
    with open(postgres_log, 'r') as f:
        postgres_output = f.read()

    self.assertNotIn(
        'FailedAssertion',
        postgres_output,
        'PostgreSQL crashed because of a failed assert')

    # Clean after yourself
    self.del_test_dir(module_name, test_name)
# @unittest.skip("skip")
def test_pgpro434_4(self):
    """
    Check pg_stop_backup_timeout, needed backup_timeout
    Fixed in commit d84d79668b0c139 and assert fixed by ptrack 1.7

    The backup is paused under gdb at pg_stop_backup and archive_command
    is replaced with a failing one. A second gdb is attached to the
    backend serving pg_probackup with a breakpoint on do_pg_stop_backup.
    The backup is then expected to report that pg_stop_backup does not
    answer in 60 seconds, and the PostgreSQL log must not contain a
    failed assertion.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'])

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node)
    node.slow_start()

    gdb = self.backup_node(
        backup_dir, 'node', node,
        options=[
            "--archive-timeout=60",
            "--log-level-file=info"],
        gdb=True)

    gdb.set_breakpoint('pg_stop_backup')
    gdb.run_until_break()

    self.set_auto_conf(node, {'archive_command': "'exit 1'"})
    node.reload()

    # Look up the backend pid under a different application name, so the
    # lookup session itself cannot match the 'pg_probackup' filter.
    # try/finally guarantees PGAPPNAME is put back even when the query
    # fails; otherwise the "foo" override would leak into later tests.
    os.environ["PGAPPNAME"] = "foo"
    try:
        pid = node.safe_psql(
            "postgres",
            "SELECT pid "
            "FROM pg_stat_activity "
            "WHERE application_name = 'pg_probackup'").rstrip()
    finally:
        os.environ["PGAPPNAME"] = "pg_probackup"

    postgres_gdb = self.gdb_attach(pid)
    postgres_gdb.set_breakpoint('do_pg_stop_backup')
    postgres_gdb.continue_execution_until_running()

    gdb.continue_execution_until_exit()

    log_file = os.path.join(backup_dir, 'log', 'pg_probackup.log')
    with open(log_file, 'r') as f:
        log_content = f.read()

    self.assertIn(
        "ERROR: pg_stop_backup doesn't answer in 60 seconds, cancel it",
        log_content)

    log_file = os.path.join(node.logs_dir, 'postgresql.log')
    with open(log_file, 'r') as f:
        log_content = f.read()

    self.assertNotIn(
        'FailedAssertion',
        log_content,
        'PostgreSQL crashed because of a failed assert')

    # Clean after yourself
    self.del_test_dir(module_name, fname)
# @unittest.skip("skip")
def test_archive_push_file_exists(self):
    """
    Archive-push if file exists.

    A garbage file is planted in the archive under the name of the first
    WAL segment. The first archiving attempt is expected to fail with an
    'already exists' error. After the planted file is replaced with a
    copy of the real segment, archive-push is expected to succeed.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={
            'checkpoint_timeout': '30s'})

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node)

    wals_dir = os.path.join(backup_dir, 'wal', 'node')
    if self.archive_compress:
        filename = '000000010000000000000001.gz'
    else:
        filename = '000000010000000000000001'
    archived_wal = os.path.join(wals_dir, filename)

    # Binary append mode: the payload is a bytes literal, and writing
    # bytes through a text-mode handle raises TypeError on Python 3.
    # The with-block flushes and closes the file on exit.
    with open(archived_wal, 'ab') as f:
        f.write(b"blablablaadssaaaaaaaaaaaaaaa")

    node.slow_start()
    node.safe_psql(
        "postgres",
        "create table t_heap as select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,100500) i")
    log_file = os.path.join(node.logs_dir, 'postgresql.log')

    self.switch_wal_segment(node)
    sleep(1)

    with open(log_file, 'r') as f:
        log_content = f.read()

    # PostgreSQL separates the severity from the message with a colon
    # and TWO spaces in its server log ("LOG:  ...", "DETAIL:  ...").
    self.assertIn(
        'LOG:  archive command failed with exit code 1',
        log_content)

    self.assertIn(
        'DETAIL:  The failed archive command was:',
        log_content)

    self.assertIn(
        'INFO: pg_probackup archive-push from',
        log_content)

    self.assertIn(
        'ERROR: WAL segment ',
        log_content)

    self.assertIn(
        'already exists.',
        log_content)

    self.assertNotIn(
        'pg_probackup archive-push completed successfully', log_content)

    # WAL directory was renamed from pg_xlog to pg_wal in PostgreSQL 10.
    if self.get_version(node) < 100000:
        wal_src = os.path.join(
            node.data_dir, 'pg_xlog', '000000010000000000000001')
    else:
        wal_src = os.path.join(
            node.data_dir, 'pg_wal', '000000010000000000000001')

    # Replace the garbage with the real segment content.
    if self.archive_compress:
        with open(wal_src, 'rb') as f_in, gzip.open(
                archived_wal, 'wb', compresslevel=1) as f_out:
            shutil.copyfileobj(f_in, f_out)
    else:
        shutil.copyfile(wal_src, archived_wal)

    self.switch_wal_segment(node)
    sleep(5)

    with open(log_file, 'r') as f:
        log_content = f.read()

    self.assertIn(
        'pg_probackup archive-push completed successfully',
        log_content)

    # Clean after yourself
    self.del_test_dir(module_name, fname)
# @unittest.skip("skip")
def test_archive_push_file_exists_overwrite(self):
    """
    Archive-push with overwrite if file exists.

    A garbage file is planted in the archive under the name of the first
    WAL segment. The first archiving attempt is expected to fail with an
    'already exists' error. Archiving is then reconfigured with
    overwrite=True and archive-push is expected to succeed.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={
            'checkpoint_timeout': '30s'})

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node)

    wals_dir = os.path.join(backup_dir, 'wal', 'node')
    if self.archive_compress:
        filename = '000000010000000000000001.gz'
    else:
        filename = '000000010000000000000001'
    archived_wal = os.path.join(wals_dir, filename)

    # Binary append mode: the payload is a bytes literal, and writing
    # bytes through a text-mode handle raises TypeError on Python 3.
    # The with-block flushes and closes the file on exit.
    with open(archived_wal, 'ab') as f:
        f.write(b"blablablaadssaaaaaaaaaaaaaaa")

    node.slow_start()
    node.safe_psql(
        "postgres",
        "create table t_heap as select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,100500) i")
    log_file = os.path.join(node.logs_dir, 'postgresql.log')

    self.switch_wal_segment(node)
    sleep(1)

    with open(log_file, 'r') as f:
        log_content = f.read()

    # PostgreSQL separates the severity from the message with a colon
    # and TWO spaces in its server log ("LOG:  ...", "DETAIL:  ...").
    self.assertIn(
        'LOG:  archive command failed with exit code 1', log_content)
    self.assertIn(
        'DETAIL:  The failed archive command was:', log_content)
    self.assertIn(
        'INFO: pg_probackup archive-push from', log_content)
    self.assertIn(
        '{0}" already exists.'.format(filename), log_content)

    self.assertNotIn(
        'pg_probackup archive-push completed successfully', log_content)

    # Allow archive-push to overwrite the existing segment and retry.
    self.set_archiving(backup_dir, 'node', node, overwrite=True)
    node.reload()
    self.switch_wal_segment(node)
    sleep(2)

    with open(log_file, 'r') as f:
        log_content = f.read()

    self.assertTrue(
        'pg_probackup archive-push completed successfully' in log_content,
        'Expecting messages about successfull execution archive_command')

    # Clean after yourself
    self.del_test_dir(module_name, fname)
2019-06-20 06:54:11 +03:00
# @unittest.skip("skip")
def test_archive_push_partial_file_exists(self):
    """
    Archive-push if stale '.part' file exists.

    A '.part' file is planted in the archive for the current WAL segment
    and left untouched for 70 seconds. The segment is then expected to be
    archived, validation up to a recorded xid must pass, and the
    PostgreSQL log must mention that the stale temporary file was reused.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'])

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node)

    node.slow_start()

    # this backup is needed only for validation to xid
    self.backup_node(backup_dir, 'node', node)

    node.safe_psql(
        "postgres",
        "create table t1(a int)")

    xid = node.safe_psql(
        "postgres",
        "INSERT INTO t1 VALUES (1) RETURNING (xmin)").rstrip()

    # The WAL location functions were renamed in PostgreSQL 10.
    if self.get_version(node) < 100000:
        filename_orig = node.safe_psql(
            "postgres",
            "SELECT file_name "
            "FROM pg_xlogfile_name_offset(pg_current_xlog_location());").rstrip()
    else:
        filename_orig = node.safe_psql(
            "postgres",
            "SELECT file_name "
            "FROM pg_walfile_name_offset(pg_current_wal_flush_lsn());").rstrip()

    # form up path to next .part WAL segment
    wals_dir = os.path.join(backup_dir, 'wal', 'node')
    if self.archive_compress:
        filename = filename_orig + '.gz' + '.part'
    else:
        filename = filename_orig + '.part'
    part_file = os.path.join(wals_dir, filename)

    # emulate stale .part file
    # Binary append mode: the payload is a bytes literal, and writing
    # bytes through a text-mode handle raises TypeError on Python 3.
    with open(part_file, 'ab') as f:
        f.write(b"blahblah")

    self.switch_wal_segment(node)
    # Leave the .part file untouched long enough to be treated as stale.
    sleep(70)

    # check that segment is archived
    if self.archive_compress:
        filename_orig = filename_orig + '.gz'

    archived_file = os.path.join(wals_dir, filename_orig)
    self.assertTrue(os.path.isfile(archived_file))

    # successful validate means that archive-push reused stale wal segment
    self.validate_pb(
        backup_dir, 'node',
        options=['--recovery-target-xid={0}'.format(xid)])

    log_file = os.path.join(node.logs_dir, 'postgresql.log')
    with open(log_file, 'r') as f:
        log_content = f.read()

    self.assertIn(
        'Reusing stale destination temporary WAL file',
        log_content)

    # Clean after yourself
    self.del_test_dir(module_name, fname)
# @unittest.skip("skip")
def test_archive_push_partial_file_exists_not_stale(self):
    """
    Archive-push if .part file exists and it is not stale.

    A '.part' file is planted in the archive for the current WAL segment
    and appended to again 30 seconds later. After a further 40 seconds
    the segment itself is expected NOT to be present in the archive.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'])

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node)

    node.slow_start()

    node.safe_psql(
        "postgres",
        "create table t1()")
    self.switch_wal_segment(node)

    node.safe_psql(
        "postgres",
        "create table t2()")

    # The WAL location functions were renamed in PostgreSQL 10.
    if self.get_version(node) < 100000:
        filename_orig = node.safe_psql(
            "postgres",
            "SELECT file_name "
            "FROM pg_xlogfile_name_offset(pg_current_xlog_location());").rstrip()
    else:
        filename_orig = node.safe_psql(
            "postgres",
            "SELECT file_name "
            "FROM pg_walfile_name_offset(pg_current_wal_flush_lsn());").rstrip()

    # form up path to next .part WAL segment
    wals_dir = os.path.join(backup_dir, 'wal', 'node')
    if self.archive_compress:
        filename = filename_orig + '.gz' + '.part'
    else:
        filename = filename_orig + '.part'
    part_file = os.path.join(wals_dir, filename)

    # Binary append mode: the payload is a bytes literal, and writing
    # bytes through a text-mode handle raises TypeError on Python 3.
    with open(part_file, 'ab') as f:
        f.write(b"blahblah")

    self.switch_wal_segment(node)
    sleep(30)

    # Touch the .part file again so that it keeps changing.
    with open(part_file, 'ab') as f:
        f.write(b"blahblahblahblah")

    sleep(40)

    # check that segment is NOT archived
    if self.archive_compress:
        filename_orig = filename_orig + '.gz'

    archived_file = os.path.join(wals_dir, filename_orig)
    self.assertFalse(os.path.isfile(archived_file))

    # NOTE: a check that postgresql.log contains 'is not stale' was
    # commented out in the original test and is still not performed.

    # Clean after yourself
    self.del_test_dir(module_name, fname)
2017-10-09 15:32:48 +03:00
# @unittest.expectedFailure
2018-11-24 22:57:27 +03:00
# @unittest.skip("skip")
2017-07-12 17:28:28 +03:00
def test_replica_archive(self):
    """
    make node without archiving, take stream backup and
    turn it into replica, set replica with archiving,
    make archive backup from replica

    FULL and PAGE backups taken from the replica are each restored into
    a separate node and compared with the content of the master.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    master = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'master'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={
            'archive_timeout': '10s',
            'checkpoint_timeout': '30s',
            'max_wal_size': '32MB'})

    self.init_pb(backup_dir)
    # ADD INSTANCE 'MASTER'
    self.add_instance(backup_dir, 'master', master)
    master.slow_start()

    replica = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'replica'))
    replica.cleanup()

    master.psql(
        "postgres",
        "create table t_heap as select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,2560) i")

    self.backup_node(backup_dir, 'master', master, options=['--stream'])
    before = master.safe_psql("postgres", "SELECT * FROM t_heap")

    # Settings for Replica
    self.restore_node(backup_dir, 'master', replica)
    self.set_replica(master, replica, synchronous=True)

    self.add_instance(backup_dir, 'replica', replica)
    self.set_archiving(backup_dir, 'replica', replica, replica=True)
    replica.slow_start(replica=True)

    # Check data correctness on replica
    after = replica.safe_psql("postgres", "SELECT * FROM t_heap")
    self.assertEqual(before, after)

    # Change data on master, take FULL backup from replica,
    # restore taken backup and check that restored data equal
    # to original data
    # The statement used to read "insert into t_heap as select ...",
    # which is a syntax error, so no rows were ever added here.
    master.psql(
        "postgres",
        "insert into t_heap select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(256,512) i")
    before = master.safe_psql("postgres", "SELECT * FROM t_heap")

    # The new rows must reach the replica before it is backed up,
    # same as before the PAGE backup below.
    self.wait_until_replica_catch_with_master(master, replica)

    backup_id = self.backup_node(
        backup_dir, 'replica', replica,
        options=[
            '--archive-timeout=30',
            '--master-host=localhost',
            '--master-db=postgres',
            '--master-port={0}'.format(master.port),
            '--stream'])

    self.validate_pb(backup_dir, 'replica')
    self.assertEqual(
        'OK', self.show_pb(backup_dir, 'replica', backup_id)['status'])

    # RESTORE FULL BACKUP TAKEN FROM replica
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'))
    node.cleanup()
    self.restore_node(backup_dir, 'replica', data_dir=node.data_dir)

    self.set_auto_conf(node, {'port': node.port})
    node.slow_start()

    # CHECK DATA CORRECTNESS
    after = node.safe_psql("postgres", "SELECT * FROM t_heap")
    self.assertEqual(before, after)

    # Change data on master, make PAGE backup from replica,
    # restore taken backup and check that restored data equal
    # to original data
    # Same syntax fix as above ("insert into ... as select" is invalid).
    master.psql(
        "postgres",
        "insert into t_heap select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(512,80680) i")

    before = master.safe_psql("postgres", "SELECT * FROM t_heap")

    master.safe_psql(
        "postgres",
        "CHECKPOINT")

    self.wait_until_replica_catch_with_master(master, replica)

    backup_id = self.backup_node(
        backup_dir, 'replica',
        replica, backup_type='page',
        options=[
            '--archive-timeout=60',
            '--master-db=postgres',
            '--master-host=localhost',
            '--master-port={0}'.format(master.port),
            '--stream'])

    self.validate_pb(backup_dir, 'replica')
    self.assertEqual(
        'OK', self.show_pb(backup_dir, 'replica', backup_id)['status'])

    # RESTORE PAGE BACKUP TAKEN FROM replica
    node.cleanup()
    self.restore_node(
        backup_dir, 'replica', data_dir=node.data_dir, backup_id=backup_id)

    self.set_auto_conf(node, {'port': node.port})
    node.slow_start()

    # CHECK DATA CORRECTNESS
    after = node.safe_psql("postgres", "SELECT * FROM t_heap")
    self.assertEqual(before, after)

    # Clean after yourself
    self.del_test_dir(module_name, fname)
2017-10-09 15:32:48 +03:00
# @unittest.expectedFailure
# @unittest.skip("skip")
def test_master_and_replica_parallel_archiving(self):
    """
    make node 'master 'with archiving,
    take archive backup and turn it into replica,
    set replica with archiving, make archive backup from replica,
    make archive backup from master
    """
    test_name = self.id().split('.')[3]
    catalog = os.path.join(self.tmp_path, module_name, test_name, 'backup')

    master = self.make_simple_node(
        base_dir=os.path.join(module_name, test_name, 'master'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={'archive_timeout': '10s'})

    replica = self.make_simple_node(
        base_dir=os.path.join(module_name, test_name, 'replica'))
    replica.cleanup()

    self.init_pb(catalog)
    # ADD INSTANCE 'MASTER'
    self.add_instance(catalog, 'master', master)
    self.set_archiving(catalog, 'master', master)
    master.slow_start()

    master.psql(
        "postgres",
        "create table t_heap as select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,10000) i")

    # TAKE FULL ARCHIVE BACKUP FROM MASTER
    self.backup_node(catalog, 'master', master)

    # GET LOGICAL CONTENT FROM MASTER
    master_rows = master.safe_psql("postgres", "SELECT * FROM t_heap")
    # GET PHYSICAL CONTENT FROM MASTER
    master_files = self.pgdata_content(master.data_dir)

    # Settings for Replica
    self.restore_node(catalog, 'master', replica)

    # CHECK PHYSICAL CORRECTNESS on REPLICA
    replica_files = self.pgdata_content(replica.data_dir)
    self.compare_pgdata(master_files, replica_files)

    self.set_replica(master, replica)
    # ADD INSTANCE REPLICA
    self.add_instance(catalog, 'replica', replica)
    # SET ARCHIVING FOR REPLICA
    self.set_archiving(catalog, 'replica', replica, replica=True)
    replica.slow_start(replica=True)

    # CHECK LOGICAL CORRECTNESS on REPLICA
    replica_rows = replica.safe_psql("postgres", "SELECT * FROM t_heap")
    self.assertEqual(master_rows, replica_rows)

    master.psql(
        "postgres",
        "insert into t_heap select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0, 60000) i")

    master.psql(
        "postgres",
        "CHECKPOINT")

    # TAKE FULL BACKUP FROM REPLICA
    replica_backup_options = [
        '--archive-timeout=30',
        '--master-host=localhost',
        '--master-db=postgres',
        '--master-port={0}'.format(master.port),
        '--stream']
    backup_id = self.backup_node(
        catalog, 'replica', replica,
        options=replica_backup_options)

    self.validate_pb(catalog, 'replica')
    replica_status = self.show_pb(catalog, 'replica', backup_id)['status']
    self.assertEqual('OK', replica_status)

    # TAKE FULL ARCHIVE BACKUP FROM MASTER
    backup_id = self.backup_node(catalog, 'master', master)
    self.validate_pb(catalog, 'master')
    master_status = self.show_pb(catalog, 'master', backup_id)['status']
    self.assertEqual('OK', master_status)

    # Clean after yourself
    self.del_test_dir(module_name, test_name)
2017-12-13 11:15:42 +03:00
# @unittest.expectedFailure
# @unittest.skip("skip")
2019-05-28 12:41:03 +03:00
def test_basic_master_and_replica_concurrent_archiving(self):
    """
    Take archive backups from a master and from its synchronous replica.

    Scenario:
        1. create node 'master' with archiving and take a FULL archive
           backup of it;
        2. restore that backup as 'replica' and attach it to the master
           as a synchronous standby;
        3. load more data on the master, then take an archive backup from
           the replica (stored under the 'master' instance) and one more
           from the master itself;
        4. both backups must validate and be shown with status 'OK'.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    master = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'master'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={
            'checkpoint_timeout': '30s',
            'archive_timeout': '10s'}
        )
    replica = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'replica'))
    replica.cleanup()

    self.init_pb(backup_dir)
    # ADD INSTANCE 'MASTER'
    self.add_instance(backup_dir, 'master', master)
    self.set_archiving(backup_dir, 'master', master)
    master.slow_start()

    master.psql(
        "postgres",
        "create table t_heap as select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,10000) i")

    # TAKE FULL ARCHIVE BACKUP FROM MASTER
    self.backup_node(backup_dir, 'master', master)
    # GET LOGICAL CONTENT FROM MASTER
    before = master.safe_psql("postgres", "SELECT * FROM t_heap")
    # GET PHYSICAL CONTENT FROM MASTER
    pgdata_master = self.pgdata_content(master.data_dir)

    # Settings for Replica
    self.restore_node(
        backup_dir, 'master', replica)
    # CHECK PHYSICAL CORRECTNESS on REPLICA
    pgdata_replica = self.pgdata_content(replica.data_dir)
    self.compare_pgdata(pgdata_master, pgdata_replica)

    self.set_replica(master, replica, synchronous=True)
    # NOTE(review): registering a separate 'replica' instance and enabling
    # archiving on the replica are disabled below; presumably on purpose,
    # since the replica is backed up into the 'master' instance - confirm.
    # ADD INSTANCE REPLICA
    # self.add_instance(backup_dir, 'replica', replica)
    # SET ARCHIVING FOR REPLICA
    # self.set_archiving(backup_dir, 'replica', replica, replica=True)
    replica.slow_start(replica=True)

    # CHECK LOGICAL CORRECTNESS on REPLICA
    after = replica.safe_psql("postgres", "SELECT * FROM t_heap")
    self.assertEqual(before, after)

    # The statement used to read "insert into t_heap as select ...", which
    # is a syntax error (AS expects an alias, and "select" is reserved),
    # so no data was actually loaded here.
    master.psql(
        "postgres",
        "insert into t_heap select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,10000) i")

    # TAKE FULL ARCHIVE BACKUP FROM REPLICA
    backup_id = self.backup_node(
        backup_dir, 'master', replica,
        options=[
            '--archive-timeout=30',
            '--master-host=localhost',
            '--master-db=postgres',
            '--master-port={0}'.format(master.port)])
    self.validate_pb(backup_dir, 'master')
    self.assertEqual(
        'OK', self.show_pb(backup_dir, 'master', backup_id)['status'])

    # TAKE FULL ARCHIVE BACKUP FROM MASTER
    backup_id = self.backup_node(backup_dir, 'master', master)
    self.validate_pb(backup_dir, 'master')
    self.assertEqual(
        'OK', self.show_pb(backup_dir, 'master', backup_id)['status'])

    # Clean after yourself
    self.del_test_dir(module_name, fname)
2017-12-14 00:29:39 +03:00
# @unittest.expectedFailure
# @unittest.skip("skip")
2017-12-14 00:29:39 +03:00
def test_archive_pg_receivexlog(self):
    """
    Test backup with pg_receivexlog WAL delivery method.

    WAL is streamed into the instance WAL directory of the backup catalog
    by a background pg_receivexlog / pg_receivewal process instead of
    archive_command. A FULL and a PAGE backup are taken, validated,
    restored, and the restored table content is compared with the original.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={
            'checkpoint_timeout': '30s'})

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    node.slow_start()

    # the receiver binary is called pg_receivewal starting with version 10
    if self.get_version(node) < 100000:
        pg_receivexlog_path = self.get_bin_path('pg_receivexlog')
    else:
        pg_receivexlog_path = self.get_bin_path('pg_receivewal')

    pg_receivexlog = self.run_binary(
        [
            pg_receivexlog_path, '-p', str(node.port), '--synchronous',
            '-D', os.path.join(backup_dir, 'wal', 'node')
        ], asynchronous=True)

    # NOTE(review): assumes run_binary(asynchronous=True) returns a
    # subprocess.Popen-like object. Its returncode stays None until the
    # process is polled, so poll() is required for this check to ever fire.
    if pg_receivexlog.poll():
        self.fail(
            'Failed to start pg_receivexlog: {0}'.format(
                pg_receivexlog.communicate()[1]))

    # Make sure the background receiver never outlives the test,
    # even when one of the steps below fails.
    try:
        node.safe_psql(
            "postgres",
            "create table t_heap as select i as id, md5(i::text) as text, "
            "md5(repeat(i::text,10))::tsvector as tsvector "
            "from generate_series(0,10000) i")

        self.backup_node(backup_dir, 'node', node)

        # PAGE
        node.safe_psql(
            "postgres",
            "insert into t_heap select i as id, md5(i::text) as text, "
            "md5(repeat(i::text,10))::tsvector as tsvector "
            "from generate_series(10000,20000) i")

        self.backup_node(
            backup_dir,
            'node',
            node,
            backup_type='page'
        )
        result = node.safe_psql("postgres", "SELECT * FROM t_heap")
        self.validate_pb(backup_dir)

        # Check data correctness
        node.cleanup()
        self.restore_node(backup_dir, 'node', node)
        node.slow_start()

        self.assertEqual(
            result,
            node.safe_psql(
                "postgres", "SELECT * FROM t_heap"
            ),
            'data after restore not equal to original data')
    finally:
        pg_receivexlog.kill()

    # Clean after yourself
    self.del_test_dir(module_name, fname)
2017-12-14 00:29:39 +03:00
# @unittest.expectedFailure
# @unittest.skip("skip")
def test_archive_pg_receivexlog_compression_pg10(self):
    """
    Test backup with pg_receivewal compressed WAL delivery method.

    Same flow as the uncompressed receiver test, but pg_receivewal is
    started with '-Z 9'. The test is skipped on PostgreSQL older than 10.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={
            'checkpoint_timeout': '30s'}
        )
    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    node.slow_start()

    if self.get_version(node) < self.version_to_num('10.0'):
        # "return unittest.skip(...)" only builds a decorator and makes the
        # test look passed; skipTest() reports it as skipped.
        self.skipTest('You need PostgreSQL >= 10 for this test')

    pg_receivexlog_path = self.get_bin_path('pg_receivewal')

    pg_receivexlog = self.run_binary(
        [
            pg_receivexlog_path, '-p', str(node.port), '--synchronous',
            '-Z', '9', '-D', os.path.join(backup_dir, 'wal', 'node')
        ], asynchronous=True)

    # NOTE(review): assumes run_binary(asynchronous=True) returns a
    # subprocess.Popen-like object. Its returncode stays None until the
    # process is polled, so poll() is required for this check to ever fire.
    if pg_receivexlog.poll():
        self.fail(
            'Failed to start pg_receivexlog: {0}'.format(
                pg_receivexlog.communicate()[1]))

    # Make sure the background receiver never outlives the test,
    # even when one of the steps below fails.
    try:
        node.safe_psql(
            "postgres",
            "create table t_heap as select i as id, md5(i::text) as text, "
            "md5(repeat(i::text,10))::tsvector as tsvector "
            "from generate_series(0,10000) i")

        self.backup_node(backup_dir, 'node', node)

        # PAGE
        node.safe_psql(
            "postgres",
            "insert into t_heap select i as id, md5(i::text) as text, "
            "md5(repeat(i::text,10))::tsvector as tsvector "
            "from generate_series(10000,20000) i")

        self.backup_node(
            backup_dir, 'node', node,
            backup_type='page'
            )
        result = node.safe_psql("postgres", "SELECT * FROM t_heap")
        self.validate_pb(backup_dir)

        # Check data correctness
        node.cleanup()
        self.restore_node(backup_dir, 'node', node)
        node.slow_start()

        self.assertEqual(
            result, node.safe_psql("postgres", "SELECT * FROM t_heap"),
            'data after restore not equal to original data')
    finally:
        pg_receivexlog.kill()

    # Clean after yourself
    self.del_test_dir(module_name, fname)
2019-09-17 17:35:27 +03:00
# @unittest.expectedFailure
# @unittest.skip("skip")
def test_archive_catalog(self):
    """
    Check 'show --archive' output for an archive with several timelines.

    ARCHIVE replica (alignment is approximate):

    t6                     |-----------------------
    t5                     |                   |-------
                           |                   |
    t4                     |             |--------------
                           |             |
    t3                     |     |--B1--|/|--B2-|/|-B3---
                           |     |
    t2                  |--A1--------A2---
    t1  ---------Y1--Y2--

    ARCHIVE master:
    t1  -Z1--Z2---

    Timelines are produced by promoting the replica (t2) and by repeated
    point-in-time restores of the 'replica' instance (t3..t6). After that
    three WAL segments of t3 are removed and the test checks per-timeline
    status, lost segments, backup count, closest backup and parent
    timeline.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    master = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'master'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options={
            'archive_timeout': '30s',
            'checkpoint_timeout': '30s',
            'autovacuum': 'off'})

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'master', master)
    self.set_archiving(backup_dir, 'master', master)
    master.slow_start()

    # FULL
    master.safe_psql(
        "postgres",
        "create table t_heap as select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(0,10000) i")
    self.backup_node(backup_dir, 'master', master)

    # PAGE
    master.safe_psql(
        "postgres",
        "insert into t_heap select i as id, md5(i::text) as text, "
        "md5(repeat(i::text,10))::tsvector as tsvector "
        "from generate_series(10000,20000) i")
    self.backup_node(
        backup_dir, 'master', master, backup_type='page')

    replica = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'replica'))
    replica.cleanup()
    self.restore_node(backup_dir, 'master', replica)
    self.set_replica(master, replica)

    self.add_instance(backup_dir, 'replica', replica)
    self.set_archiving(backup_dir, 'replica', replica, replica=True)

    # start the replica archive from a copy of the master's WAL archive
    copy_tree(
        os.path.join(backup_dir, 'wal', 'master'),
        os.path.join(backup_dir, 'wal', 'replica'))

    # Check data correctness on replica
    replica.slow_start(replica=True)

    def insert_marker_row():
        """Insert one row into t1 on the replica and return its xmin."""
        with replica.connect("postgres") as con:
            res = con.execute(
                "INSERT INTO t1 VALUES ('inserted') RETURNING (xmin)")
            con.commit()
            return res[0][0]

    # Y1: FULL backup replica
    self.backup_node(
        backup_dir, 'replica', replica,
        options=['--stream', '--archive-timeout=60s'])

    master.pgbench_init(scale=5)

    # Y2: PAGE backup replica
    Y2 = self.backup_node(
        backup_dir, 'replica', replica,
        backup_type='page', options=['--stream', '--archive-timeout=60s'])

    # create timeline t2
    replica.promote()

    # do checkpoint to increment timeline ID in pg_control
    replica.safe_psql(
        'postgres',
        'CHECKPOINT')

    # A1: FULL backup replica
    A1 = self.backup_node(
        backup_dir, 'replica', replica)

    replica.pgbench_init(scale=5)

    replica.safe_psql(
        'postgres',
        "CREATE TABLE t1 (a text)")

    target_xid = insert_marker_row()

    # A2: DELTA backup replica
    self.backup_node(
        backup_dir, 'replica', replica, backup_type='delta')

    # create timeline t3
    replica.cleanup()
    self.restore_node(
        backup_dir, 'replica', replica,
        options=[
            '--recovery-target-xid={0}'.format(target_xid),
            '--recovery-target-timeline=2',
            '--recovery-target-action=promote'])
    replica.slow_start()

    # B1: FULL backup
    self.backup_node(
        backup_dir, 'replica', replica)

    replica.pgbench_init(scale=2)

    # B2: PAGE backup
    B2 = self.backup_node(
        backup_dir, 'replica', replica, backup_type='page')

    replica.pgbench_init(scale=2)

    target_xid = insert_marker_row()

    # B3: PAGE backup
    self.backup_node(
        backup_dir, 'replica', replica, backup_type='page')

    replica.pgbench_init(scale=2)

    # create timeline t4
    replica.cleanup()
    self.restore_node(
        backup_dir, 'replica', replica,
        options=[
            '--recovery-target-xid={0}'.format(target_xid),
            '--recovery-target-timeline=3',
            '--recovery-target-action=promote'])
    replica.slow_start()

    replica.safe_psql(
        'postgres',
        'CREATE TABLE '
        't2 as select i, '
        'repeat(md5(i::text),5006056) as fat_attr '
        'from generate_series(0,6) i')

    target_xid = insert_marker_row()

    replica.safe_psql(
        'postgres',
        'CREATE TABLE '
        't3 as select i, '
        'repeat(md5(i::text),5006056) as fat_attr '
        'from generate_series(0,10) i')

    # create timeline t5
    replica.cleanup()
    self.restore_node(
        backup_dir, 'replica', replica,
        options=[
            '--recovery-target-xid={0}'.format(target_xid),
            '--recovery-target-timeline=4',
            '--recovery-target-action=promote'])
    replica.slow_start()

    replica.safe_psql(
        'postgres',
        'CREATE TABLE '
        't4 as select i, '
        'repeat(md5(i::text),5006056) as fat_attr '
        'from generate_series(0,6) i')

    # create timeline t6
    replica.cleanup()
    self.restore_node(
        backup_dir, 'replica', replica, backup_id=A1,
        options=[
            '--recovery-target=immediate',
            '--recovery-target-action=promote'])
    replica.slow_start()

    replica.pgbench_init(scale=2)

    # run the text variant as well; only its successful completion matters
    self.show_archive(backup_dir, as_text=True)
    show = self.show_archive(backup_dir)

    for instance in show:
        if instance['instance'] == 'replica':
            replica_timelines = instance['timelines']

        if instance['instance'] == 'master':
            master_timelines = instance['timelines']

    # check that all timelines are ok
    # (assertTrue(status, 'OK') would treat 'OK' as the failure message
    # and never compare anything)
    for timeline in replica_timelines:
        self.assertEqual(timeline['status'], 'OK')

    # check that all timelines are ok
    for timeline in master_timelines:
        self.assertEqual(timeline['status'], 'OK')

    # check that t3 is ok
    self.show_archive(backup_dir)

    # create holes in t3
    wals_dir = os.path.join(backup_dir, 'wal', 'replica')
    for segment in (
            '000000030000000000000017',
            '000000030000000000000012',
            '000000030000000000000013'):
        segment_path = os.path.join(wals_dir, segment)
        if self.archive_compress:
            segment_path = segment_path + '.gz'
        os.remove(segment_path)

    # check that t3 is not OK
    show = self.show_archive(backup_dir)

    for instance in show:
        if instance['instance'] == 'replica':
            replica_timelines = instance['timelines']

    # sanity: index timelines by their id, a missing one raises KeyError
    timelines = {
        timeline['tli']: timeline for timeline in replica_timelines}

    for tli, status in (
            (6, "OK"), (5, "OK"), (4, "OK"),
            (3, "DEGRADED"), (2, "OK"), (1, "OK")):
        self.assertEqual(timelines[tli]['status'], status)

    # segments 12-13 and 17 were removed above
    lost_segments = timelines[3]['lost-segments']
    self.assertEqual(len(lost_segments), 2)
    self.assertEqual(lost_segments[0]['begin-segno'], '0000000000000012')
    self.assertEqual(lost_segments[0]['end-segno'], '0000000000000013')
    self.assertEqual(lost_segments[1]['begin-segno'], '0000000000000017')
    self.assertEqual(lost_segments[1]['end-segno'], '0000000000000017')

    for tli, backup_count in (
            (6, 0), (5, 0), (4, 0), (3, 3), (2, 2), (1, 2)):
        self.assertEqual(len(timelines[tli]['backups']), backup_count)

    # check closest backup correctness
    for tli, backup_id in (
            (6, A1), (5, B2), (4, B2), (3, A1), (2, Y2)):
        self.assertEqual(timelines[tli]['closest-backup-id'], backup_id)

    # check parent tli correctness
    for tli, parent_tli in (
            (6, 2), (5, 4), (4, 3), (3, 2), (2, 1), (1, 0)):
        self.assertEqual(timelines[tli]['parent-tli'], parent_tli)

    self.del_test_dir(module_name, fname)
# @unittest.expectedFailure
# @unittest.skip("skip")
def test_archive_catalog_1(self):
    """
    Double segment: the same archive holds compressed and plain files.

    The first compressed WAL segment is unpacked and the unpacked copy is
    stored under the name of the second segment. 'show --archive' must
    still report segment 1 as the minimal one and status 'OK'.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')

    node_options = {
        'archive_timeout': '30s',
        'checkpoint_timeout': '30s',
        'autovacuum': 'off'}
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options=node_options)

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node, compress=True)

    node.slow_start()

    # FULL
    self.backup_node(backup_dir, 'node', node)
    node.pgbench_init(scale=2)

    wals_dir = os.path.join(backup_dir, 'wal', 'node')
    original_file = os.path.join(wals_dir, '000000010000000000000001.gz')
    tmp_file = os.path.join(wals_dir, '000000010000000000000001')
    renamed_file = os.path.join(wals_dir, '000000010000000000000002')

    # unpack segment 1 next to its compressed original ...
    with gzip.open(original_file, 'rb') as packed:
        with open(tmp_file, 'wb') as unpacked:
            shutil.copyfileobj(packed, unpacked)

    # ... and give the plain copy the name of segment 2
    os.rename(tmp_file, renamed_file)

    # keep the timelines of the last listed instance
    for entry in self.show_archive(backup_dir):
        timelines = entry['timelines']

    # sanity
    for tl in timelines:
        self.assertEqual(tl['min-segno'], '0000000000000001')
        self.assertEqual(tl['status'], 'OK')

    self.del_test_dir(module_name, fname)
# @unittest.expectedFailure
# @unittest.skip("skip")
def test_archive_catalog_2(self):
    """
    Double segment with the first compressed segment removed.

    The first compressed WAL segment is unpacked, the unpacked copy is
    stored under the name of the second segment and the compressed
    original is deleted. 'show --archive' must report segment 2 as the
    minimal one and status 'OK'.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')

    node_options = {
        'archive_timeout': '30s',
        'checkpoint_timeout': '30s',
        'autovacuum': 'off'}
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'],
        pg_options=node_options)

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node, compress=True)

    node.slow_start()

    # FULL
    self.backup_node(backup_dir, 'node', node)
    node.pgbench_init(scale=2)

    wals_dir = os.path.join(backup_dir, 'wal', 'node')
    original_file = os.path.join(wals_dir, '000000010000000000000001.gz')
    tmp_file = os.path.join(wals_dir, '000000010000000000000001')
    renamed_file = os.path.join(wals_dir, '000000010000000000000002')

    # unpack segment 1 next to its compressed original ...
    with gzip.open(original_file, 'rb') as packed:
        with open(tmp_file, 'wb') as unpacked:
            shutil.copyfileobj(packed, unpacked)

    # ... give the plain copy the name of segment 2 ...
    os.rename(tmp_file, renamed_file)

    # ... and drop the compressed segment 1 altogether
    os.remove(original_file)

    # keep the timelines of the last listed instance
    for entry in self.show_archive(backup_dir):
        timelines = entry['timelines']

    # sanity
    for tl in timelines:
        self.assertEqual(tl['min-segno'], '0000000000000002')
        self.assertEqual(tl['status'], 'OK')

    self.del_test_dir(module_name, fname)
# @unittest.expectedFailure
# @unittest.skip("skip")
def test_archive_options(self):
    """
    Check that '--archive-host', '--archive-user', '--archive-port'
    and '--restore-command' passed to restore end up in recovery.conf.

    With an explicit '--restore-command' the command is written as given;
    without it an 'archive-get' command carrying the remote host, port
    and user is expected.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'])

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node, compress=True)

    node.slow_start()

    # FULL
    self.backup_node(backup_dir, 'node', node)
    node.pgbench_init(scale=1)

    node.cleanup()

    wal_dir = os.path.join(backup_dir, 'wal', 'node')
    remote_options = [
        '--archive-host=localhost',
        '--archive-port=22',
        '--archive-user={0}'.format(self.user)]

    # explicit restore command: it must be written to recovery.conf as is
    custom_command = '--restore-command="cp {0}/%f %p"'.format(wal_dir)
    self.restore_node(
        backup_dir, 'node', node,
        options=[custom_command] + remote_options)

    recovery_conf = os.path.join(node.data_dir, 'recovery.conf')
    with open(recovery_conf, 'r') as conf:
        recovery_content = conf.read()

    expected_line = 'restore_command = \'"cp {0}/%f %p"\''.format(wal_dir)
    self.assertIn(expected_line, recovery_content)

    node.cleanup()

    # no restore command: archive-get with the remote options is expected
    self.restore_node(
        backup_dir, 'node', node,
        options=list(remote_options))

    with open(recovery_conf, 'r') as conf:
        recovery_content = conf.read()

    expected_line = (
        "restore_command = '{0} archive-get -B {1} --instance {2} "
        "--wal-file-path=%p --wal-file-name=%f --remote-host=localhost "
        "--remote-port=22 --remote-user={3}'".format(
            self.probackup_path, backup_dir, 'node', self.user))
    self.assertIn(expected_line, recovery_content)

    # the node must come up with the generated recovery.conf
    node.slow_start()

    node.safe_psql(
        'postgres',
        'select 1')

    self.del_test_dir(module_name, fname)
# @unittest.expectedFailure
# @unittest.skip("skip")
def test_archive_options_1(self):
    """
    Check that '--archive-host', '--archive-user', '--archive-port'
    and '--restore-command' are working as expected with set-config.

    First the options are stored with set-config and a plain restore must
    write the stored restore command to recovery.conf. Then restore is run
    with '--restore-command=none' and different remote options, and an
    'archive-get' command carrying those remote options is expected.
    """
    fname = self.id().split('.')[3]
    backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
    node = self.make_simple_node(
        base_dir=os.path.join(module_name, fname, 'node'),
        set_replication=True,
        initdb_params=['--data-checksums'])

    self.init_pb(backup_dir)
    self.add_instance(backup_dir, 'node', node)
    self.set_archiving(backup_dir, 'node', node, compress=True)

    node.slow_start()

    # FULL
    self.backup_node(backup_dir, 'node', node)
    node.pgbench_init(scale=1)

    node.cleanup()

    wal_dir = os.path.join(backup_dir, 'wal', 'node')
    self.set_config(
        backup_dir, 'node',
        options=[
            '--restore-command="cp {0}/%f %p"'.format(wal_dir),
            '--archive-host=localhost',
            '--archive-port=22',
            '--archive-user={0}'.format(self.user)])
    self.restore_node(backup_dir, 'node', node)

    recovery_conf = os.path.join(node.data_dir, 'recovery.conf')
    with open(recovery_conf, 'r') as f:
        recovery_content = f.read()

    self.assertIn(
        'restore_command = \'"cp {0}/%f %p"\''.format(wal_dir),
        recovery_content)

    node.cleanup()

    self.restore_node(
        backup_dir, 'node', node,
        options=[
            # plain literal: there is no placeholder to format here
            '--restore-command=none',
            '--archive-host=localhost1',
            '--archive-port=23',
            '--archive-user={0}'.format(self.user)
            ])

    with open(recovery_conf, 'r') as f:
        recovery_content = f.read()

    self.assertIn(
        "restore_command = '{0} archive-get -B {1} --instance {2} "
        "--wal-file-path=%p --wal-file-name=%f --remote-host=localhost1 "
        "--remote-port=23 --remote-user={3}'".format(
            self.probackup_path, backup_dir, 'node', self.user),
        recovery_content)

    self.del_test_dir(module_name, fname)
2019-09-17 17:35:27 +03:00
# Important: the switchpoint may be a NullOffset LSN and, on top of that, may
# not actually exist in the archive, so write validation code accordingly.
# change wal-seg-size
#
#
#t3 ----------------
# /
#t2 ----------------
# /
#t1 -A--------
#
#
#t3 ----------------
# /
#t2 ----------------
# /
#t1 -A--------
#