1
0
mirror of https://github.com/postgrespro/pg_probackup.git synced 2025-01-24 11:46:31 +02:00
pg_probackup/tests/ptrack_vacuum_full.py

202 lines
8.1 KiB
Python
Raw Normal View History

2017-06-20 13:57:23 +03:00
import os
2017-05-03 14:14:48 +03:00
import unittest
2017-06-27 08:42:52 +03:00
from .helpers.ptrack_helpers import ProbackupTest, idx_ptrack
2018-10-16 19:16:46 +03:00
import time
2017-05-03 14:14:48 +03:00
2017-07-12 17:28:28 +03:00
# Name of this test module; the tests combine it with the test name to build
# per-test node/backup directory paths and pass it to del_test_dir().
module_name = 'ptrack_vacuum_full'
2017-05-03 14:14:48 +03:00
class SimpleTest(ProbackupTest, unittest.TestCase):
    """Ptrack sanity tests around ``VACUUM FULL``.

    Each test creates ``t_heap`` together with the relations listed in
    ``idx_ptrack``, takes a backup, records per-page md5 sums of every
    fork, deletes all rows with an odd ``id``, runs ``vacuum full`` and
    finally lets ``check_ptrack_sanity`` compare the old/new pages against
    the ptrack bits.
    """

    def _create_idx_ptrack_indexes(self, node, tablespace=None):
        """Create an index for each ``idx_ptrack`` entry that is an index.

        Entries whose ``type`` is ``'heap'`` or ``'seq'`` are skipped.

        :param node: node on which the ``create index`` statements are run
        :param tablespace: optional tablespace name appended to every
            statement as ``tablespace <name>``
        """
        template = "create index {0} on {1} using {2}({3})"
        if tablespace is not None:
            template += " tablespace " + tablespace

        for name in idx_ptrack:
            rel = idx_ptrack[name]
            if rel['type'] in ('heap', 'seq'):
                continue
            node.safe_psql(
                "postgres",
                template.format(
                    name, rel['relation'], rel['type'], rel['column']))

    def _record_fork_state_before(self, node):
        """Store the pre-change size, path and page md5 sums in ``idx_ptrack``.

        :param node: node whose relation forks are inspected
        """
        for name in idx_ptrack:
            rel = idx_ptrack[name]
            # get size of heap and indexes. size calculated in pages
            rel['old_size'] = self.get_fork_size(node, name)
            # get path to heap and index files
            rel['path'] = self.get_fork_path(node, name)
            # calculate md5sums of pages
            rel['old_pages'] = self.get_md5_per_page_for_fork(
                rel['path'], rel['old_size'])

    def _all_forks_pass_ptrack_sanity(self, node):
        """Collect the post-change state and run the ptrack sanity check.

        Every relation in ``idx_ptrack`` is checked even after a failure,
        so a single run covers all of them.

        :param node: node whose relation forks and ptrack bits are inspected
        :return: ``True`` if ``check_ptrack_sanity`` passed for every
            relation, ``False`` otherwise
        """
        success = True
        for name in idx_ptrack:
            rel = idx_ptrack[name]
            # get new size of heap and indexes. size calculated in pages
            rel['new_size'] = self.get_fork_size(node, name)
            # update path to heap and index files in case they've changed
            rel['path'] = self.get_fork_path(node, name)
            # calculate new md5sums for pages
            rel['new_pages'] = self.get_md5_per_page_for_fork(
                rel['path'], rel['new_size'])
            # get ptrack for every idx
            rel['ptrack'] = self.get_ptrack_bits_per_page_for_fork(
                node, rel['path'],
                [rel['old_size'], rel['new_size']])

            # compare pages and check ptrack sanity, the most important part
            if not self.check_ptrack_sanity(rel):
                success = False
        return success

    # @unittest.skip("skip")
    # @unittest.expectedFailure
    def test_ptrack_vacuum_full(self):
        """Ptrack must register the changes ``vacuum full`` makes on a node."""
        fname = self.id().split('.')[3]
        node = self.make_simple_node(
            base_dir="{0}/{1}/node".format(module_name, fname),
            set_replication=True,
            initdb_params=['--data-checksums'],
            pg_options={
                'ptrack_enable': 'on',
                'wal_level': 'replica',
                'max_wal_senders': '2'})
        backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
        self.init_pb(backup_dir)
        self.add_instance(backup_dir, 'node', node)
        node.slow_start()

        self.create_tblspace_in_node(node, 'somedata')

        # Create table and indexes
        node.safe_psql(
            "postgres",
            "create extension bloom; create sequence t_seq; "
            "create table t_heap tablespace somedata "
            "as select i as id, md5(i::text) as text, "
            "md5(repeat(i::text,10))::tsvector as tsvector "
            "from generate_series(0,2560) i")
        self._create_idx_ptrack_indexes(node, tablespace='somedata')

        node.safe_psql('postgres', 'vacuum t_heap')
        node.safe_psql('postgres', 'checkpoint')

        self.backup_node(
            backup_dir, 'node', node, options=['-j10', '--stream'])

        self._record_fork_state_before(node)

        node.safe_psql('postgres', 'delete from t_heap where id%2 = 1')
        node.safe_psql('postgres', 'vacuum full t_heap')
        node.safe_psql('postgres', 'checkpoint')

        # CHECK PTRACK SANITY
        self.assertTrue(
            self._all_forks_pass_ptrack_sanity(node),
            'Ptrack has failed to register changes in data files'
        )

        # Clean after yourself
        self.del_test_dir(module_name, fname)

    # @unittest.skip("skip")
    # @unittest.expectedFailure
    def test_ptrack_vacuum_full_replica(self):
        """Ptrack on a replica must register ``vacuum full`` run on master.

        The replica is restored from a master backup and attached with
        ``synchronous=True``; all fork sizes, page sums and ptrack bits are
        read from the replica.
        """
        fname = self.id().split('.')[3]
        master = self.make_simple_node(
            base_dir="{0}/{1}/master".format(module_name, fname),
            set_replication=True,
            initdb_params=['--data-checksums'],
            pg_options={
                'ptrack_enable': 'on',
                'wal_level': 'replica',
                'max_wal_senders': '2',
                'autovacuum': 'off',
                'archive_timeout': '30s'}
        )
        backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
        self.init_pb(backup_dir)
        self.add_instance(backup_dir, 'master', master)
        master.slow_start()

        self.backup_node(backup_dir, 'master', master, options=['--stream'])

        replica = self.make_simple_node(
            base_dir="{0}/{1}/replica".format(module_name, fname))
        replica.cleanup()

        self.restore_node(backup_dir, 'master', replica)

        self.add_instance(backup_dir, 'replica', replica)
        self.set_replica(master, replica, 'replica', synchronous=True)
        self.set_archiving(backup_dir, 'replica', replica, replica=True)
        replica.slow_start(replica=True)

        # Create table and indexes
        master.safe_psql(
            "postgres",
            "create extension bloom; create sequence t_seq; "
            "create table t_heap as select i as id, "
            "md5(i::text) as text, md5(repeat(i::text,10))::tsvector as "
            "tsvector from generate_series(0,256000) i")
        self._create_idx_ptrack_indexes(master)

        master.safe_psql('postgres', 'vacuum t_heap')
        master.safe_psql('postgres', 'checkpoint')

        # Sync master and replica
        self.wait_until_replica_catch_with_master(master, replica)
        replica.safe_psql('postgres', 'checkpoint')

        # Take FULL backup to clean every ptrack
        self.backup_node(
            backup_dir, 'replica', replica,
            options=[
                '-j10',
                '--master-host=localhost',
                '--master-db=postgres',
                '--master-port={0}'.format(master.port),
                '--stream'
            ]
        )
        # TODO: check that all ptrack are nullified

        self._record_fork_state_before(replica)

        master.safe_psql('postgres', 'delete from t_heap where id%2 = 1')
        master.safe_psql('postgres', 'vacuum full t_heap')
        master.safe_psql('postgres', 'checkpoint')

        # Sync master and replica
        self.wait_until_replica_catch_with_master(master, replica)
        replica.safe_psql('postgres', 'checkpoint')

        # CHECK PTRACK SANITY
        self.assertTrue(
            self._all_forks_pass_ptrack_sanity(replica),
            'Ptrack has failed to register changes in data files'
        )

        # Clean after yourself
        self.del_test_dir(module_name, fname)