1
0
mirror of https://github.com/postgrespro/pg_probackup.git synced 2025-01-09 14:45:47 +02:00
pg_probackup/tests/ptrack_clean.py

192 lines
9.5 KiB
Python
Raw Normal View History

2017-06-20 12:57:23 +02:00
import os
2017-06-27 07:42:52 +02:00
import unittest
from .helpers.ptrack_helpers import ProbackupTest, idx_ptrack
2017-05-03 13:14:48 +02:00
2017-07-12 16:28:28 +02:00
# Name of this test module; the tests below use it as a path component for
# their node and backup directories and pass it to del_test_dir() on cleanup.
module_name = 'ptrack_clean'
2017-05-03 13:14:48 +02:00
class SimpleTest(ProbackupTest, unittest.TestCase):
    """Check that ptrack bits are clean after FULL, PTRACK and PAGE backups.

    Both tests create ``t_heap`` plus one index per non-heap, non-sequence
    entry of ``idx_ptrack``, take a backup of each type, and after every
    backup verify via ``check_ptrack_clean`` that no ptrack bit is left set.
    """

    def _assert_all_forks_ptrack_clean(self, node):
        """Refresh size, path and ptrack bits of every relation and check them.

        For each entry of the module-level ``idx_ptrack`` mapping the current
        fork size and fork path are read from ``node``, the per-page ptrack
        bits are fetched, and ``check_ptrack_clean`` is called on the entry.

        The values are written back into ``idx_ptrack`` itself (keys
        ``'size'``, ``'path'`` and ``'ptrack'``) because the very same entry
        is what gets handed to ``check_ptrack_clean``.

        :param node: the node whose relation forks are inspected.
        """
        for name in idx_ptrack:
            fork = idx_ptrack[name]
            # Size of the fork, calculated in pages.
            fork['size'] = self.get_fork_size(node, name)
            # Path to the heap/index file; re-read every time in case it
            # has changed since the previous check.
            fork['path'] = self.get_fork_path(node, name)
            fork['ptrack'] = self.get_ptrack_bits_per_page_for_fork(
                node, fork['path'], [fork['size']])
            self.check_ptrack_clean(fork, fork['size'])

    def _update_and_vacuum_heap(self, node):
        """Rewrite every row of ``t_heap`` on ``node`` and vacuum the table.

        :param node: the node on which the UPDATE and VACUUM are executed.
        """
        node.safe_psql(
            'postgres',
            "update t_heap set t_seq = nextval('t_seq'), "
            "text = md5(text), "
            "tsvector = md5(repeat(tsvector::text, 10))::tsvector;")
        node.safe_psql('postgres', 'vacuum t_heap')

    # @unittest.skip("skip")
    # @unittest.expectedFailure
    def test_ptrack_clean(self):
        """Take backups of every available type and check that PTRACK is clean."""
        fname = self.id().split('.')[3]
        node = self.make_simple_node(
            base_dir="{0}/{1}/node".format(module_name, fname),
            set_replication=True,
            initdb_params=['--data-checksums'],
            pg_options={
                'ptrack_enable': 'on',
                'wal_level': 'replica',
                'max_wal_senders': '2'})
        backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
        self.init_pb(backup_dir)
        self.add_instance(backup_dir, 'node', node)
        self.set_archiving(backup_dir, 'node', node)
        node.start()

        self.create_tblspace_in_node(node, 'somedata')

        # Create table and indexes, all placed in the 'somedata' tablespace.
        node.safe_psql(
            "postgres",
            "create sequence t_seq; "
            "create table t_heap tablespace somedata as select i as id, "
            "nextval('t_seq') as t_seq, md5(i::text) as text, "
            "md5(repeat(i::text,10))::tsvector as tsvector "
            "from generate_series(0,256) i")
        for name in idx_ptrack:
            relation = idx_ptrack[name]
            # The heap and the sequence already exist; only indexes remain.
            if relation['type'] not in ('heap', 'seq'):
                node.safe_psql(
                    "postgres",
                    "create index {0} on {1} using {2}({3}) "
                    "tablespace somedata".format(
                        name, relation['relation'],
                        relation['type'], relation['column']))

        # Take FULL backup to clean every ptrack.
        self.backup_node(
            backup_dir, 'node', node, options=['-j10', '--stream'])
        node.safe_psql('postgres', 'checkpoint')
        self._assert_all_forks_ptrack_clean(node)

        # Update everything and vacuum it.
        self._update_and_vacuum_heap(node)

        # Take PTRACK backup to clean every ptrack.
        self.backup_node(
            backup_dir, 'node', node, backup_type='ptrack',
            options=['-j100', '--log-level-file=verbose'])
        node.safe_psql('postgres', 'checkpoint')
        self._assert_all_forks_ptrack_clean(node)

        # Update everything and vacuum it.
        self._update_and_vacuum_heap(node)

        # Take PAGE backup, then verify that every ptrack bit is clean.
        self.backup_node(
            backup_dir, 'node', node, backup_type='page', options=['-j100'])
        node.safe_psql('postgres', 'checkpoint')
        self._assert_all_forks_ptrack_clean(node)

        # Clean after yourself
        self.del_test_dir(module_name, fname)

    # @unittest.skip("skip")
    # @unittest.expectedFailure
    def test_ptrack_clean_replica(self):
        """Take backups of every available type from replica and check that PTRACK on replica is clean.

        Data is created and modified on master; every checked backup is taken
        from the 'replica' instance, and the ptrack bits are read from the
        replica node.
        """
        fname = self.id().split('.')[3]
        master = self.make_simple_node(
            base_dir="{0}/{1}/master".format(module_name, fname),
            set_replication=True,
            initdb_params=['--data-checksums'],
            pg_options={
                'ptrack_enable': 'on',
                'wal_level': 'replica',
                'max_wal_senders': '2'})
        backup_dir = os.path.join(self.tmp_path, module_name, fname, 'backup')
        self.init_pb(backup_dir)
        self.add_instance(backup_dir, 'master', master)
        master.start()

        # Build the replica from a streamed backup of master.
        self.backup_node(backup_dir, 'master', master, options=['--stream'])
        replica = self.make_simple_node(
            base_dir="{0}/{1}/replica".format(module_name, fname))
        replica.cleanup()
        self.restore_node(backup_dir, 'master', replica)

        self.add_instance(backup_dir, 'replica', replica)
        self.set_replica(master, replica)
        self.set_archiving(backup_dir, 'replica', replica, replica=True)
        replica.start()

        # Create table and indexes (on master).
        master.safe_psql(
            "postgres",
            "create sequence t_seq; "
            "create table t_heap as select i as id, "
            "nextval('t_seq') as t_seq, md5(i::text) as text, "
            "md5(repeat(i::text,10))::tsvector as tsvector "
            "from generate_series(0,256) i")
        for name in idx_ptrack:
            relation = idx_ptrack[name]
            # The heap and the sequence already exist; only indexes remain.
            if relation['type'] not in ('heap', 'seq'):
                master.safe_psql(
                    "postgres",
                    "create index {0} on {1} using {2}({3})".format(
                        name, relation['relation'],
                        relation['type'], relation['column']))

        # Connection options pointing the replica backups at master; shared
        # by the FULL, PTRACK and PAGE backups below.
        master_conn = [
            '--master-host=localhost',
            '--master-db=postgres',
            '--master-port={0}'.format(master.port)]

        # NOTE(review): checkpoints are issued on master while the forks are
        # inspected on the replica, and nothing visible here waits for the
        # replica to replay -- confirm this cannot race.

        # Take FULL backup to clean every ptrack.
        self.backup_node(
            backup_dir, 'replica', replica,
            options=['-j100', '--stream'] + master_conn)
        master.safe_psql('postgres', 'checkpoint')
        self._assert_all_forks_ptrack_clean(replica)

        # Update everything and vacuum it.
        self._update_and_vacuum_heap(master)

        # Take PTRACK backup to clean every ptrack.
        self.backup_node(
            backup_dir, 'replica', replica, backup_type='ptrack',
            options=['-j100', '--stream'] + master_conn)
        master.safe_psql('postgres', 'checkpoint')
        self._assert_all_forks_ptrack_clean(replica)

        # Update everything and vacuum it.
        self._update_and_vacuum_heap(master)
        master.safe_psql('postgres', 'checkpoint')

        # Take PAGE backup (not streamed), then verify that every ptrack bit
        # is clean.
        self.backup_node(
            backup_dir, 'replica', replica, backup_type='page',
            options=['-j100'] + master_conn)
        master.safe_psql('postgres', 'checkpoint')
        self._assert_all_forks_ptrack_clean(replica)

        # Clean after yourself
        self.del_test_dir(module_name, fname)