# you need os for unittest to work import os from sys import exit, argv, version_info import subprocess import shutil import six import testgres import hashlib import re import getpass import select from time import sleep import re import json idx_ptrack = { 't_heap': { 'type': 'heap' }, 't_btree': { 'type': 'btree', 'column': 'text', 'relation': 't_heap' }, 't_seq': { 'type': 'seq', 'column': 't_seq', 'relation': 't_heap' }, 't_spgist': { 'type': 'spgist', 'column': 'text', 'relation': 't_heap' }, 't_brin': { 'type': 'brin', 'column': 'text', 'relation': 't_heap' }, 't_gist': { 'type': 'gist', 'column': 'tsvector', 'relation': 't_heap' }, 't_gin': { 'type': 'gin', 'column': 'tsvector', 'relation': 't_heap' }, 't_hash': { 'type': 'hash', 'column': 'id', 'relation': 't_heap' }, 't_bloom': { 'type': 'bloom', 'column': 'id', 'relation': 't_heap' } } warning = """ Wrong splint in show_pb Original Header: {header} Original Body: {body} Splitted Header {header_split} Splitted Body {body_split} """ def dir_files(base_dir): out_list = [] for dir_name, subdir_list, file_list in os.walk(base_dir): if dir_name != base_dir: out_list.append(os.path.relpath(dir_name, base_dir)) for fname in file_list: out_list.append( os.path.relpath(os.path.join( dir_name, fname), base_dir) ) out_list.sort() return out_list def is_enterprise(): # pg_config --help if os.name == 'posix': cmd = [os.environ['PG_CONFIG'], '--help'] elif os.name == 'nt': cmd = [[os.environ['PG_CONFIG']], ['--help']] p = subprocess.Popen( cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE ) if b'postgrespro.ru' in p.communicate()[0]: return True else: return False class ProbackupException(Exception): def __init__(self, message, cmd): self.message = message self.cmd = cmd def __str__(self): return '\n ERROR: {0}\n CMD: {1}'.format(repr(self.message), self.cmd) def slow_start(self, replica=False): # wait for https://github.com/postgrespro/testgres/pull/50 # self.start() # self.poll_query_until( # "postgres", # "SELECT not pg_is_in_recovery()", # suppress={testgres.NodeConnection}) if replica: query = 'SELECT pg_is_in_recovery()' else: query = 'SELECT not pg_is_in_recovery()' self.start() while True: try: output = self.safe_psql('template1', query).decode("utf-8").rstrip() if output == 't': break except testgres.QueryException as e: if 'database system is starting up' in e.message: continue else: raise e class ProbackupTest(object): # Class attributes enterprise = is_enterprise() def __init__(self, *args, **kwargs): super(ProbackupTest, self).__init__(*args, **kwargs) if '-v' in argv or '--verbose' in argv: self.verbose = True else: self.verbose = False self.test_env = os.environ.copy() envs_list = [ 'LANGUAGE', 'LC_ALL', 'PGCONNECT_TIMEOUT', 'PGDATA', 'PGDATABASE', 'PGHOSTADDR', 'PGREQUIRESSL', 'PGSERVICE', 'PGSSLMODE', 'PGUSER', 'PGPORT', 'PGHOST' ] for e in envs_list: try: del self.test_env[e] except: pass self.test_env['LC_MESSAGES'] = 'C' self.test_env['LC_TIME'] = 'C' self.paranoia = False if 'PG_PROBACKUP_PARANOIA' in self.test_env: if self.test_env['PG_PROBACKUP_PARANOIA'] == 'ON': self.paranoia = True self.archive_compress = False if 'ARCHIVE_COMPRESSION' in self.test_env: if self.test_env['ARCHIVE_COMPRESSION'] == 'ON': self.archive_compress = True try: testgres.configure_testgres( cache_initdb=False, cached_initdb_dir=False, cache_pg_config=False, node_cleanup_full=False) except: pass self.helpers_path = os.path.dirname(os.path.realpath(__file__)) self.dir_path = os.path.abspath( os.path.join(self.helpers_path, os.pardir) ) self.tmp_path = os.path.abspath( os.path.join(self.dir_path, 'tmp_dirs') ) try: os.makedirs(os.path.join(self.dir_path, 'tmp_dirs')) except: pass self.user = self.get_username() self.probackup_path = None if 'PGPROBACKUPBIN' in self.test_env: if ( os.path.isfile(self.test_env["PGPROBACKUPBIN"]) and os.access(self.test_env["PGPROBACKUPBIN"], os.X_OK) ): self.probackup_path = self.test_env["PGPROBACKUPBIN"] else: if self.verbose: print('PGPROBACKUPBIN is not an executable file') if not self.probackup_path: probackup_path_tmp = os.path.join( testgres.get_pg_config()['BINDIR'], 'pg_probackup') if os.path.isfile(probackup_path_tmp): if not os.access(probackup_path_tmp, os.X_OK): print('{0} is not an executable file'.format( probackup_path_tmp)) else: self.probackup_path = probackup_path_tmp if not self.probackup_path: probackup_path_tmp = os.path.abspath(os.path.join( self.dir_path, '../pg_probackup')) if os.path.isfile(probackup_path_tmp): if not os.access(probackup_path_tmp, os.X_OK): print('{0} is not an executable file'.format( probackup_path_tmp)) else: self.probackup_path = probackup_path_tmp if not self.probackup_path: print('pg_probackup binary is not found') exit(1) self.probackup_version = None try: self.probackup_version_output = subprocess.check_output( [self.probackup_path, "--version"], stderr=subprocess.STDOUT, ).decode('utf-8') except subprocess.CalledProcessError as e: raise ProbackupException(e.output.decode('utf-8')) self.probackup_version = re.search(r"\d+\.\d+\.\d+", self.probackup_version_output).group(0) if os.name == 'posix': self.EXTERNAL_DIRECTORY_DELIMITER = ':' os.environ['PATH'] = os.path.dirname( self.probackup_path) + ':' + os.environ['PATH'] elif os.name == 'nt': self.EXTERNAL_DIRECTORY_DELIMITER = ';' os.environ['PATH'] = os.path.dirname( self.probackup_path) + ';' + os.environ['PATH'] self.probackup_old_path = None if 'PGPROBACKUPBIN_OLD' in self.test_env: if ( os.path.isfile(self.test_env['PGPROBACKUPBIN_OLD']) and os.access(self.test_env['PGPROBACKUPBIN_OLD'], os.X_OK) ): self.probackup_old_path = self.test_env['PGPROBACKUPBIN_OLD'] else: if self.verbose: print('PGPROBACKUPBIN_OLD is not an executable file') self.remote = False self.remote_host = None self.remote_port = None self.remote_user = None if 'PGPROBACKUP_SSH_REMOTE' in self.test_env: if self.test_env['PGPROBACKUP_SSH_REMOTE'] == 'ON': self.remote = True self.ptrack = False if 'PG_PROBACKUP_PTRACK' in self.test_env: if self.test_env['PG_PROBACKUP_PTRACK'] == 'ON': self.ptrack = True os.environ["PGAPPNAME"] = "pg_probackup" @property def pg_config_version(self): return self.version_to_num( testgres.get_pg_config()['VERSION'].split(" ")[1]) # if 'PGPROBACKUP_SSH_HOST' in self.test_env: # self.remote_host = self.test_env['PGPROBACKUP_SSH_HOST'] # else # print('PGPROBACKUP_SSH_HOST is not set') # exit(1) # # if 'PGPROBACKUP_SSH_PORT' in self.test_env: # self.remote_port = self.test_env['PGPROBACKUP_SSH_PORT'] # else # print('PGPROBACKUP_SSH_PORT is not set') # exit(1) # # if 'PGPROBACKUP_SSH_USER' in self.test_env: # self.remote_user = self.test_env['PGPROBACKUP_SSH_USER'] # else # print('PGPROBACKUP_SSH_USER is not set') # exit(1) def make_simple_node( self, base_dir=None, set_replication=False, ptrack_enable=False, initdb_params=[], pg_options={}): real_base_dir = os.path.join(self.tmp_path, base_dir) shutil.rmtree(real_base_dir, ignore_errors=True) os.makedirs(real_base_dir) node = testgres.get_new_node('test', base_dir=real_base_dir) # bound method slow_start() to 'node' class instance node.slow_start = slow_start.__get__(node) node.should_rm_dirs = True node.init( initdb_params=initdb_params, allow_streaming=set_replication) # set major version with open(os.path.join(node.data_dir, 'PG_VERSION')) as f: node.major_version_str = str(f.read().rstrip()) node.major_version = float(node.major_version_str) # Sane default parameters options = {} options['max_connections'] = 100 options['shared_buffers'] = '10MB' options['fsync'] = 'off' options['wal_level'] = 'logical' options['hot_standby'] = 'off' options['log_line_prefix'] = '%t [%p]: [%l-1] ' options['log_statement'] = 'none' options['log_duration'] = 'on' options['log_min_duration_statement'] = 0 options['log_connections'] = 'on' options['log_disconnections'] = 'on' options['restart_after_crash'] = 'off' # Allow replication in pg_hba.conf if set_replication: options['max_wal_senders'] = 10 if ptrack_enable: if node.major_version >= 11: options['ptrack.map_size'] = '128' options['shared_preload_libraries'] = 'ptrack' else: options['ptrack_enable'] = 'on' if node.major_version >= 13: options['wal_keep_size'] = '200MB' else: options['wal_keep_segments'] = '100' # set default values self.set_auto_conf(node, options) # Apply given parameters self.set_auto_conf(node, pg_options) # kludge for testgres # https://github.com/postgrespro/testgres/issues/54 # for PG >= 13 remove 'wal_keep_segments' parameter if node.major_version >= 13: self.set_auto_conf( node, {}, 'postgresql.conf', ['wal_keep_segments']) return node def create_tblspace_in_node(self, node, tblspc_name, tblspc_path=None, cfs=False): res = node.execute( 'postgres', 'select exists' " (select 1 from pg_tablespace where spcname = '{0}')".format( tblspc_name) ) # Check that tablespace with name 'tblspc_name' do not exists already self.assertFalse( res[0][0], 'Tablespace "{0}" already exists'.format(tblspc_name) ) if not tblspc_path: tblspc_path = os.path.join( node.base_dir, '{0}'.format(tblspc_name)) cmd = "CREATE TABLESPACE {0} LOCATION '{1}'".format( tblspc_name, tblspc_path) if cfs: cmd += ' with (compression=true)' if not os.path.exists(tblspc_path): os.makedirs(tblspc_path) res = node.safe_psql('postgres', cmd) # Check that tablespace was successfully created # self.assertEqual( # res[0], 0, # 'Failed to create tablespace with cmd: {0}'.format(cmd)) def get_tblspace_path(self, node, tblspc_name): return os.path.join(node.base_dir, tblspc_name) def get_fork_size(self, node, fork_name): return node.execute( 'postgres', "select pg_relation_size('{0}')/8192".format(fork_name))[0][0] def get_fork_path(self, node, fork_name): return os.path.join( node.base_dir, 'data', node.execute( 'postgres', "select pg_relation_filepath('{0}')".format( fork_name))[0][0] ) def get_md5_per_page_for_fork(self, file, size_in_pages): pages_per_segment = {} md5_per_page = {} size_in_pages = int(size_in_pages) nsegments = int(size_in_pages/131072) if size_in_pages % 131072 != 0: nsegments = nsegments + 1 size = size_in_pages for segment_number in range(nsegments): if size - 131072 > 0: pages_per_segment[segment_number] = 131072 else: pages_per_segment[segment_number] = size size = size - 131072 for segment_number in range(nsegments): offset = 0 if segment_number == 0: file_desc = os.open(file, os.O_RDONLY) start_page = 0 end_page = pages_per_segment[segment_number] else: file_desc = os.open( file+'.{0}'.format(segment_number), os.O_RDONLY ) start_page = max(md5_per_page)+1 end_page = end_page + pages_per_segment[segment_number] for page in range(start_page, end_page): md5_per_page[page] = hashlib.md5( os.read(file_desc, 8192)).hexdigest() offset += 8192 os.lseek(file_desc, offset, 0) os.close(file_desc) return md5_per_page def get_ptrack_bits_per_page_for_fork(self, node, file, size=[]): if self.get_pgpro_edition(node) == 'enterprise': if self.get_version(node) < self.version_to_num('10.0'): header_size = 48 else: header_size = 24 else: header_size = 24 ptrack_bits_for_fork = [] # TODO: use macro instead of hard coded 8KB page_body_size = 8192-header_size # Check that if main fork file size is 0, it`s ok # to not having a _ptrack fork if os.path.getsize(file) == 0: return ptrack_bits_for_fork byte_size = os.path.getsize(file + '_ptrack') npages = int(byte_size/8192) if byte_size % 8192 != 0: print('Ptrack page is not 8k aligned') exit(1) file = os.open(file + '_ptrack', os.O_RDONLY) for page in range(npages): offset = 8192*page+header_size os.lseek(file, offset, 0) lots_of_bytes = os.read(file, page_body_size) byte_list = [ lots_of_bytes[i:i+1] for i in range(len(lots_of_bytes)) ] for byte in byte_list: # byte_inverted = bin(int(byte, base=16))[2:][::-1] # bits = (byte >> x) & 1 for x in range(7, -1, -1) byte_inverted = bin(ord(byte))[2:].rjust(8, '0')[::-1] for bit in byte_inverted: # if len(ptrack_bits_for_fork) < size: ptrack_bits_for_fork.append(int(bit)) os.close(file) return ptrack_bits_for_fork def check_ptrack_map_sanity(self, node, idx_ptrack): if node.major_version >= 12: return success = True for i in idx_ptrack: # get new size of heap and indexes. size calculated in pages idx_ptrack[i]['new_size'] = self.get_fork_size(node, i) # update path to heap and index files in case they`ve changed idx_ptrack[i]['path'] = self.get_fork_path(node, i) # calculate new md5sums for pages idx_ptrack[i]['new_pages'] = self.get_md5_per_page_for_fork( idx_ptrack[i]['path'], idx_ptrack[i]['new_size']) # get ptrack for every idx idx_ptrack[i]['ptrack'] = self.get_ptrack_bits_per_page_for_fork( node, idx_ptrack[i]['path'], [idx_ptrack[i]['old_size'], idx_ptrack[i]['new_size']]) # compare pages and check ptrack sanity if not self.check_ptrack_sanity(idx_ptrack[i]): success = False self.assertTrue( success, 'Ptrack has failed to register changes in data files') def check_ptrack_sanity(self, idx_dict): success = True if idx_dict['new_size'] > idx_dict['old_size']: size = idx_dict['new_size'] else: size = idx_dict['old_size'] for PageNum in range(size): if PageNum not in idx_dict['old_pages']: # Page was not present before, meaning that relation got bigger # Ptrack should be equal to 1 if idx_dict['ptrack'][PageNum] != 1: if self.verbose: print( 'File: {0}\n Page Number {1} of type {2} was added,' ' but ptrack value is {3}. THIS IS BAD'.format( idx_dict['path'], PageNum, idx_dict['type'], idx_dict['ptrack'][PageNum]) ) # print(idx_dict) success = False continue if PageNum not in idx_dict['new_pages']: # Page is not present now, meaning that relation got smaller # Ptrack should be equal to 1, # We are not freaking out about false positive stuff if idx_dict['ptrack'][PageNum] != 1: if self.verbose: print( 'File: {0}\n Page Number {1} of type {2} was deleted,' ' but ptrack value is {3}. THIS IS BAD'.format( idx_dict['path'], PageNum, idx_dict['type'], idx_dict['ptrack'][PageNum]) ) continue # Ok, all pages in new_pages that do not have # corresponding page in old_pages are been dealt with. # We can now safely proceed to comparing old and new pages if idx_dict['new_pages'][ PageNum] != idx_dict['old_pages'][PageNum]: # Page has been changed, # meaning that ptrack should be equal to 1 if idx_dict['ptrack'][PageNum] != 1: if self.verbose: print( 'File: {0}\n Page Number {1} of type {2} was changed,' ' but ptrack value is {3}. THIS IS BAD'.format( idx_dict['path'], PageNum, idx_dict['type'], idx_dict['ptrack'][PageNum]) ) print( ' Old checksumm: {0}\n' ' New checksumm: {1}'.format( idx_dict['old_pages'][PageNum], idx_dict['new_pages'][PageNum]) ) if PageNum == 0 and idx_dict['type'] == 'spgist': if self.verbose: print( 'SPGIST is a special snowflake, so don`t ' 'fret about losing ptrack for blknum 0' ) continue success = False else: # Page has not been changed, # meaning that ptrack should be equal to 0 if idx_dict['ptrack'][PageNum] != 0: if self.verbose: print( 'File: {0}\n Page Number {1} of type {2} was not changed,' ' but ptrack value is {3}'.format( idx_dict['path'], PageNum, idx_dict['type'], idx_dict['ptrack'][PageNum] ) ) return success # self.assertTrue( # success, 'Ptrack has failed to register changes in data files' # ) def get_backup_filelist(self, backup_dir, instance, backup_id): filelist_path = os.path.join( backup_dir, 'backups', instance, backup_id, 'backup_content.control') with open(filelist_path, 'r') as f: filelist_raw = f.read() filelist_splitted = filelist_raw.splitlines() filelist = {} for line in filelist_splitted: line = json.loads(line) filelist[line['path']] = line return filelist # return dict of files from filelist A, # which are not exists in filelist_B def get_backup_filelist_diff(self, filelist_A, filelist_B): filelist_diff = {} for file in filelist_A: if file not in filelist_B: filelist_diff[file] = filelist_A[file] return filelist_diff # used for partial restore def truncate_every_file_in_dir(self, path): for file in os.listdir(path): with open(os.path.join(path, file), "w") as f: f.close() def check_ptrack_recovery(self, idx_dict): size = idx_dict['size'] for PageNum in range(size): if idx_dict['ptrack'][PageNum] != 1: self.assertTrue( False, 'Recovery for Page Number {0} of Type {1}' ' was conducted, but ptrack value is {2}.' ' THIS IS BAD\n IDX_DICT: {3}'.format( PageNum, idx_dict['type'], idx_dict['ptrack'][PageNum], idx_dict ) ) def check_ptrack_clean(self, idx_dict, size): for PageNum in range(size): if idx_dict['ptrack'][PageNum] != 0: self.assertTrue( False, 'Ptrack for Page Number {0} of Type {1}' ' should be clean, but ptrack value is {2}.' '\n THIS IS BAD\n IDX_DICT: {3}'.format( PageNum, idx_dict['type'], idx_dict['ptrack'][PageNum], idx_dict ) ) def run_pb(self, command, asynchronous=False, gdb=False, old_binary=False, return_id=True): if not self.probackup_old_path and old_binary: print('PGPROBACKUPBIN_OLD is not set') exit(1) if old_binary: binary_path = self.probackup_old_path else: binary_path = self.probackup_path try: self.cmd = [' '.join(map(str, [binary_path] + command))] if self.verbose: print(self.cmd) if gdb: return GDBobj([binary_path] + command, self.verbose) if asynchronous: return subprocess.Popen( self.cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, env=self.test_env ) else: self.output = subprocess.check_output( [binary_path] + command, stderr=subprocess.STDOUT, env=self.test_env ).decode('utf-8') if command[0] == 'backup' and return_id: # return backup ID for line in self.output.splitlines(): if 'INFO: Backup' and 'completed' in line: return line.split()[2] else: return self.output except subprocess.CalledProcessError as e: raise ProbackupException(e.output.decode('utf-8'), self.cmd) def run_binary(self, command, asynchronous=False): if self.verbose: print([' '.join(map(str, command))]) try: if asynchronous: return subprocess.Popen( command, stdin=subprocess.PIPE, stdout=subprocess.PIPE, stderr=subprocess.PIPE, env=self.test_env ) else: self.output = subprocess.check_output( command, stderr=subprocess.STDOUT, env=self.test_env ).decode('utf-8') return self.output except subprocess.CalledProcessError as e: raise ProbackupException(e.output.decode('utf-8'), command) def init_pb(self, backup_dir, options=[], old_binary=False): shutil.rmtree(backup_dir, ignore_errors=True) # don`t forget to kill old_binary after remote ssh release if self.remote and not old_binary: options = options + [ '--remote-proto=ssh', '--remote-host=localhost'] return self.run_pb([ 'init', '-B', backup_dir ] + options, old_binary=old_binary ) def add_instance(self, backup_dir, instance, node, old_binary=False, options=[]): cmd = [ 'add-instance', '--instance={0}'.format(instance), '-B', backup_dir, '-D', node.data_dir ] # don`t forget to kill old_binary after remote ssh release if self.remote and not old_binary: options = options + [ '--remote-proto=ssh', '--remote-host=localhost'] return self.run_pb(cmd + options, old_binary=old_binary) def set_config(self, backup_dir, instance, old_binary=False, options=[]): cmd = [ 'set-config', '--instance={0}'.format(instance), '-B', backup_dir, ] return self.run_pb(cmd + options, old_binary=old_binary) def set_backup(self, backup_dir, instance, backup_id=False, old_binary=False, options=[]): cmd = [ 'set-backup', '-B', backup_dir ] if instance: cmd = cmd + ['--instance={0}'.format(instance)] if backup_id: cmd = cmd + ['-i', backup_id] return self.run_pb(cmd + options, old_binary=old_binary) def del_instance(self, backup_dir, instance, old_binary=False): return self.run_pb([ 'del-instance', '--instance={0}'.format(instance), '-B', backup_dir ], old_binary=old_binary ) def clean_pb(self, backup_dir): shutil.rmtree(backup_dir, ignore_errors=True) def backup_node( self, backup_dir, instance, node, data_dir=False, backup_type='full', datname=False, options=[], asynchronous=False, gdb=False, old_binary=False, return_id=True, no_remote=False ): if not node and not data_dir: print('You must provide ether node or data_dir for backup') exit(1) if not datname: datname = 'postgres' cmd_list = [ 'backup', '-B', backup_dir, '--instance={0}'.format(instance), # "-D", pgdata, '-p', '%i' % node.port, '-d', datname ] if data_dir: cmd_list += ['-D', data_dir] # don`t forget to kill old_binary after remote ssh release if self.remote and not old_binary and not no_remote: options = options + [ '--remote-proto=ssh', '--remote-host=localhost'] if backup_type: cmd_list += ['-b', backup_type] if not old_binary: cmd_list += ['--no-sync'] return self.run_pb(cmd_list + options, asynchronous, gdb, old_binary, return_id) def checkdb_node( self, backup_dir=False, instance=False, data_dir=False, options=[], asynchronous=False, gdb=False, old_binary=False ): cmd_list = ["checkdb"] if backup_dir: cmd_list += ["-B", backup_dir] if instance: cmd_list += ["--instance={0}".format(instance)] if data_dir: cmd_list += ["-D", data_dir] return self.run_pb(cmd_list + options, asynchronous, gdb, old_binary) def merge_backup( self, backup_dir, instance, backup_id, asynchronous=False, gdb=False, old_binary=False, options=[]): cmd_list = [ 'merge', '-B', backup_dir, '--instance={0}'.format(instance), '-i', backup_id ] return self.run_pb(cmd_list + options, asynchronous, gdb, old_binary) def restore_node( self, backup_dir, instance, node=False, data_dir=None, backup_id=None, old_binary=False, options=[], gdb=False ): if data_dir is None: data_dir = node.data_dir cmd_list = [ 'restore', '-B', backup_dir, '-D', data_dir, '--instance={0}'.format(instance) ] # don`t forget to kill old_binary after remote ssh release if self.remote and not old_binary: options = options + [ '--remote-proto=ssh', '--remote-host=localhost'] if backup_id: cmd_list += ['-i', backup_id] if not old_binary: cmd_list += ['--no-sync'] return self.run_pb(cmd_list + options, gdb=gdb, old_binary=old_binary) def show_pb( self, backup_dir, instance=None, backup_id=None, options=[], as_text=False, as_json=True, old_binary=False ): backup_list = [] specific_record = {} cmd_list = [ 'show', '-B', backup_dir, ] if instance: cmd_list += ['--instance={0}'.format(instance)] if backup_id: cmd_list += ['-i', backup_id] # AHTUNG, WARNING will break json parsing if as_json: cmd_list += ['--format=json', '--log-level-console=error'] if as_text: # You should print it when calling as_text=true return self.run_pb(cmd_list + options, old_binary=old_binary) # get show result as list of lines if as_json: data = json.loads(self.run_pb(cmd_list + options, old_binary=old_binary)) # print(data) for instance_data in data: # find specific instance if requested if instance and instance_data['instance'] != instance: continue for backup in reversed(instance_data['backups']): # find specific backup if requested if backup_id: if backup['id'] == backup_id: return backup else: backup_list.append(backup) if backup_id is not None: self.assertTrue(False, "Failed to find backup with ID: {0}".format(backup_id)) return backup_list else: show_splitted = self.run_pb( cmd_list + options, old_binary=old_binary).splitlines() if instance is not None and backup_id is None: # cut header(ID, Mode, etc) from show as single string header = show_splitted[1:2][0] # cut backup records from show as single list # with string for every backup record body = show_splitted[3:] # inverse list so oldest record come first body = body[::-1] # split string in list with string for every header element header_split = re.split(' +', header) # Remove empty items for i in header_split: if i == '': header_split.remove(i) continue header_split = [ header_element.rstrip() for header_element in header_split ] for backup_record in body: backup_record = backup_record.rstrip() # split list with str for every backup record element backup_record_split = re.split(' +', backup_record) # Remove empty items for i in backup_record_split: if i == '': backup_record_split.remove(i) if len(header_split) != len(backup_record_split): print(warning.format( header=header, body=body, header_split=header_split, body_split=backup_record_split) ) exit(1) new_dict = dict(zip(header_split, backup_record_split)) backup_list.append(new_dict) return backup_list else: # cut out empty lines and lines started with # # and other garbage then reconstruct it as dictionary # print show_splitted sanitized_show = [item for item in show_splitted if item] sanitized_show = [ item for item in sanitized_show if not item.startswith('#') ] # print sanitized_show for line in sanitized_show: name, var = line.partition(' = ')[::2] var = var.strip('"') var = var.strip("'") specific_record[name.strip()] = var if not specific_record: self.assertTrue(False, "Failed to find backup with ID: {0}".format(backup_id)) return specific_record def show_archive( self, backup_dir, instance=None, options=[], as_text=False, as_json=True, old_binary=False, tli=0 ): cmd_list = [ 'show', '--archive', '-B', backup_dir, ] if instance: cmd_list += ['--instance={0}'.format(instance)] # AHTUNG, WARNING will break json parsing if as_json: cmd_list += ['--format=json', '--log-level-console=error'] if as_text: # You should print it when calling as_text=true return self.run_pb(cmd_list + options, old_binary=old_binary) if as_json: if as_text: data = self.run_pb(cmd_list + options, old_binary=old_binary) else: data = json.loads(self.run_pb(cmd_list + options, old_binary=old_binary)) if instance: instance_timelines = None for instance_name in data: if instance_name['instance'] == instance: instance_timelines = instance_name['timelines'] break if tli > 0: timeline_data = None for timeline in instance_timelines: if timeline['tli'] == tli: return timeline return {} if instance_timelines: return instance_timelines return data else: show_splitted = self.run_pb( cmd_list + options, old_binary=old_binary).splitlines() print(show_splitted) exit(1) def validate_pb( self, backup_dir, instance=None, backup_id=None, options=[], old_binary=False, gdb=False ): cmd_list = [ 'validate', '-B', backup_dir ] if instance: cmd_list += ['--instance={0}'.format(instance)] if backup_id: cmd_list += ['-i', backup_id] return self.run_pb(cmd_list + options, old_binary=old_binary, gdb=gdb) def delete_pb( self, backup_dir, instance, backup_id=None, options=[], old_binary=False): cmd_list = [ 'delete', '-B', backup_dir ] cmd_list += ['--instance={0}'.format(instance)] if backup_id: cmd_list += ['-i', backup_id] return self.run_pb(cmd_list + options, old_binary=old_binary) def delete_expired( self, backup_dir, instance, options=[], old_binary=False): cmd_list = [ 'delete', '-B', backup_dir, '--instance={0}'.format(instance) ] return self.run_pb(cmd_list + options, old_binary=old_binary) def show_config(self, backup_dir, instance, old_binary=False): out_dict = {} cmd_list = [ 'show-config', '-B', backup_dir, '--instance={0}'.format(instance) ] res = self.run_pb(cmd_list, old_binary=old_binary).splitlines() for line in res: if not line.startswith('#'): name, var = line.partition(' = ')[::2] out_dict[name] = var return out_dict def get_recovery_conf(self, node): out_dict = {} if self.get_version(node) >= self.version_to_num('12.0'): recovery_conf_path = os.path.join( node.data_dir, 'probackup_recovery.conf') else: recovery_conf_path = os.path.join(node.data_dir, 'recovery.conf') with open( recovery_conf_path, 'r' ) as recovery_conf: for line in recovery_conf: try: key, value = line.split('=') except: continue out_dict[key.strip()] = value.strip(" '").replace("'\n", "") return out_dict def set_archiving( self, backup_dir, instance, node, replica=False, overwrite=False, compress=True, old_binary=False, log_level=False, archive_timeout=False): # parse postgresql.auto.conf options = {} if replica: options['archive_mode'] = 'always' options['hot_standby'] = 'on' else: options['archive_mode'] = 'on' if os.name == 'posix': options['archive_command'] = '"{0}" archive-push -B {1} --instance={2} '.format( self.probackup_path, backup_dir, instance) elif os.name == 'nt': options['archive_command'] = '"{0}" archive-push -B {1} --instance={2} '.format( self.probackup_path.replace("\\","\\\\"), backup_dir.replace("\\","\\\\"), instance) # don`t forget to kill old_binary after remote ssh release if self.remote and not old_binary: options['archive_command'] += '--remote-proto=ssh ' options['archive_command'] += '--remote-host=localhost ' if self.archive_compress and compress: options['archive_command'] += '--compress ' if overwrite: options['archive_command'] += '--overwrite ' options['archive_command'] += '--log-level-console=VERBOSE ' options['archive_command'] += '-j 5 ' options['archive_command'] += '--batch-size 10 ' options['archive_command'] += '--no-sync ' if archive_timeout: options['archive_command'] += '--archive-timeout={0} '.format( archive_timeout) if os.name == 'posix': options['archive_command'] += '--wal-file-path=%p --wal-file-name=%f' elif os.name == 'nt': options['archive_command'] += '--wal-file-path="%p" --wal-file-name="%f"' if log_level: options['archive_command'] += ' --log-level-console={0}'.format(log_level) options['archive_command'] += ' --log-level-file={0} '.format(log_level) self.set_auto_conf(node, options) def get_restore_command(self, backup_dir, instance, node): # parse postgresql.auto.conf restore_command = '' if os.name == 'posix': restore_command += '{0} archive-get -B {1} --instance={2} '.format( self.probackup_path, backup_dir, instance) elif os.name == 'nt': restore_command += '"{0}" archive-get -B {1} --instance={2} '.format( self.probackup_path.replace("\\","\\\\"), backup_dir.replace("\\","\\\\"), instance) # don`t forget to kill old_binary after remote ssh release if self.remote: restore_command += '--remote-proto=ssh ' restore_command += '--remote-host=localhost ' if os.name == 'posix': restore_command += '--wal-file-path=%p --wal-file-name=%f' elif os.name == 'nt': restore_command += '--wal-file-path="%p" --wal-file-name="%f"' return restore_command # rm_options - list of parameter name that should be deleted from current config, # example: ['wal_keep_segments', 'max_wal_size'] def set_auto_conf(self, node, options, config='postgresql.auto.conf', rm_options={}): # parse postgresql.auto.conf path = os.path.join(node.data_dir, config) with open(path, 'r') as f: raw_content = f.read() current_options = {} current_directives = [] for line in raw_content.splitlines(): # ignore comments if line.startswith('#'): continue if line == '': continue if line.startswith('include'): current_directives.append(line) continue name, var = line.partition('=')[::2] name = name.strip() var = var.strip() var = var.strip('"') var = var.strip("'") # remove options specified in rm_options list if name in rm_options: continue current_options[name] = var for option in options: current_options[option] = options[option] auto_conf = '' for option in current_options: auto_conf += "{0} = '{1}'\n".format( option, current_options[option]) for directive in current_directives: auto_conf += directive + "\n" with open(path, 'wt') as f: f.write(auto_conf) f.flush() f.close() def set_replica( self, master, replica, replica_name='replica', synchronous=False, log_shipping=False ): self.set_auto_conf( replica, options={ 'port': replica.port, 'hot_standby': 'on'}) if self.get_version(replica) >= self.version_to_num('12.0'): with open(os.path.join(replica.data_dir, "standby.signal"), 'w') as f: f.flush() f.close() config = 'postgresql.auto.conf' probackup_recovery_path = os.path.join(replica.data_dir, 'probackup_recovery.conf') if os.path.exists(probackup_recovery_path): if os.stat(probackup_recovery_path).st_size > 0: config = 'probackup_recovery.conf' if not log_shipping: self.set_auto_conf( replica, {'primary_conninfo': 'user={0} port={1} application_name={2} ' ' sslmode=prefer sslcompression=1'.format( self.user, master.port, replica_name)}, config) else: replica.append_conf('recovery.conf', 'standby_mode = on') if not log_shipping: replica.append_conf( 'recovery.conf', "primary_conninfo = 'user={0} port={1} application_name={2}" " sslmode=prefer sslcompression=1'".format( self.user, master.port, replica_name)) if synchronous: self.set_auto_conf( master, options={ 'synchronous_standby_names': replica_name, 'synchronous_commit': 'remote_apply'}) master.reload() def change_backup_status(self, backup_dir, instance, backup_id, status): control_file_path = os.path.join( backup_dir, 'backups', instance, backup_id, 'backup.control') with open(control_file_path, 'r') as f: actual_control = f.read() new_control_file = '' for line in actual_control.splitlines(): if line.startswith('status'): line = 'status = {0}'.format(status) new_control_file += line new_control_file += '\n' with open(control_file_path, 'wt') as f: f.write(new_control_file) f.flush() f.close() with open(control_file_path, 'r') as f: actual_control = f.read() def wrong_wal_clean(self, node, wal_size): wals_dir = os.path.join(self.backup_dir(node), 'wal') wals = [ f for f in os.listdir(wals_dir) if os.path.isfile( os.path.join(wals_dir, f)) ] wals.sort() file_path = os.path.join(wals_dir, wals[-1]) if os.path.getsize(file_path) != wal_size: os.remove(file_path) def guc_wal_segment_size(self, node): var = node.execute( 'postgres', "select setting from pg_settings where name = 'wal_segment_size'" ) return int(var[0][0]) * self.guc_wal_block_size(node) def guc_wal_block_size(self, node): var = node.execute( 'postgres', "select setting from pg_settings where name = 'wal_block_size'" ) return int(var[0][0]) def get_pgpro_edition(self, node): if node.execute( 'postgres', "select exists (select 1 from" " pg_proc where proname = 'pgpro_edition')" )[0][0]: var = node.execute('postgres', 'select pgpro_edition()') return str(var[0][0]) else: return False def get_username(self): """ Returns current user name """ return getpass.getuser() def version_to_num(self, version): if not version: return 0 parts = version.split('.') while len(parts) < 3: parts.append('0') num = 0 for part in parts: num = num * 100 + int(re.sub("[^\d]", "", part)) return num def switch_wal_segment(self, node): """ Execute pg_switch_wal/xlog() in given node Args: node: an instance of PostgresNode or NodeConnection class """ if isinstance(node, testgres.PostgresNode): if self.version_to_num( node.safe_psql('postgres', 'show server_version').decode('utf-8') ) >= self.version_to_num('10.0'): node.safe_psql('postgres', 'select pg_switch_wal()') else: node.safe_psql('postgres', 'select pg_switch_xlog()') else: if self.version_to_num( node.execute('show server_version')[0][0] ) >= self.version_to_num('10.0'): node.execute('select pg_switch_wal()') else: node.execute('select pg_switch_xlog()') sleep(1) def wait_until_replica_catch_with_master(self, master, replica): version = master.safe_psql( 'postgres', 'show server_version').decode('utf-8').rstrip() if self.version_to_num(version) >= self.version_to_num('10.0'): master_function = 'pg_catalog.pg_current_wal_lsn()' replica_function = 'pg_catalog.pg_last_wal_replay_lsn()' else: master_function = 'pg_catalog.pg_current_xlog_location()' replica_function = 'pg_catalog.pg_last_xlog_replay_location()' lsn = master.safe_psql( 'postgres', 'SELECT {0}'.format(master_function)).decode('utf-8').rstrip() # Wait until replica catch up with master replica.poll_query_until( 'postgres', "SELECT '{0}'::pg_lsn <= {1}".format(lsn, replica_function)) def get_version(self, node): return self.version_to_num( testgres.get_pg_config()['VERSION'].split(" ")[1]) def get_bin_path(self, binary): return testgres.get_bin_path(binary) def del_test_dir(self, module_name, fname, nodes=[]): """ Del testdir and optimistically try to del module dir""" try: testgres.clean_all() except: pass for node in nodes: node.stop() shutil.rmtree( os.path.join( self.tmp_path, module_name, fname ), ignore_errors=True ) try: os.rmdir(os.path.join(self.tmp_path, module_name)) except: pass def pgdata_content(self, pgdata, ignore_ptrack=True, exclude_dirs=None): """ return dict with directory content. " " TAKE IT AFTER CHECKPOINT or BACKUP""" dirs_to_ignore = [ 'pg_xlog', 'pg_wal', 'pg_log', 'pg_stat_tmp', 'pg_subtrans', 'pg_notify' ] files_to_ignore = [ 'postmaster.pid', 'postmaster.opts', 'pg_internal.init', 'postgresql.auto.conf', 'backup_label', 'tablespace_map', 'recovery.conf', 'ptrack_control', 'ptrack_init', 'pg_control', 'probackup_recovery.conf', 'recovery.signal', 'standby.signal', 'ptrack.map', 'ptrack.map.mmap', 'ptrack.map.tmp' ] if exclude_dirs: dirs_to_ignore = dirs_to_ignore + exclude_dirs # suffixes_to_ignore = ( # '_ptrack' # ) directory_dict = {} directory_dict['pgdata'] = pgdata directory_dict['files'] = {} directory_dict['dirs'] = {} for root, dirs, files in os.walk(pgdata, followlinks=True): dirs[:] = [d for d in dirs if d not in dirs_to_ignore] for file in files: if ( file in files_to_ignore or (ignore_ptrack and file.endswith('_ptrack')) ): continue file_fullpath = os.path.join(root, file) file_relpath = os.path.relpath(file_fullpath, pgdata) directory_dict['files'][file_relpath] = {'is_datafile': False} with open(file_fullpath, 'rb') as f: directory_dict['files'][file_relpath]['md5'] = hashlib.md5(f.read()).hexdigest() # directory_dict['files'][file_relpath]['md5'] = hashlib.md5( # f = open(file_fullpath, 'rb').read()).hexdigest() # crappy algorithm if file.isdigit(): directory_dict['files'][file_relpath]['is_datafile'] = True size_in_pages = os.path.getsize(file_fullpath)/8192 directory_dict['files'][file_relpath][ 'md5_per_page'] = self.get_md5_per_page_for_fork( file_fullpath, size_in_pages ) for root, dirs, files in os.walk(pgdata, topdown=False, followlinks=True): for directory in dirs: directory_path = os.path.join(root, directory) directory_relpath = os.path.relpath(directory_path, pgdata) found = False for d in dirs_to_ignore: if d in directory_relpath: found = True break # check if directory already here as part of larger directory if not found: for d in directory_dict['dirs']: # print("OLD dir {0}".format(d)) if directory_relpath in d: found = True break if not found: directory_dict['dirs'][directory_relpath] = {} # get permissions for every file and directory for file in directory_dict['dirs']: full_path = os.path.join(pgdata, file) directory_dict['dirs'][file]['mode'] = os.stat( full_path).st_mode for file in directory_dict['files']: full_path = os.path.join(pgdata, file) directory_dict['files'][file]['mode'] = os.stat( full_path).st_mode return directory_dict def compare_pgdata(self, original_pgdata, restored_pgdata): """ return dict with directory content. DO IT BEFORE RECOVERY""" fail = False error_message = 'Restored PGDATA is not equal to original!\n' # Compare directories for directory in restored_pgdata['dirs']: if directory not in original_pgdata['dirs']: fail = True error_message += '\nDirectory was not present' error_message += ' in original PGDATA: {0}\n'.format( os.path.join(restored_pgdata['pgdata'], directory)) else: if ( restored_pgdata['dirs'][directory]['mode'] != original_pgdata['dirs'][directory]['mode'] ): fail = True error_message += '\nDir permissions mismatch:\n' error_message += ' Dir old: {0} Permissions: {1}\n'.format( os.path.join(original_pgdata['pgdata'], directory), original_pgdata['dirs'][directory]['mode']) error_message += ' Dir new: {0} Permissions: {1}\n'.format( os.path.join(restored_pgdata['pgdata'], directory), restored_pgdata['dirs'][directory]['mode']) for directory in original_pgdata['dirs']: if directory not in restored_pgdata['dirs']: fail = True error_message += '\nDirectory dissappeared' error_message += ' in restored PGDATA: {0}\n'.format( os.path.join(restored_pgdata['pgdata'], directory)) for file in restored_pgdata['files']: # File is present in RESTORED PGDATA # but not present in ORIGINAL # only backup_label is allowed if file not in original_pgdata['files']: fail = True error_message += '\nFile is not present' error_message += ' in original PGDATA: {0}\n'.format( os.path.join(restored_pgdata['pgdata'], file)) for file in original_pgdata['files']: if file in restored_pgdata['files']: if ( restored_pgdata['files'][file]['mode'] != original_pgdata['files'][file]['mode'] ): fail = True error_message += '\nFile permissions mismatch:\n' error_message += ' File_old: {0} Permissions: {1}\n'.format( os.path.join(original_pgdata['pgdata'], file), original_pgdata['files'][file]['mode']) error_message += ' File_new: {0} Permissions: {1}\n'.format( os.path.join(restored_pgdata['pgdata'], file), restored_pgdata['files'][file]['mode']) if ( original_pgdata['files'][file]['md5'] != restored_pgdata['files'][file]['md5'] ): fail = True error_message += ( '\nFile Checksumm mismatch.\n' 'File_old: {0}\nChecksumm_old: {1}\n' 'File_new: {2}\nChecksumm_new: {3}\n').format( os.path.join(original_pgdata['pgdata'], file), original_pgdata['files'][file]['md5'], os.path.join(restored_pgdata['pgdata'], file), restored_pgdata['files'][file]['md5'] ) if original_pgdata['files'][file]['is_datafile']: for page in original_pgdata['files'][file]['md5_per_page']: if page not in restored_pgdata['files'][file]['md5_per_page']: error_message += ( '\n Page {0} dissappeared.\n ' 'File: {1}\n').format( page, os.path.join( restored_pgdata['pgdata'], file ) ) continue if original_pgdata['files'][file][ 'md5_per_page'][page] != restored_pgdata[ 'files'][file]['md5_per_page'][page]: error_message += ( '\n Page checksumm mismatch: {0}\n ' ' PAGE Checksumm_old: {1}\n ' ' PAGE Checksumm_new: {2}\n ' ' File: {3}\n' ).format( page, original_pgdata['files'][file][ 'md5_per_page'][page], restored_pgdata['files'][file][ 'md5_per_page'][page], os.path.join( restored_pgdata['pgdata'], file) ) for page in restored_pgdata['files'][file]['md5_per_page']: if page not in original_pgdata['files'][file]['md5_per_page']: error_message += '\n Extra page {0}\n File: {1}\n'.format( page, os.path.join( restored_pgdata['pgdata'], file)) else: error_message += ( '\nFile disappearance.\n ' 'File: {0}\n').format( os.path.join(restored_pgdata['pgdata'], file) ) fail = True self.assertFalse(fail, error_message) def gdb_attach(self, pid): return GDBobj([str(pid)], self.verbose, attach=True) class GdbException(Exception): def __init__(self, message=False): self.message = message def __str__(self): return '\n ERROR: {0}\n'.format(repr(self.message)) class GDBobj(ProbackupTest): def __init__(self, cmd, verbose, attach=False): self.verbose = verbose # Check gdb presense try: gdb_version, _ = subprocess.Popen( ['gdb', '--version'], stdout=subprocess.PIPE ).communicate() except OSError: raise GdbException("Couldn't find gdb on the path") self.base_cmd = [ 'gdb', '--interpreter', 'mi2', ] if attach: self.cmd = self.base_cmd + ['--pid'] + cmd else: self.cmd = self.base_cmd + ['--args'] + cmd # Get version gdb_version_number = re.search( b"^GNU gdb [^\d]*(\d+)\.(\d)", gdb_version) self.major_version = int(gdb_version_number.group(1)) self.minor_version = int(gdb_version_number.group(2)) if self.verbose: print([' '.join(map(str, self.cmd))]) self.proc = subprocess.Popen( self.cmd, stdin=subprocess.PIPE, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, bufsize=0, universal_newlines=True ) self.gdb_pid = self.proc.pid # discard data from pipe, # is there a way to do it a less derpy way? while True: line = self.proc.stdout.readline() if 'No such process' in line: raise GdbException(line) if not line.startswith('(gdb)'): pass else: break def kill(self): self.proc.kill() self.proc.wait() def set_breakpoint(self, location): result = self._execute('break ' + location) for line in result: if line.startswith('~"Breakpoint'): return elif line.startswith('=breakpoint-created'): return elif line.startswith('^error'): #or line.startswith('(gdb)'): break elif line.startswith('&"break'): pass elif line.startswith('&"Function'): raise GdbException(line) elif line.startswith('&"No line'): raise GdbException(line) elif line.startswith('~"Make breakpoint pending on future shared'): raise GdbException(line) raise GdbException( 'Failed to set breakpoint.\n Output:\n {0}'.format(result) ) def remove_all_breakpoints(self): result = self._execute('delete') for line in result: if line.startswith('^done'): return raise GdbException( 'Failed to remove breakpoints.\n Output:\n {0}'.format(result) ) def run_until_break(self): result = self._execute('run', False) for line in result: if line.startswith('*stopped,reason="breakpoint-hit"'): return raise GdbException( 'Failed to run until breakpoint.\n' ) def continue_execution_until_running(self): result = self._execute('continue') for line in result: if line.startswith('*running') or line.startswith('^running'): return if line.startswith('*stopped,reason="breakpoint-hit"'): continue if line.startswith('*stopped,reason="exited-normally"'): continue raise GdbException( 'Failed to continue execution until running.\n' ) def continue_execution_until_exit(self): result = self._execute('continue', False) for line in result: if line.startswith('*running'): continue if line.startswith('*stopped,reason="breakpoint-hit"'): continue if ( line.startswith('*stopped,reason="exited') or line == '*stopped\n' ): return raise GdbException( 'Failed to continue execution until exit.\n' ) def continue_execution_until_error(self): result = self._execute('continue', False) for line in result: if line.startswith('^error'): return if line.startswith('*stopped,reason="exited'): return if line.startswith( '*stopped,reason="signal-received",signal-name="SIGABRT"'): return raise GdbException( 'Failed to continue execution until error.\n') def continue_execution_until_break(self, ignore_count=0): if ignore_count > 0: result = self._execute( 'continue ' + str(ignore_count), False ) else: result = self._execute('continue', False) for line in result: if line.startswith('*stopped,reason="breakpoint-hit"'): return if line.startswith('*stopped,reason="exited-normally"'): break raise GdbException( 'Failed to continue execution until break.\n') def stopped_in_breakpoint(self): output = [] while True: line = self.proc.stdout.readline() output += [line] if self.verbose: print(line) if line.startswith('*stopped,reason="breakpoint-hit"'): return True return False # use for breakpoint, run, continue def _execute(self, cmd, running=True): output = [] self.proc.stdin.flush() self.proc.stdin.write(cmd + '\n') self.proc.stdin.flush() sleep(1) # look for command we just send while True: line = self.proc.stdout.readline() if self.verbose: print(repr(line)) if cmd not in line: continue else: break while True: line = self.proc.stdout.readline() output += [line] if self.verbose: print(repr(line)) if line.startswith('^done') or line.startswith('*stopped'): break if line.startswith('^error'): break if running and (line.startswith('*running') or line.startswith('^running')): # if running and line.startswith('*running'): break return output