mirror of
				https://github.com/facebook/zstd.git
				synced 2025-10-26 00:02:22 -04:00 
			
		
		
		
	
		
			
				
	
	
		
			277 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
	
	
			
		
		
	
	
			277 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
	
	
| #!/usr/bin/env python3
 | |
| """Test zstd interoperability between versions"""
 | |
| 
 | |
| #
 | |
| # Copyright (c) 2016-present, Yann Collet, Facebook, Inc.
 | |
| # All rights reserved.
 | |
| #
 | |
| # This source code is licensed under the BSD-style license found in the
 | |
| # LICENSE file in the root directory of this source tree. An additional grant
 | |
| # of patent rights can be found in the PATENTS file in the same directory.
 | |
| #
 | |
| 
 | |
| import filecmp
 | |
| import glob
 | |
| import hashlib
 | |
| import os
 | |
| import shutil
 | |
| import sys
 | |
| import subprocess
 | |
| from subprocess import Popen, PIPE
 | |
| 
 | |
# Upstream repository cloned to obtain every released tag.
repo_url = 'https://github.com/facebook/zstd.git'
# Working directory, relative to the repository root.
tmp_dir_name = 'tests/versionsTest'
# External tools invoked through proc().
make_cmd = 'make'
git_cmd = 'git'
# Sample file (source name in the repo root, and its name inside the working dir).
test_dat_src = 'README.md'
test_dat = 'test_dat'
# Pseudo-tag naming the binary built from the current working tree.
head = 'vdevel'
# Directory (inside the working dir) holding the dictionary training files.
dict_source = 'dict_source'
# Space-separated shell glob patterns of the files used to train dictionaries.
dict_files = ' '.join([
    './zstd/programs/*.c',
    './zstd/lib/common/*.c',
    './zstd/lib/compress/*.c',
    './zstd/lib/decompress/*.c',
    './zstd/lib/dictBuilder/*.c',
    './zstd/lib/legacy/*.c',
    './zstd/programs/*.h',
    './zstd/lib/common/*.h',
    './zstd/lib/compress/*.h',
    './zstd/lib/dictBuilder/*.h',
    './zstd/lib/legacy/*.h',
])
 | |
| 
 | |
| 
 | |
def execute(command, print_output=False, print_error=True, param_shell=False):
    """Run `command`, wait for it to finish and return its exit status.

    Args:
        command: argv list, or a single string when `param_shell` is true.
        print_output: when true, print the captured stdout and then stderr.
        print_error: when true (and `print_output` is false), print the
            captured stderr if the command exits with a non-zero status.
        param_shell: forwarded to Popen as `shell`.

    Returns:
        The process return code.
    """
    popen = Popen(command, stdout=PIPE, stderr=PIPE, shell=param_shell)
    raw_stdout, raw_stderr = popen.communicate()
    # The tools under test may emit bytes that are not valid UTF-8; replace
    # them rather than letting a UnicodeDecodeError abort the whole run.
    stderr_lines = raw_stderr.decode("utf-8", errors="replace")
    stdout_lines = raw_stdout.decode("utf-8", errors="replace")
    if print_output:
        print(stdout_lines)
        print(stderr_lines)
    elif print_error and popen.returncode is not None and popen.returncode != 0:
        print(stderr_lines)
    return popen.returncode
 | |
| 
 | |
| 
 | |
def proc(cmd_args, pipe=True, dummy=False):
    """Run `cmd_args` to completion and return Popen.communicate()'s result.

    With `pipe` true, stdout and stderr are captured and returned as bytes;
    otherwise the child inherits the parent's streams and both tuple items
    are None. With `dummy` true nothing is run and None is returned.
    """
    if dummy:
        return
    stream_options = {'stdout': PIPE, 'stderr': PIPE} if pipe else {}
    return Popen(cmd_args, **stream_options).communicate()
 | |
| 
 | |
| 
 | |
def make(args, pipe=True):
    """Run `make_cmd` with the list `args` via proc() and return its result."""
    command_line = [make_cmd] + args
    return proc(command_line, pipe)
 | |
| 
 | |
| 
 | |
def git(args, pipe=True):
    """Run `git_cmd` with the list `args` via proc() and return its result."""
    command_line = [git_cmd] + args
    return proc(command_line, pipe)
 | |
| 
 | |
| 
 | |
def get_git_tags():
    """Return the tags listed by git for the pattern 'v[0-9].[0-9].[0-9]'.

    Runs in the current working directory; the captured output is decoded
    as UTF-8 and split on whitespace.
    """
    listing, _ = git(['tag', '-l', 'v[0-9].[0-9].[0-9]'])
    return listing.decode('utf-8').split()
 | |
| 
 | |
| 
 | |
def create_dict(tag, dict_source_path):
    """Train the dictionary 'dict.<tag>' from the *.c and *.h training files.

    Nothing is done when the dictionary file already exists in the current
    directory. Tag 'v0.5.0' uses the separate './dictBuilder.<tag>' binary;
    every other tag uses './zstd.<tag> -f --train'.

    Args:
        tag: version tag selecting the binary and naming the dictionary.
        dict_source_path: directory containing the training files.
    """
    dict_name = 'dict.' + tag
    if os.path.isfile(dict_name):
        print(dict_name + ' already exists')
        return

    training_files = (glob.glob(dict_source_path + "/*.c")
                      + glob.glob(dict_source_path + "/*.h"))
    if tag == 'v0.5.0':
        command = ['./dictBuilder.' + tag]
    else:
        command = ['./zstd.' + tag, '-f', '--train']
    # Pass an argv list instead of a shell string so that paths containing
    # spaces or shell metacharacters reach the tool unmodified.
    command += training_files + ['-o', dict_name]

    if execute(command, print_output=False) == 0:
        print(dict_name + ' created')
    else:
        print('ERROR: creating of ' + dict_name + ' failed')
 | |
| 
 | |
| 
 | |
def dict_compress_sample(tag, sample):
    """Compress `sample` with './zstd.<tag>' and dictionary 'dict.<tag>'.

    One run is made per level flag below. Each successful run's
    '<sample>.zst' output is renamed to
    '<sample>_<LL>_64_<tag>_dictio.zst'; failed runs are skipped silently.
    The tool's stderr is discarded.
    """
    dict_name = 'dict.' + tag
    zstd_bin = './zstd.' + tag
    # (command-line flag, two-digit level label used in the output name)
    levels = (('-f', '01'), ('-5f', '05'), ('-9f', '09'), ('-15f', '15'), ('-18f', '18'))
    for flag, label in levels:
        # subprocess.DEVNULL avoids leaking an os.devnull file handle.
        status = subprocess.call([zstd_bin, '-D', dict_name, flag, sample],
                                 stderr=subprocess.DEVNULL)
        if status == 0:
            os.rename(sample + '.zst', sample + '_' + label + '_64_' + tag + '_dictio.zst')
    print(tag + " : dict compression completed")
 | |
| 
 | |
| 
 | |
def compress_sample(tag, sample):
    """Compress `sample` with './zstd.<tag>' without a dictionary.

    One run is made per level flag below. Each successful run's
    '<sample>.zst' output is renamed to
    '<sample>_<LL>_64_<tag>_nodict.zst'; failed runs are skipped silently.
    The tool's stderr is discarded.
    """
    zstd_bin = './zstd.' + tag
    # (command-line flag, two-digit level label used in the output name)
    levels = (('-f', '01'), ('-5f', '05'), ('-9f', '09'), ('-15f', '15'), ('-18f', '18'))
    for flag, label in levels:
        # subprocess.DEVNULL avoids leaking an os.devnull file handle.
        status = subprocess.call([zstd_bin, flag, sample], stderr=subprocess.DEVNULL)
        if status == 0:
            os.rename(sample + '.zst', sample + '_' + label + '_64_' + tag + '_nodict.zst')
    print(tag + " : compression completed")
 | |
| 
 | |
| 
 | |
| # http://stackoverflow.com/a/19711609/2132223
 | |
def sha1_of_file(filepath):
    """Return the hexadecimal SHA-1 digest of the file's full contents."""
    digest = hashlib.sha1()
    with open(filepath, 'rb') as stream:
        digest.update(stream.read())
    return digest.hexdigest()
 | |
| 
 | |
| 
 | |
def remove_duplicates():
    """Delete '*.zst' files in the current directory that duplicate an earlier one.

    Files are visited in sorted name order; for each group of files with
    identical contents only the first name is kept, and every removal is
    reported on stdout.
    """
    list_of_zst = sorted(glob.glob('*.zst'))
    for i, ref_zst in enumerate(list_of_zst):
        # Skip names already deleted as duplicates of an earlier file.
        if not os.path.isfile(ref_zst):
            continue
        for compared_zst in list_of_zst[i + 1:]:
            if not os.path.isfile(compared_zst):
                continue
            # shallow=False forces a byte-by-byte comparison. The default
            # (shallow=True) treats files with the same type, size and mtime
            # as equal without reading them, which could delete a file whose
            # contents actually differ.
            if filecmp.cmp(ref_zst, compared_zst, shallow=False):
                os.remove(compared_zst)
                print('duplicated : {} == {}'.format(ref_zst, compared_zst))
 | |
| 
 | |
| 
 | |
def decompress_zst(tag):
    """Decompress every '*_nodict.zst' file with './zstd.<tag>' and verify it.

    Each file is decoded to '<file>_d64_<tag>.dec' and compared with the
    reference sample `test_dat`. One status line is printed per file.

    Returns:
        0 when every file decoded to the reference contents, 1 otherwise.
    """
    dec_error = 0
    for file_zst in sorted(glob.glob('*_nodict.zst')):
        print(file_zst, end=' ')
        print(tag, end=' ')
        file_dec = file_zst + '_d64_' + tag + '.dec'
        # Tags up to v0.5.0 take the output name positionally; later tags
        # take it through '-o'.
        if tag <= 'v0.5.0':
            params = ['./zstd.' + tag, '-df', file_zst, file_dec]
        else:
            params = ['./zstd.' + tag, '-df', file_zst, '-o', file_dec]
        if execute(params) != 0:
            print('command does not work')
            dec_error = 1
        # shallow=False forces a real content comparison; the default would
        # accept any file with the same type, size and mtime as the reference
        # without reading it.
        elif filecmp.cmp(file_dec, test_dat, shallow=False):
            print('OK     ')
        else:
            print('ERR !! ')
            dec_error = 1
    return dec_error
 | |
| 
 | |
| 
 | |
def decompress_dict(tag):
    """Decompress every '*_dictio.zst' file with './zstd.<tag>' and verify it.

    The dictionary 'dict.<producer tag>' is chosen from the tag embedded in
    each file name. Each file is decoded to '<file>_d64_<tag>.dec' and
    compared with the reference sample `test_dat`. One status line is
    printed per file.

    Returns:
        0 when every attempted file decoded to the reference contents,
        1 otherwise.
    """
    suffix = '_dictio.zst'
    dec_error = 0
    for file_zst in sorted(glob.glob('*' + suffix)):
        # Recover the tag of the version that produced this file.
        stem = file_zst[:-len(suffix)]
        if head in stem:  # find vdevel
            dict_tag = head
        else:
            dict_tag = stem[stem.rfind('v'):]
        # v0.6.0 is not asked to decode files produced by earlier tags.
        if tag == 'v0.6.0' and dict_tag < 'v0.6.0':
            continue
        dict_name = 'dict.' + dict_tag
        print(file_zst + ' ' + tag + ' dict=' + dict_tag, end=' ')
        file_dec = file_zst + '_d64_' + tag + '.dec'
        # Tags up to v0.5.0 take the output name positionally; later tags
        # take it through '-o'.
        if tag <= 'v0.5.0':
            params = ['./zstd.' + tag, '-D', dict_name, '-df', file_zst, file_dec]
        else:
            params = ['./zstd.' + tag, '-D', dict_name, '-df', file_zst, '-o', file_dec]
        if execute(params) != 0:
            print('command does not work')
            dec_error = 1
        # shallow=False forces a real content comparison; the default would
        # accept any file with the same type, size and mtime as the reference
        # without reading it.
        elif filecmp.cmp(file_dec, test_dat, shallow=False):
            print('OK     ')
        else:
            print('ERR !! ')
            dec_error = 1
    return dec_error
 | |
| 
 | |
| 
 | |
# Script entry point: build one zstd binary per release tag (plus the current
# tree as `head`), compress the sample with each of them, and check that each
# binary can decode the files present at that point. The exit status is the
# accumulated error count.
if __name__ == '__main__':
    error_code = 0
    # NOTE(review): assumes the script is started from a direct subdirectory
    # of the repository root, so that '<cwd>/..' is the root -- confirm.
    base_dir = os.getcwd() + '/..'                  # /path/to/zstd
    tmp_dir = base_dir + '/' + tmp_dir_name         # /path/to/zstd/tests/versionsTest
    clone_dir = tmp_dir + '/' + 'zstd'              # /path/to/zstd/tests/versionsTest/zstd
    dict_source_path = tmp_dir + '/' + dict_source  # /path/to/zstd/tests/versionsTest/dict_source
    programs_dir = base_dir + '/programs'           # /path/to/zstd/programs
    os.makedirs(tmp_dir, exist_ok=True)

    # since Travis clones limited depth, we should clone full repository
    # (the result of the clone command is not checked here)
    if not os.path.isdir(clone_dir):
        git(['clone', repo_url, clone_dir])

    # The sample to compress is a copy of README.md from the repository root.
    shutil.copy2(base_dir + '/' + test_dat_src, tmp_dir + '/' + test_dat)

    # Retrieve all release tags
    print('Retrieve all release tags :')
    os.chdir(clone_dir)
    alltags = get_git_tags() + [head]
    # Plain string comparison; 'vdevel' sorts after 'v0.4.0' and is kept.
    tags = [t for t in alltags if t >= 'v0.4.0']
    print(tags)

    # Build all release zstd
    for tag in tags:
        os.chdir(base_dir)
        dst_zstd = '{}/zstd.{}'.format(tmp_dir, tag)  # /path/to/zstd/tests/versionsTest/zstd.<TAG>
        # Release binaries are built once and reused; `head` is rebuilt every run.
        if not os.path.isfile(dst_zstd) or tag == head:
            if tag != head:
                r_dir = '{}/{}'.format(tmp_dir, tag)  # /path/to/zstd/tests/versionsTest/<TAG>
                os.makedirs(r_dir, exist_ok=True)
                os.chdir(clone_dir)
                # Check the tag's files out into r_dir, using the clone's git data.
                git(['--work-tree=' + r_dir, 'checkout', tag, '--', '.'], False)
                # v0.5.0 also needs its separate dictBuilder program (see create_dict).
                if tag == 'v0.5.0':
                    os.chdir(r_dir + '/dictBuilder')  # /path/to/zstd/tests/versionsTest/v0.5.0/dictBuilder
                    make(['clean', 'dictBuilder'], False)
                    shutil.copy2('dictBuilder', '{}/dictBuilder.{}'.format(tmp_dir, tag))
                os.chdir(r_dir + '/programs')  # /path/to/zstd/tests/versionsTest/<TAG>/programs
                make(['clean', 'zstd'], False)
            else:
                # `head` is built in place from the current tree's programs directory.
                os.chdir(programs_dir)
                make(['zstd'], False)
            # The cwd is the directory the binary was just built in.
            shutil.copy2('zstd',   dst_zstd)

    # remove any remaining *.zst and *.dec from previous test
    os.chdir(tmp_dir)
    for compressed in glob.glob("*.zst"):
        os.remove(compressed)
    for dec in glob.glob("*.dec"):
        os.remove(dec)

    # copy *.c and *.h to a temporary directory ("dict_source")
    # (dict_files patterns are relative to tmp_dir, i.e. they point into the clone;
    # the shell expands the globs, and the cp result is not checked)
    if not os.path.isdir(dict_source_path):
        os.mkdir(dict_source_path)
        print('cp ' + dict_files + ' ' + dict_source_path)
        execute('cp ' + dict_files + ' ' + dict_source_path, param_shell=True)

    print('Compress test.dat by all released zstd')

    error_code = 0
    # Tags are processed in list order, so each version decodes the files
    # produced by itself and by the tags processed before it.
    for tag in tags:
        print(tag)
        # Dictionary round-trips are only run for tags >= v0.5.0.
        if tag >= 'v0.5.0':
            create_dict(tag, dict_source_path)
            dict_compress_sample(tag, test_dat)
            remove_duplicates()
            error_code += decompress_dict(tag)
        compress_sample(tag, test_dat)
        remove_duplicates()
        error_code += decompress_zst(tag)

    print('')
    print('Enumerate different compressed files')
    zstds = sorted(glob.glob('*.zst'))
    for zstd in zstds:
        print(zstd + ' : ' + repr(os.path.getsize(zstd)) + ', ' + sha1_of_file(zstd))

    if error_code != 0:
        print('======  ERROR !!!  =======')

    # A non-zero exit status signals that at least one decode check failed.
    sys.exit(error_code)
 |