mercurial-scm/hg-stable: contrib/python-zstandard/tests/test_compressor

comparison contrib/python-zstandard/tests/test_compressor_fuzzing.py @ 42070:675775c33ab6

zstandard: vendor python-zstandard 0.11 The upstream source distribution from PyPI was extracted. Unwanted files were removed. The clang-format ignore list was updated to reflect the new source of files. The project contains a vendored copy of zstandard 1.3.8. The old version was 1.3.6. This should result in some minor performance wins. test-check-py3-compat.t was updated to reflect now-passing tests on Python 3.8. Some HTTP tests were updated to reflect new zstd compression output. # no-check-commit because 3rd party code has different style guidelines Differential Revision: https://phab.mercurial-scm.org/D6199

author	Gregory Szorc <gregory.szorc@gmail.com>
date	Thu, 04 Apr 2019 17:34:43 -0700
parents	73fef626dae3
children	de7838053207

comparison

equal deleted inserted replaced

-:668eff08387f
+:675775c33ab6
 import zstandard as zstd
 from . common import (
 make_cffi,
+NonClosingBytesIO,
 random_input_data,
 )
 @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
 @make_cffi
 class TestCompressor_stream_reader_fuzzing(unittest.TestCase):
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_size=strategies.integers(
        -1, zstd.COMPRESSION_RECOMMENDED_OUTPUT_SIZE))
def test_stream_source_read(self, original, level, source_read_size,
                            read_size):
    """Fixed-size ``read()`` calls over a file-object source.

    Drains a ``stream_reader`` wrapping ``io.BytesIO(original)`` with
    repeated ``read(read_size)`` calls and checks that the concatenated
    output equals the frame produced by a one-shot ``compress()`` at the
    same level.
    """
    # The strategy can produce 0; that value is replaced with -1 before
    # reading.  NOTE(review): presumably because read(0) yields b'' and
    # would end the loop below immediately -- confirm.
    request = -1 if read_size == 0 else read_size

    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(io.BytesIO(original),
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        # Keep reading until a call hands back nothing.
        piece = reader.read(request)
        while piece:
            pieces.append(piece)
            piece = reader.read(request)

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_size=strategies.integers(
        -1, zstd.COMPRESSION_RECOMMENDED_OUTPUT_SIZE))
def test_buffer_source_read(self, original, level, source_read_size,
                            read_size):
    """Fixed-size ``read()`` calls with the input passed as a buffer.

    ``original`` is handed to ``stream_reader`` directly (not wrapped in
    a file object).  The reader is drained with ``read(read_size)`` and
    the joined output must equal the one-shot ``compress()`` frame.
    """
    # The strategy can produce 0; that value is replaced with -1 before
    # reading.  NOTE(review): presumably because read(0) yields b'' and
    # would end the loop below immediately -- confirm.
    request = -1 if read_size == 0 else read_size

    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(original,
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        # Keep reading until a call hands back nothing.
        piece = reader.read(request)
        while piece:
            pieces.append(piece)
            piece = reader.read(request)

    self.assertEqual(b''.join(pieces), expected)
+@hypothesis.settings(
+suppress_health_check=[hypothesis.HealthCheck.large_base_example])
 @hypothesis.given(original=strategies.sampled_from(random_input_data()),
 level=strategies.integers(min_value=1, max_value=5),
 source_read_size=strategies.integers(1, 16384),
 read_sizes=strategies.data())
 def test_stream_source_read_variance(self, original, level, source_read_size,
 cctx = zstd.ZstdCompressor(level=level)
 with cctx.stream_reader(io.BytesIO(original), size=len(original),
 read_size=source_read_size) as reader:
 chunks = []
 while True:
-read_size = read_sizes.draw(strategies.integers(1, 16384))
+read_size = read_sizes.draw(strategies.integers(-1, 16384))
 chunk = reader.read(read_size)
+if not chunk and read_size:
-if not chunk:
+break
-break
 chunks.append(chunk)
 self.assertEqual(b''.join(chunks), ref_frame)
+@hypothesis.settings(
+suppress_health_check=[hypothesis.HealthCheck.large_base_example])
 @hypothesis.given(original=strategies.sampled_from(random_input_data()),
 level=strategies.integers(min_value=1, max_value=5),
 source_read_size=strategies.integers(1, 16384),
 read_sizes=strategies.data())
 def test_buffer_source_read_variance(self, original, level, source_read_size,
 cctx = zstd.ZstdCompressor(level=level)
 with cctx.stream_reader(original, size=len(original),
 read_size=source_read_size) as reader:
 chunks = []
 while True:
+read_size = read_sizes.draw(strategies.integers(-1, 16384))
+chunk = reader.read(read_size)
+if not chunk and read_size:
+break
+chunks.append(chunk)
+self.assertEqual(b''.join(chunks), ref_frame)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_size=strategies.integers(
        1, zstd.COMPRESSION_RECOMMENDED_OUTPUT_SIZE))
def test_stream_source_readinto(self, original, level,
                                source_read_size, read_size):
    """Fixed-size ``readinto()`` calls over a file-object source.

    Each iteration allocates a fresh ``bytearray`` of ``read_size``
    bytes, fills it via ``readinto()`` and keeps only the bytes the call
    reported.  The joined output must equal the one-shot ``compress()``
    frame.
    """
    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(io.BytesIO(original),
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        while True:
            scratch = bytearray(read_size)
            filled = reader.readinto(scratch)
            if filled:
                # Only the first ``filled`` bytes of the buffer are output.
                pieces.append(bytes(scratch[:filled]))
            else:
                break

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_size=strategies.integers(
        1, zstd.COMPRESSION_RECOMMENDED_OUTPUT_SIZE))
def test_buffer_source_readinto(self, original, level,
                                source_read_size, read_size):
    """Fixed-size ``readinto()`` calls with the input passed as a buffer.

    ``original`` is handed to ``stream_reader`` directly.  Each iteration
    fills a fresh ``bytearray`` of ``read_size`` bytes and keeps the
    bytes the call reported; the joined output must equal the one-shot
    ``compress()`` frame.
    """
    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(original,
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        while True:
            scratch = bytearray(read_size)
            filled = reader.readinto(scratch)
            if filled:
                # Only the first ``filled`` bytes of the buffer are output.
                pieces.append(bytes(scratch[:filled]))
            else:
                break

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_sizes=strategies.data())
def test_stream_source_readinto_variance(self, original, level,
                                         source_read_size, read_sizes):
    """Variable-size ``readinto()`` calls over a file-object source.

    A new buffer length between 1 and 16384 is drawn from ``read_sizes``
    for every call.  The bytes collected across all calls must equal the
    one-shot ``compress()`` frame.
    """
    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(io.BytesIO(original),
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        while True:
            capacity = read_sizes.draw(strategies.integers(1, 16384))
            scratch = bytearray(capacity)
            filled = reader.readinto(scratch)
            if filled:
                # Only the first ``filled`` bytes of the buffer are output.
                pieces.append(bytes(scratch[:filled]))
            else:
                break

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_sizes=strategies.data())
def test_buffer_source_readinto_variance(self, original, level,
                                         source_read_size, read_sizes):
    """Variable-size ``readinto()`` calls with the input passed as a buffer.

    ``original`` is handed to ``stream_reader`` directly.  A new buffer
    length between 1 and 16384 is drawn from ``read_sizes`` for every
    call, and the collected bytes must equal the one-shot ``compress()``
    frame.
    """
    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(original,
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        while True:
            capacity = read_sizes.draw(strategies.integers(1, 16384))
            scratch = bytearray(capacity)
            filled = reader.readinto(scratch)
            if filled:
                # Only the first ``filled`` bytes of the buffer are output.
                pieces.append(bytes(scratch[:filled]))
            else:
                break

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_size=strategies.integers(
        -1, zstd.COMPRESSION_RECOMMENDED_OUTPUT_SIZE))
def test_stream_source_read1(self, original, level, source_read_size,
                             read_size):
    """Fixed-size ``read1()`` calls over a file-object source.

    Drains a ``stream_reader`` wrapping ``io.BytesIO(original)`` with
    repeated ``read1(read_size)`` calls and checks that the concatenated
    output equals the one-shot ``compress()`` frame.
    """
    # The strategy can produce 0; that value is replaced with -1 before
    # reading.  NOTE(review): presumably because read1(0) yields b'' and
    # would end the loop below immediately -- confirm.
    request = -1 if read_size == 0 else read_size

    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(io.BytesIO(original),
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        # Keep reading until a call hands back nothing.
        piece = reader.read1(request)
        while piece:
            pieces.append(piece)
            piece = reader.read1(request)

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_size=strategies.integers(
        -1, zstd.COMPRESSION_RECOMMENDED_OUTPUT_SIZE))
def test_buffer_source_read1(self, original, level, source_read_size,
                             read_size):
    """Fixed-size ``read1()`` calls with the input passed as a buffer.

    ``original`` is handed to ``stream_reader`` directly.  The reader is
    drained with ``read1(read_size)`` and the joined output must equal
    the one-shot ``compress()`` frame.
    """
    # The strategy can produce 0; that value is replaced with -1 before
    # reading.  NOTE(review): presumably because read1(0) yields b'' and
    # would end the loop below immediately -- confirm.
    request = -1 if read_size == 0 else read_size

    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(original,
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        # Keep reading until a call hands back nothing.
        piece = reader.read1(request)
        while piece:
            pieces.append(piece)
            piece = reader.read1(request)

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_sizes=strategies.data())
def test_stream_source_read1_variance(self, original, level, source_read_size,
                                      read_sizes):
    """Variable-size ``read1()`` calls over a file-object source.

    A new request size between -1 and 16384 is drawn from ``read_sizes``
    for every call.  The joined output must equal the one-shot
    ``compress()`` frame.
    """
    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(io.BytesIO(original),
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        while True:
            request = read_sizes.draw(strategies.integers(-1, 16384))
            piece = reader.read1(request)
            # An empty result only ends the loop when the request size
            # was non-zero; a size-0 request just goes round again.
            if piece or request == 0:
                pieces.append(piece)
                continue
            break

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_sizes=strategies.data())
def test_buffer_source_read1_variance(self, original, level, source_read_size,
                                      read_sizes):
    """Variable-size ``read1()`` calls with the input passed as a buffer.

    ``original`` is handed to ``stream_reader`` directly.  A new request
    size between -1 and 16384 is drawn from ``read_sizes`` for every
    call, and the joined output must equal the one-shot ``compress()``
    frame.
    """
    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(original,
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        while True:
            request = read_sizes.draw(strategies.integers(-1, 16384))
            piece = reader.read1(request)
            # An empty result only ends the loop when the request size
            # was non-zero; a size-0 request just goes round again.
            if piece or request == 0:
                pieces.append(piece)
                continue
            break

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(original=strategies.sampled_from(random_input_data()),
                  level=strategies.integers(min_value=1, max_value=5),
                  source_read_size=strategies.integers(1, 16384),
                  read_size=strategies.integers(1, zstd.COMPRESSION_RECOMMENDED_OUTPUT_SIZE))
def test_stream_source_readinto1(self, original, level, source_read_size,
                                 read_size):
    """Fixed-size ``readinto1()`` calls over a file-object source.

    Each iteration allocates a fresh ``bytearray`` of ``read_size``
    bytes, fills it via ``readinto1()`` and keeps only the bytes the call
    reported.  The joined output must equal the frame produced by a
    one-shot ``compress()`` at the same level.
    """
    # No zero-size remap is needed here: the strategy's lower bound is 1,
    # and read_size is used as a bytearray length, for which -1 would be
    # invalid anyway.
    refctx = zstd.ZstdCompressor(level=level)
    ref_frame = refctx.compress(original)

    cctx = zstd.ZstdCompressor(level=level)
    with cctx.stream_reader(io.BytesIO(original), size=len(original),
                            read_size=source_read_size) as reader:
        chunks = []
        while True:
            b = bytearray(read_size)
            count = reader.readinto1(b)

            # A call that reports zero bytes ends the loop.
            if not count:
                break

            chunks.append(bytes(b[0:count]))

    self.assertEqual(b''.join(chunks), ref_frame)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(original=strategies.sampled_from(random_input_data()),
                  level=strategies.integers(min_value=1, max_value=5),
                  source_read_size=strategies.integers(1, 16384),
                  read_size=strategies.integers(1, zstd.COMPRESSION_RECOMMENDED_OUTPUT_SIZE))
def test_buffer_source_readinto1(self, original, level, source_read_size,
                                 read_size):
    """Fixed-size ``readinto1()`` calls with the input passed as a buffer.

    ``original`` is handed to ``stream_reader`` directly.  Each iteration
    fills a fresh ``bytearray`` of ``read_size`` bytes via
    ``readinto1()`` and keeps the bytes the call reported; the joined
    output must equal the one-shot ``compress()`` frame.
    """
    # No zero-size remap is needed here: the strategy's lower bound is 1,
    # and read_size is used as a bytearray length, for which -1 would be
    # invalid anyway.
    refctx = zstd.ZstdCompressor(level=level)
    ref_frame = refctx.compress(original)

    cctx = zstd.ZstdCompressor(level=level)
    with cctx.stream_reader(original, size=len(original),
                            read_size=source_read_size) as reader:
        chunks = []
        while True:
            b = bytearray(read_size)
            count = reader.readinto1(b)

            # A call that reports zero bytes ends the loop.
            if not count:
                break

            chunks.append(bytes(b[0:count]))

    self.assertEqual(b''.join(chunks), ref_frame)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_sizes=strategies.data())
def test_stream_source_readinto1_variance(self, original, level, source_read_size,
                                          read_sizes):
    """Variable-size ``readinto1()`` calls over a file-object source.

    A new buffer length between 1 and 16384 is drawn from ``read_sizes``
    for every call.  The bytes collected across all calls must equal the
    one-shot ``compress()`` frame.
    """
    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(io.BytesIO(original),
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        while True:
            capacity = read_sizes.draw(strategies.integers(1, 16384))
            scratch = bytearray(capacity)
            filled = reader.readinto1(scratch)
            if filled:
                # Only the first ``filled`` bytes of the buffer are output.
                pieces.append(bytes(scratch[:filled]))
            else:
                break

    self.assertEqual(b''.join(pieces), expected)
@hypothesis.settings(
    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
@hypothesis.given(
    original=strategies.sampled_from(random_input_data()),
    level=strategies.integers(min_value=1, max_value=5),
    source_read_size=strategies.integers(1, 16384),
    read_sizes=strategies.data())
def test_buffer_source_readinto1_variance(self, original, level, source_read_size,
                                          read_sizes):
    """Variable-size ``readinto1()`` calls with the input passed as a buffer.

    ``original`` is handed to ``stream_reader`` directly.  A new buffer
    length between 1 and 16384 is drawn from ``read_sizes`` for every
    call, and the collected bytes must equal the one-shot ``compress()``
    frame.
    """
    expected = zstd.ZstdCompressor(level=level).compress(original)

    compressor = zstd.ZstdCompressor(level=level)
    pieces = []
    with compressor.stream_reader(original,
                                  size=len(original),
                                  read_size=source_read_size) as reader:
        while True:
            capacity = read_sizes.draw(strategies.integers(1, 16384))
            scratch = bytearray(capacity)
            filled = reader.readinto1(scratch)
            if filled:
                # Only the first ``filled`` bytes of the buffer are output.
                pieces.append(bytes(scratch[:filled]))
            else:
                break

    self.assertEqual(b''.join(pieces), expected)
 @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
 @make_cffi
 class TestCompressor_stream_writer_fuzzing(unittest.TestCase):
 def test_write_size_variance(self, original, level, write_size):
 refctx = zstd.ZstdCompressor(level=level)
 ref_frame = refctx.compress(original)
 cctx = zstd.ZstdCompressor(level=level)
-b = io.BytesIO()
+b = NonClosingBytesIO()
 with cctx.stream_writer(b, size=len(original), write_size=write_size) as compressor:
 compressor.write(original)
 self.assertEqual(b.getvalue(), ref_frame)
 cctx = zstd.ZstdCompressor(level=1,
 write_checksum=True,
 **kwargs)
+if not hasattr(cctx, 'multi_compress_to_buffer'):
+self.skipTest('multi_compress_to_buffer not available')
 result = cctx.multi_compress_to_buffer(original, threads=-1)
 self.assertEqual(len(result), len(original))
 # The frame produced via the batch APIs may not be bit identical to that

Mercurial > public > mercurial-scm > hg-stable

comparison contrib/python-zstandard/tests/test_compressor_fuzzing.py @ 42070:675775c33ab6