upstream/mercurial-mirror Files · contrib/python-zstandard/tests/test_decompressor_fuzzing.py

linelog: optimize replacelines...

linelog: optimize replacelines The optimization to avoid calling `annotate` inside `replacelines` is significant for practical use patterns. Before this patch: hg perflinelogedits ! wall 6.778478 comb 6.710000 user 6.700000 sys 0.010000 (best of 3) After this patch: hg perflinelogedits ! wall 0.136573 comb 0.140000 user 0.130000 sys 0.010000 (best of 63) Differential Revision: https://phab.mercurial-scm.org/D4150

Gregory Szorc - - Load All Authors

File last commit:

r37513:b1fb341d default


                r39007:ee97f7a6

default

Download file

             test_decompressor_fuzzing.py
        
                    252 lines
            
             | 9.7 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / contrib / python-zstandard / tests / test_decompressor_fuzzing.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      import io

      import os

      import unittest

      try:

          import hypothesis

          import hypothesis.strategies as strategies

      except ImportError:

          raise unittest.SkipTest('hypothesis not available')

      import zstandard as zstd

      from . common import (

          make_cffi,

          random_input_data,

      )

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      @make_cffi

      class TestDecompressor_stream_reader_fuzzing(unittest.TestCase):

          @hypothesis.settings(

              suppress_health_check=[hypothesis.HealthCheck.large_base_example])

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            source_read_size=strategies.integers(1, 16384),

                            read_sizes=strategies.data())

          def test_stream_source_read_variance(self, original, level, source_read_size,

                                               read_sizes):

              cctx = zstd.ZstdCompressor(level=level)

              frame = cctx.compress(original)

              dctx = zstd.ZstdDecompressor()

              source = io.BytesIO(frame)

              chunks = []

              with dctx.stream_reader(source, read_size=source_read_size) as reader:

                  while True:

                      read_size = read_sizes.draw(strategies.integers(1, 16384))

                      chunk = reader.read(read_size)

                      if not chunk:

                          break

                      chunks.append(chunk)

              self.assertEqual(b''.join(chunks), original)

          @hypothesis.settings(

              suppress_health_check=[hypothesis.HealthCheck.large_base_example])

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            source_read_size=strategies.integers(1, 16384),

                            read_sizes=strategies.data())

          def test_buffer_source_read_variance(self, original, level, source_read_size,

                                               read_sizes):

              cctx = zstd.ZstdCompressor(level=level)

              frame = cctx.compress(original)

              dctx = zstd.ZstdDecompressor()

              chunks = []

              with dctx.stream_reader(frame, read_size=source_read_size) as reader:

                  while True:

                      read_size = read_sizes.draw(strategies.integers(1, 16384))

                      chunk = reader.read(read_size)

                      if not chunk:

                          break

                      chunks.append(chunk)

              self.assertEqual(b''.join(chunks), original)

          @hypothesis.settings(

              suppress_health_check=[hypothesis.HealthCheck.large_base_example])

          @hypothesis.given(

              original=strategies.sampled_from(random_input_data()),

              level=strategies.integers(min_value=1, max_value=5),

              source_read_size=strategies.integers(1, 16384),

              seek_amounts=strategies.data(),

              read_sizes=strategies.data())

          def test_relative_seeks(self, original, level, source_read_size, seek_amounts,

                                  read_sizes):

              cctx = zstd.ZstdCompressor(level=level)

              frame = cctx.compress(original)

              dctx = zstd.ZstdDecompressor()

              with dctx.stream_reader(frame, read_size=source_read_size) as reader:

                  while True:

                      amount = seek_amounts.draw(strategies.integers(0, 16384))

                      reader.seek(amount, os.SEEK_CUR)

                      offset = reader.tell()

                      read_amount = read_sizes.draw(strategies.integers(1, 16384))

                      chunk = reader.read(read_amount)

                      if not chunk:

                          break

                      self.assertEqual(original[offset:offset + len(chunk)], chunk)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      @make_cffi

      class TestDecompressor_stream_writer_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            write_size=strategies.integers(min_value=1, max_value=8192),

                            input_sizes=strategies.data())

          def test_write_size_variance(self, original, level, write_size, input_sizes):

              cctx = zstd.ZstdCompressor(level=level)

              frame = cctx.compress(original)

              dctx = zstd.ZstdDecompressor()

              source = io.BytesIO(frame)

              dest = io.BytesIO()

              with dctx.stream_writer(dest, write_size=write_size) as decompressor:

                  while True:

                      input_size = input_sizes.draw(strategies.integers(1, 4096))

                      chunk = source.read(input_size)

                      if not chunk:

                          break

                      decompressor.write(chunk)

              self.assertEqual(dest.getvalue(), original)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      @make_cffi

      class TestDecompressor_copy_stream_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            read_size=strategies.integers(min_value=1, max_value=8192),

                            write_size=strategies.integers(min_value=1, max_value=8192))

          def test_read_write_size_variance(self, original, level, read_size, write_size):

              cctx = zstd.ZstdCompressor(level=level)

              frame = cctx.compress(original)

              source = io.BytesIO(frame)

              dest = io.BytesIO()

              dctx = zstd.ZstdDecompressor()

              dctx.copy_stream(source, dest, read_size=read_size, write_size=write_size)

              self.assertEqual(dest.getvalue(), original)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      @make_cffi

      class TestDecompressor_decompressobj_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            chunk_sizes=strategies.data())

          def test_random_input_sizes(self, original, level, chunk_sizes):

              cctx = zstd.ZstdCompressor(level=level)

              frame = cctx.compress(original)

              source = io.BytesIO(frame)

              dctx = zstd.ZstdDecompressor()

              dobj = dctx.decompressobj()

              chunks = []

              while True:

                  chunk_size = chunk_sizes.draw(strategies.integers(1, 4096))

                  chunk = source.read(chunk_size)

                  if not chunk:

                      break

                  chunks.append(dobj.decompress(chunk))

              self.assertEqual(b''.join(chunks), original)

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            write_size=strategies.integers(min_value=1,

                                                           max_value=4 * zstd.DECOMPRESSION_RECOMMENDED_OUTPUT_SIZE),

                            chunk_sizes=strategies.data())

          def test_random_output_sizes(self, original, level, write_size, chunk_sizes):

              cctx = zstd.ZstdCompressor(level=level)

              frame = cctx.compress(original)

              source = io.BytesIO(frame)

              dctx = zstd.ZstdDecompressor()

              dobj = dctx.decompressobj(write_size=write_size)

              chunks = []

              while True:

                  chunk_size = chunk_sizes.draw(strategies.integers(1, 4096))

                  chunk = source.read(chunk_size)

                  if not chunk:

                      break

                  chunks.append(dobj.decompress(chunk))

              self.assertEqual(b''.join(chunks), original)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      @make_cffi

      class TestDecompressor_read_to_iter_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            read_size=strategies.integers(min_value=1, max_value=4096),

                            write_size=strategies.integers(min_value=1, max_value=4096))

          def test_read_write_size_variance(self, original, level, read_size, write_size):

              cctx = zstd.ZstdCompressor(level=level)

              frame = cctx.compress(original)

              source = io.BytesIO(frame)

              dctx = zstd.ZstdDecompressor()

              chunks = list(dctx.read_to_iter(source, read_size=read_size, write_size=write_size))

              self.assertEqual(b''.join(chunks), original)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      class TestDecompressor_multi_decompress_to_buffer_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.lists(strategies.sampled_from(random_input_data()),

                                              min_size=1, max_size=1024),

                      threads=strategies.integers(min_value=1, max_value=8),

                      use_dict=strategies.booleans())

          def test_data_equivalence(self, original, threads, use_dict):

              kwargs = {}

              if use_dict:

                  kwargs['dict_data'] = zstd.ZstdCompressionDict(original[0])

              cctx = zstd.ZstdCompressor(level=1,

                                         write_content_size=True,

                                         write_checksum=True,

                                         **kwargs)

              frames_buffer = cctx.multi_compress_to_buffer(original, threads=-1)

              dctx = zstd.ZstdDecompressor(**kwargs)

              result = dctx.multi_decompress_to_buffer(frames_buffer)

              self.assertEqual(len(result), len(original))

              for i, frame in enumerate(result):

                  self.assertEqual(frame.tobytes(), original[i])

              frames_list = [f.tobytes() for f in frames_buffer]

              result = dctx.multi_decompress_to_buffer(frames_list)

              self.assertEqual(len(result), len(original))

              for i, frame in enumerate(result):

                  self.assertEqual(frame.tobytes(), original[i])

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				import io
				import os
				import unittest

				try:
				import hypothesis
				import hypothesis.strategies as strategies
				except ImportError:
				raise unittest.SkipTest('hypothesis not available')

				import zstandard as zstd

				from . common import (
				make_cffi,
				random_input_data,
				)


				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_stream_reader_fuzzing(unittest.TestCase):
				@hypothesis.settings(
				suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(original=strategies.sampled_from(random_input_data()),
				level=strategies.integers(min_value=1, max_value=5),
				source_read_size=strategies.integers(1, 16384),
				read_sizes=strategies.data())
				def test_stream_source_read_variance(self, original, level, source_read_size,
				read_sizes):
				cctx = zstd.ZstdCompressor(level=level)
				frame = cctx.compress(original)

				dctx = zstd.ZstdDecompressor()
				source = io.BytesIO(frame)

				chunks = []
				with dctx.stream_reader(source, read_size=source_read_size) as reader:
				while True:
				read_size = read_sizes.draw(strategies.integers(1, 16384))
				chunk = reader.read(read_size)
				if not chunk:
				break

				chunks.append(chunk)

				self.assertEqual(b''.join(chunks), original)

				@hypothesis.settings(
				suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(original=strategies.sampled_from(random_input_data()),
				level=strategies.integers(min_value=1, max_value=5),
				source_read_size=strategies.integers(1, 16384),
				read_sizes=strategies.data())
				def test_buffer_source_read_variance(self, original, level, source_read_size,
				read_sizes):
				cctx = zstd.ZstdCompressor(level=level)
				frame = cctx.compress(original)

				dctx = zstd.ZstdDecompressor()
				chunks = []

				with dctx.stream_reader(frame, read_size=source_read_size) as reader:
				while True:
				read_size = read_sizes.draw(strategies.integers(1, 16384))
				chunk = reader.read(read_size)
				if not chunk:
				break

				chunks.append(chunk)

				self.assertEqual(b''.join(chunks), original)

				@hypothesis.settings(
				suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(
				original=strategies.sampled_from(random_input_data()),
				level=strategies.integers(min_value=1, max_value=5),
				source_read_size=strategies.integers(1, 16384),
				seek_amounts=strategies.data(),
				read_sizes=strategies.data())
				def test_relative_seeks(self, original, level, source_read_size, seek_amounts,
				read_sizes):
				cctx = zstd.ZstdCompressor(level=level)
				frame = cctx.compress(original)

				dctx = zstd.ZstdDecompressor()

				with dctx.stream_reader(frame, read_size=source_read_size) as reader:
				while True:
				amount = seek_amounts.draw(strategies.integers(0, 16384))
				reader.seek(amount, os.SEEK_CUR)

				offset = reader.tell()
				read_amount = read_sizes.draw(strategies.integers(1, 16384))
				chunk = reader.read(read_amount)

				if not chunk:
				break

				self.assertEqual(original[offset:offset + len(chunk)], chunk)


				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_stream_writer_fuzzing(unittest.TestCase):
				@hypothesis.given(original=strategies.sampled_from(random_input_data()),
				level=strategies.integers(min_value=1, max_value=5),
				write_size=strategies.integers(min_value=1, max_value=8192),
				input_sizes=strategies.data())
				def test_write_size_variance(self, original, level, write_size, input_sizes):
				cctx = zstd.ZstdCompressor(level=level)
				frame = cctx.compress(original)

				dctx = zstd.ZstdDecompressor()
				source = io.BytesIO(frame)
				dest = io.BytesIO()

				with dctx.stream_writer(dest, write_size=write_size) as decompressor:
				while True:
				input_size = input_sizes.draw(strategies.integers(1, 4096))
				chunk = source.read(input_size)
				if not chunk:
				break

				decompressor.write(chunk)

				self.assertEqual(dest.getvalue(), original)


				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_copy_stream_fuzzing(unittest.TestCase):
				@hypothesis.given(original=strategies.sampled_from(random_input_data()),
				level=strategies.integers(min_value=1, max_value=5),
				read_size=strategies.integers(min_value=1, max_value=8192),
				write_size=strategies.integers(min_value=1, max_value=8192))
				def test_read_write_size_variance(self, original, level, read_size, write_size):
				cctx = zstd.ZstdCompressor(level=level)
				frame = cctx.compress(original)

				source = io.BytesIO(frame)
				dest = io.BytesIO()

				dctx = zstd.ZstdDecompressor()
				dctx.copy_stream(source, dest, read_size=read_size, write_size=write_size)

				self.assertEqual(dest.getvalue(), original)


				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_decompressobj_fuzzing(unittest.TestCase):
				@hypothesis.given(original=strategies.sampled_from(random_input_data()),
				level=strategies.integers(min_value=1, max_value=5),
				chunk_sizes=strategies.data())
				def test_random_input_sizes(self, original, level, chunk_sizes):
				cctx = zstd.ZstdCompressor(level=level)
				frame = cctx.compress(original)

				source = io.BytesIO(frame)

				dctx = zstd.ZstdDecompressor()
				dobj = dctx.decompressobj()

				chunks = []
				while True:
				chunk_size = chunk_sizes.draw(strategies.integers(1, 4096))
				chunk = source.read(chunk_size)
				if not chunk:
				break

				chunks.append(dobj.decompress(chunk))

				self.assertEqual(b''.join(chunks), original)

				@hypothesis.given(original=strategies.sampled_from(random_input_data()),
				level=strategies.integers(min_value=1, max_value=5),
				write_size=strategies.integers(min_value=1,
				max_value=4 * zstd.DECOMPRESSION_RECOMMENDED_OUTPUT_SIZE),
				chunk_sizes=strategies.data())
				def test_random_output_sizes(self, original, level, write_size, chunk_sizes):
				cctx = zstd.ZstdCompressor(level=level)
				frame = cctx.compress(original)

				source = io.BytesIO(frame)

				dctx = zstd.ZstdDecompressor()
				dobj = dctx.decompressobj(write_size=write_size)

				chunks = []
				while True:
				chunk_size = chunk_sizes.draw(strategies.integers(1, 4096))
				chunk = source.read(chunk_size)
				if not chunk:
				break

				chunks.append(dobj.decompress(chunk))

				self.assertEqual(b''.join(chunks), original)


				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_read_to_iter_fuzzing(unittest.TestCase):
				@hypothesis.given(original=strategies.sampled_from(random_input_data()),
				level=strategies.integers(min_value=1, max_value=5),
				read_size=strategies.integers(min_value=1, max_value=4096),
				write_size=strategies.integers(min_value=1, max_value=4096))
				def test_read_write_size_variance(self, original, level, read_size, write_size):
				cctx = zstd.ZstdCompressor(level=level)
				frame = cctx.compress(original)

				source = io.BytesIO(frame)

				dctx = zstd.ZstdDecompressor()
				chunks = list(dctx.read_to_iter(source, read_size=read_size, write_size=write_size))

				self.assertEqual(b''.join(chunks), original)


				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				class TestDecompressor_multi_decompress_to_buffer_fuzzing(unittest.TestCase):
				@hypothesis.given(original=strategies.lists(strategies.sampled_from(random_input_data()),
				min_size=1, max_size=1024),
				threads=strategies.integers(min_value=1, max_value=8),
				use_dict=strategies.booleans())
				def test_data_equivalence(self, original, threads, use_dict):
				kwargs = {}
				if use_dict:
				kwargs['dict_data'] = zstd.ZstdCompressionDict(original[0])

				cctx = zstd.ZstdCompressor(level=1,
				write_content_size=True,
				write_checksum=True,
				**kwargs)

				frames_buffer = cctx.multi_compress_to_buffer(original, threads=-1)

				dctx = zstd.ZstdDecompressor(**kwargs)

				result = dctx.multi_decompress_to_buffer(frames_buffer)

				self.assertEqual(len(result), len(original))
				for i, frame in enumerate(result):
				self.assertEqual(frame.tobytes(), original[i])

				frames_list = [f.tobytes() for f in frames_buffer]
				result = dctx.multi_decompress_to_buffer(frames_list)

				self.assertEqual(len(result), len(original))
				for i, frame in enumerate(result):
				self.assertEqual(frame.tobytes(), original[i])