upstream/mercurial-mirror Files · contrib/python-zstandard/tests/test_compressor_fuzzing.py

gitweb: render changesets server-side on /graph page

Gregory Szorc - - Load All Authors

File last commit:

r31796:e0dc4053 default


                r35220:dc623009

default

Download file

             test_compressor_fuzzing.py
        
                    143 lines
            
             | 5.5 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / contrib / python-zstandard / tests / test_compressor_fuzzing.py
          
                    History
                
                 |
                  Source
                 | Raw
                 |Copy content
                 |Copy permalink

        Gregory Szorc
    
zstd: vendor python-zstandard 0.8.0...

              r31796
            
      import io

      import os

      try:

          import unittest2 as unittest

      except ImportError:

          import unittest

      try:

          import hypothesis

          import hypothesis.strategies as strategies

      except ImportError:

          raise unittest.SkipTest('hypothesis not available')

      import zstd

      from . common import (

          make_cffi,

          random_input_data,

      )

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      @make_cffi

      class TestCompressor_write_to_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                              level=strategies.integers(min_value=1, max_value=5),

                              write_size=strategies.integers(min_value=1, max_value=1048576))

          def test_write_size_variance(self, original, level, write_size):

              refctx = zstd.ZstdCompressor(level=level)

              ref_frame = refctx.compress(original)

              cctx = zstd.ZstdCompressor(level=level)

              b = io.BytesIO()

              with cctx.write_to(b, size=len(original), write_size=write_size) as compressor:

                  compressor.write(original)

              self.assertEqual(b.getvalue(), ref_frame)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      @make_cffi

      class TestCompressor_copy_stream_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            read_size=strategies.integers(min_value=1, max_value=1048576),

                            write_size=strategies.integers(min_value=1, max_value=1048576))

          def test_read_write_size_variance(self, original, level, read_size, write_size):

              refctx = zstd.ZstdCompressor(level=level)

              ref_frame = refctx.compress(original)

              cctx = zstd.ZstdCompressor(level=level)

              source = io.BytesIO(original)

              dest = io.BytesIO()

              cctx.copy_stream(source, dest, size=len(original), read_size=read_size,

                               write_size=write_size)

              self.assertEqual(dest.getvalue(), ref_frame)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      @make_cffi

      class TestCompressor_compressobj_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            chunk_sizes=strategies.streaming(

                                strategies.integers(min_value=1, max_value=4096)))

          def test_random_input_sizes(self, original, level, chunk_sizes):

              chunk_sizes = iter(chunk_sizes)

              refctx = zstd.ZstdCompressor(level=level)

              ref_frame = refctx.compress(original)

              cctx = zstd.ZstdCompressor(level=level)

              cobj = cctx.compressobj(size=len(original))

              chunks = []

              i = 0

              while True:

                  chunk_size = next(chunk_sizes)

                  source = original[i:i + chunk_size]

                  if not source:

                      break

                  chunks.append(cobj.compress(source))

                  i += chunk_size

              chunks.append(cobj.flush())

              self.assertEqual(b''.join(chunks), ref_frame)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      @make_cffi

      class TestCompressor_read_from_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.sampled_from(random_input_data()),

                            level=strategies.integers(min_value=1, max_value=5),

                            read_size=strategies.integers(min_value=1, max_value=4096),

                            write_size=strategies.integers(min_value=1, max_value=4096))

          def test_read_write_size_variance(self, original, level, read_size, write_size):

              refcctx = zstd.ZstdCompressor(level=level)

              ref_frame = refcctx.compress(original)

              source = io.BytesIO(original)

              cctx = zstd.ZstdCompressor(level=level)

              chunks = list(cctx.read_from(source, size=len(original), read_size=read_size,

                                           write_size=write_size))

              self.assertEqual(b''.join(chunks), ref_frame)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')

      class TestCompressor_multi_compress_to_buffer_fuzzing(unittest.TestCase):

          @hypothesis.given(original=strategies.lists(strategies.sampled_from(random_input_data()),

                                                      min_size=1, max_size=1024),

                              threads=strategies.integers(min_value=1, max_value=8),

                              use_dict=strategies.booleans())

          def test_data_equivalence(self, original, threads, use_dict):

              kwargs = {}

              # Use a content dictionary because it is cheap to create.

              if use_dict:

                  kwargs['dict_data'] = zstd.ZstdCompressionDict(original[0])

              cctx = zstd.ZstdCompressor(level=1,

                                         write_content_size=True,

                                         write_checksum=True,

                                         **kwargs)

              result = cctx.multi_compress_to_buffer(original, threads=-1)

              self.assertEqual(len(result), len(original))

              # The frame produced via the batch APIs may not be bit identical to that

              # produced by compress() because compression parameters are adjusted

              # from the first input in batch mode. So the only thing we can do is

              # verify the decompressed data matches the input.

              dctx = zstd.ZstdDecompressor(**kwargs)

              for i, frame in enumerate(result):

                  self.assertEqual(dctx.decompress(frame), original[i])

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

Gregory Szorc zstd: vendor python-zstandard 0.8.0...	r31796	import io
		import os

		try:
		import unittest2 as unittest
		except ImportError:
		import unittest

		try:
		import hypothesis
		import hypothesis.strategies as strategies
		except ImportError:
		raise unittest.SkipTest('hypothesis not available')

		import zstd

		from . common import (
		make_cffi,
		random_input_data,
		)


		@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
		@make_cffi
		class TestCompressor_write_to_fuzzing(unittest.TestCase):
		@hypothesis.given(original=strategies.sampled_from(random_input_data()),
		level=strategies.integers(min_value=1, max_value=5),
		write_size=strategies.integers(min_value=1, max_value=1048576))
		def test_write_size_variance(self, original, level, write_size):
		refctx = zstd.ZstdCompressor(level=level)
		ref_frame = refctx.compress(original)

		cctx = zstd.ZstdCompressor(level=level)
		b = io.BytesIO()
		with cctx.write_to(b, size=len(original), write_size=write_size) as compressor:
		compressor.write(original)

		self.assertEqual(b.getvalue(), ref_frame)


		@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
		@make_cffi
		class TestCompressor_copy_stream_fuzzing(unittest.TestCase):
		@hypothesis.given(original=strategies.sampled_from(random_input_data()),
		level=strategies.integers(min_value=1, max_value=5),
		read_size=strategies.integers(min_value=1, max_value=1048576),
		write_size=strategies.integers(min_value=1, max_value=1048576))
		def test_read_write_size_variance(self, original, level, read_size, write_size):
		refctx = zstd.ZstdCompressor(level=level)
		ref_frame = refctx.compress(original)

		cctx = zstd.ZstdCompressor(level=level)
		source = io.BytesIO(original)
		dest = io.BytesIO()

		cctx.copy_stream(source, dest, size=len(original), read_size=read_size,
		write_size=write_size)

		self.assertEqual(dest.getvalue(), ref_frame)


		@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
		@make_cffi
		class TestCompressor_compressobj_fuzzing(unittest.TestCase):
		@hypothesis.given(original=strategies.sampled_from(random_input_data()),
		level=strategies.integers(min_value=1, max_value=5),
		chunk_sizes=strategies.streaming(
		strategies.integers(min_value=1, max_value=4096)))
		def test_random_input_sizes(self, original, level, chunk_sizes):
		chunk_sizes = iter(chunk_sizes)

		refctx = zstd.ZstdCompressor(level=level)
		ref_frame = refctx.compress(original)

		cctx = zstd.ZstdCompressor(level=level)
		cobj = cctx.compressobj(size=len(original))

		chunks = []
		i = 0
		while True:
		chunk_size = next(chunk_sizes)
		source = original[i:i + chunk_size]
		if not source:
		break

		chunks.append(cobj.compress(source))
		i += chunk_size

		chunks.append(cobj.flush())

		self.assertEqual(b''.join(chunks), ref_frame)


		@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
		@make_cffi
		class TestCompressor_read_from_fuzzing(unittest.TestCase):
		@hypothesis.given(original=strategies.sampled_from(random_input_data()),
		level=strategies.integers(min_value=1, max_value=5),
		read_size=strategies.integers(min_value=1, max_value=4096),
		write_size=strategies.integers(min_value=1, max_value=4096))
		def test_read_write_size_variance(self, original, level, read_size, write_size):
		refcctx = zstd.ZstdCompressor(level=level)
		ref_frame = refcctx.compress(original)

		source = io.BytesIO(original)

		cctx = zstd.ZstdCompressor(level=level)
		chunks = list(cctx.read_from(source, size=len(original), read_size=read_size,
		write_size=write_size))

		self.assertEqual(b''.join(chunks), ref_frame)


		@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
		class TestCompressor_multi_compress_to_buffer_fuzzing(unittest.TestCase):
		@hypothesis.given(original=strategies.lists(strategies.sampled_from(random_input_data()),
		min_size=1, max_size=1024),
		threads=strategies.integers(min_value=1, max_value=8),
		use_dict=strategies.booleans())
		def test_data_equivalence(self, original, threads, use_dict):
		kwargs = {}

		# Use a content dictionary because it is cheap to create.
		if use_dict:
		kwargs['dict_data'] = zstd.ZstdCompressionDict(original[0])

		cctx = zstd.ZstdCompressor(level=1,
		write_content_size=True,
		write_checksum=True,
		**kwargs)

		result = cctx.multi_compress_to_buffer(original, threads=-1)

		self.assertEqual(len(result), len(original))

		# The frame produced via the batch APIs may not be bit identical to that
		# produced by compress() because compression parameters are adjusted
		# from the first input in batch mode. So the only thing we can do is
		# verify the decompressed data matches the input.
		dctx = zstd.ZstdDecompressor(**kwargs)

		for i, frame in enumerate(result):
		self.assertEqual(dctx.decompress(frame), original[i])