upstream/mercurial-mirror Files · contrib/python-zstandard/tests/test_decompressor_fuzzing.py

copies: move from a copy on branchpoint to a copy on write approach...

copies: move from a copy on branchpoint to a copy on write approach Before this change, any branch point resulted in a copy of the dictionary containing the copy information. This can be very costly for branchy history with little rename information. Instead, we take a "copy on write" approach, copying the input data only when we are about to update it. In practice we were already doing the copying in half of these cases (because `_chain` makes a copy), so we don't add a significant cost here even in the linear case. However, the speedup in the branchy case is very significant. Here are some timings on the pypy repository. revision: large amount; added files: large amount; rename small amount; 9ba6ab77fd29 before: ! wall 1.399863 comb 1.400000 user 1.370000 sys 0.030000 (median of 10) after: ! wall 0.766453 comb 0.770000 user 0.750000 sys 0.020000 (median of 11) revision: large amount; added files: small amount; rename small amount; f650a9b140d2 before: ! wall 1.876748 comb 1.890000 user 1.870000 sys 0.020000 (median of 10) after: ! wall 1.167223 comb 1.170000 user 1.150000 sys 0.020000 (median of 10) revision: large amount; added files: large amount; rename large amount; d9fa043f30c0 before: ! wall 0.242457 comb 0.240000 user 0.240000 sys 0.000000 (median of 39) after: ! wall 0.211476 comb 0.210000 user 0.210000 sys 0.000000 (median of 45) revision: small amount; added files: large amount; rename large amount; a83dc6a2d56f before: ! wall 0.013193 comb 0.020000 user 0.020000 sys 0.000000 (median of 224) after: ! wall 0.013290 comb 0.010000 user 0.010000 sys 0.000000 (median of 222) revision: small amount; added files: large amount; rename small amount; 169138063d63 before: ! wall 0.001673 comb 0.000000 user 0.000000 sys 0.000000 (median of 1000) after: ! wall 0.001677 comb 0.000000 user 0.000000 sys 0.000000 (median of 1000) revision: small amount; added files: small amount; rename small amount; 964879152e2e before: ! 
wall 0.000119 comb 0.000000 user 0.000000 sys 0.000000 (median of 8023) after: ! wall 0.000119 comb 0.000000 user 0.000000 sys 0.000000 (median of 7997) revision: medium amount; added files: large amount; rename medium amount; 2c68e87c3efe before: ! wall 0.201898 comb 0.210000 user 0.200000 sys 0.010000 (median of 48) after: ! wall 0.167415 comb 0.170000 user 0.160000 sys 0.010000 (median of 58) revision: medium amount; added files: medium amount; rename small amount; d7746d32bf9d before: ! wall 0.036820 comb 0.040000 user 0.040000 sys 0.000000 (median of 100) after: ! wall 0.035797 comb 0.040000 user 0.040000 sys 0.000000 (median of 100) The extra cost in the linear case can be reclaimed later with some extra logic. Differential Revision: https://phab.mercurial-scm.org/D7124

Gregory Szorc - - Load All Authors

File last commit:

r42237:675775c3 default


                r43594:ffd04bc9

default

Download file

             test_decompressor_fuzzing.py
        
                    485 lines
            
             | 18.3 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / contrib / python-zstandard / tests / test_decompressor_fuzzing.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      import io

      import os

      import unittest

      try:

          import hypothesis

          import hypothesis.strategies as strategies

      except ImportError:

          raise unittest.SkipTest('hypothesis not available')

      import zstandard as zstd

      from . common import (

          make_cffi,

          NonClosingBytesIO,

          random_input_data,

      )

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
      @make_cffi
      class TestDecompressor_stream_reader_fuzzing(unittest.TestCase):
          """Round-trip fuzzing of ``ZstdDecompressor.stream_reader()``.

          Every test compresses hypothesis-selected input, decompresses it
          through a stream reader using generated read/seek sizes and compares
          the result with the original bytes.  The class is skipped unless
          ``ZSTD_SLOW_TESTS`` is present in the environment.

          NOTE(review): ``make_cffi`` comes from the local ``common`` module;
          what it does to this class is not visible here -- confirm before
          moving code out of the ``test_*`` methods.
          """

          # File-object source; every read() asks for a freshly drawn size.
          @hypothesis.settings(
              suppress_health_check=[hypothesis.HealthCheck.large_base_example])
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              streaming=strategies.booleans(),
              source_read_size=strategies.integers(1, 1048576),
              read_sizes=strategies.data())
          def test_stream_source_read_variance(
                  self, original, level, streaming, source_read_size,
                  read_sizes):
              compressor = zstd.ZstdCompressor(level=level)

              if not streaming:
                  source = io.BytesIO(compressor.compress(original))
              else:
                  source = io.BytesIO()
                  stream = compressor.stream_writer(source)
                  stream.write(original)
                  stream.flush(zstd.FLUSH_FRAME)
                  source.seek(0)

              decompressor = zstd.ZstdDecompressor()
              pieces = []

              with decompressor.stream_reader(
                      source, read_size=source_read_size) as reader:
                  while True:
                      wanted = read_sizes.draw(strategies.integers(-1, 131072))
                      piece = reader.read(wanted)
                      # An empty result ends the loop only when a non-zero
                      # size was requested.
                      if wanted and not piece:
                          break
                      pieces.append(piece)

              self.assertEqual(b''.join(pieces), original)

          # Same round trip as test_stream_source_read_variance, but every
          # read() uses one constant size and the reader is not used as a
          # context manager.
          @hypothesis.settings(
              suppress_health_check=[hypothesis.HealthCheck.large_base_example])
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              streaming=strategies.booleans(),
              source_read_size=strategies.integers(1, 1048576),
              read_size=strategies.integers(-1, 131072))
          def test_stream_source_read_size(
                  self, original, level, streaming, source_read_size,
                  read_size):
              # The loop below can only exit for a non-zero read_size, so a
              # drawn 0 is replaced by 1.
              read_size = read_size or 1

              compressor = zstd.ZstdCompressor(level=level)

              if not streaming:
                  source = io.BytesIO(compressor.compress(original))
              else:
                  source = io.BytesIO()
                  stream = compressor.stream_writer(source)
                  stream.write(original)
                  stream.flush(zstd.FLUSH_FRAME)
                  source.seek(0)

              decompressor = zstd.ZstdDecompressor()
              reader = decompressor.stream_reader(
                  source, read_size=source_read_size)

              pieces = []
              while True:
                  piece = reader.read(read_size)
                  if read_size and not piece:
                      break
                  pieces.append(piece)

              self.assertEqual(b''.join(pieces), original)

          # The compressed frame is handed to stream_reader() as a bytes
          # object instead of a file object; read sizes vary per call.
          @hypothesis.settings(
              suppress_health_check=[hypothesis.HealthCheck.large_base_example])
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              streaming=strategies.booleans(),
              source_read_size=strategies.integers(1, 1048576),
              read_sizes=strategies.data())
          def test_buffer_source_read_variance(
                  self, original, level, streaming, source_read_size,
                  read_sizes):
              compressor = zstd.ZstdCompressor(level=level)

              if not streaming:
                  frame = compressor.compress(original)
              else:
                  sink = io.BytesIO()
                  stream = compressor.stream_writer(sink)
                  stream.write(original)
                  stream.flush(zstd.FLUSH_FRAME)
                  frame = sink.getvalue()

              decompressor = zstd.ZstdDecompressor()
              pieces = []

              with decompressor.stream_reader(
                      frame, read_size=source_read_size) as reader:
                  while True:
                      wanted = read_sizes.draw(strategies.integers(-1, 131072))
                      piece = reader.read(wanted)
                      # An empty result ends the loop only when a non-zero
                      # size was requested.
                      if wanted and not piece:
                          break
                      pieces.append(piece)

              self.assertEqual(b''.join(pieces), original)

          # Same round trip as test_buffer_source_read_variance, but every
          # read() uses one constant size and the reader is not used as a
          # context manager.
          @hypothesis.settings(
              suppress_health_check=[hypothesis.HealthCheck.large_base_example])
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              streaming=strategies.booleans(),
              source_read_size=strategies.integers(1, 1048576),
              read_size=strategies.integers(-1, 131072))
          def test_buffer_source_constant_read_size(
                  self, original, level, streaming, source_read_size,
                  read_size):
              # The loop below can only exit for a non-zero read_size, so a
              # drawn 0 is replaced by -1.
              read_size = read_size or -1

              compressor = zstd.ZstdCompressor(level=level)

              if not streaming:
                  frame = compressor.compress(original)
              else:
                  sink = io.BytesIO()
                  stream = compressor.stream_writer(sink)
                  stream.write(original)
                  stream.flush(zstd.FLUSH_FRAME)
                  frame = sink.getvalue()

              decompressor = zstd.ZstdDecompressor()
              reader = decompressor.stream_reader(
                  frame, read_size=source_read_size)

              pieces = []
              while True:
                  piece = reader.read(read_size)
                  if read_size and not piece:
                      break
                  pieces.append(piece)

              self.assertEqual(b''.join(pieces), original)

          # A single readall() call must return the complete original data.
          @hypothesis.settings(
              suppress_health_check=[hypothesis.HealthCheck.large_base_example])
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              streaming=strategies.booleans(),
              source_read_size=strategies.integers(1, 1048576))
          def test_stream_source_readall(
                  self, original, level, streaming, source_read_size):
              compressor = zstd.ZstdCompressor(level=level)

              if not streaming:
                  source = io.BytesIO(compressor.compress(original))
              else:
                  source = io.BytesIO()
                  stream = compressor.stream_writer(source)
                  stream.write(original)
                  stream.flush(zstd.FLUSH_FRAME)
                  source.seek(0)

              decompressor = zstd.ZstdDecompressor()
              reader = decompressor.stream_reader(
                  source, read_size=source_read_size)

              self.assertEqual(reader.readall(), original)

          # Like test_stream_source_read_variance, but drains the reader
          # through read1() instead of read().
          @hypothesis.settings(
              suppress_health_check=[hypothesis.HealthCheck.large_base_example])
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              streaming=strategies.booleans(),
              source_read_size=strategies.integers(1, 1048576),
              read_sizes=strategies.data())
          def test_stream_source_read1_variance(
                  self, original, level, streaming, source_read_size,
                  read_sizes):
              compressor = zstd.ZstdCompressor(level=level)

              if not streaming:
                  source = io.BytesIO(compressor.compress(original))
              else:
                  source = io.BytesIO()
                  stream = compressor.stream_writer(source)
                  stream.write(original)
                  stream.flush(zstd.FLUSH_FRAME)
                  source.seek(0)

              decompressor = zstd.ZstdDecompressor()
              pieces = []

              with decompressor.stream_reader(
                      source, read_size=source_read_size) as reader:
                  while True:
                      wanted = read_sizes.draw(strategies.integers(-1, 131072))
                      piece = reader.read1(wanted)
                      # An empty result ends the loop only when a non-zero
                      # size was requested.
                      if wanted and not piece:
                          break
                      pieces.append(piece)

              self.assertEqual(b''.join(pieces), original)

          # Drains the reader through readinto1() into bytearrays whose
          # length (at least 1) is drawn anew for every call.
          @hypothesis.settings(
              suppress_health_check=[hypothesis.HealthCheck.large_base_example])
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              streaming=strategies.booleans(),
              source_read_size=strategies.integers(1, 1048576),
              read_sizes=strategies.data())
          def test_stream_source_readinto1_variance(
                  self, original, level, streaming, source_read_size,
                  read_sizes):
              compressor = zstd.ZstdCompressor(level=level)

              if not streaming:
                  source = io.BytesIO(compressor.compress(original))
              else:
                  source = io.BytesIO()
                  stream = compressor.stream_writer(source)
                  stream.write(original)
                  stream.flush(zstd.FLUSH_FRAME)
                  source.seek(0)

              decompressor = zstd.ZstdDecompressor()
              pieces = []

              with decompressor.stream_reader(
                      source, read_size=source_read_size) as reader:
                  while True:
                      capacity = read_sizes.draw(
                          strategies.integers(1, 131072))
                      target = bytearray(capacity)
                      filled = reader.readinto1(target)

                      if not filled:
                          break

                      # Keep only the part of the buffer that was written.
                      pieces.append(bytes(target[:filled]))

              self.assertEqual(b''.join(pieces), original)

          # Alternates forward relative seeks with reads and checks each
          # chunk against the slice of the original at the offset that
          # tell() reported just before the read.
          @hypothesis.settings(
              suppress_health_check=[hypothesis.HealthCheck.large_base_example])
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              source_read_size=strategies.integers(1, 1048576),
              seek_amounts=strategies.data(),
              read_sizes=strategies.data())
          def test_relative_seeks(
                  self, original, level, source_read_size, seek_amounts,
                  read_sizes):
              frame = zstd.ZstdCompressor(level=level).compress(original)
              decompressor = zstd.ZstdDecompressor()

              with decompressor.stream_reader(
                      frame, read_size=source_read_size) as reader:
                  while True:
                      skip = seek_amounts.draw(strategies.integers(0, 16384))
                      reader.seek(skip, os.SEEK_CUR)
                      start = reader.tell()

                      wanted = read_sizes.draw(strategies.integers(1, 16384))
                      piece = reader.read(wanted)

                      if not piece:
                          break

                      stop = start + len(piece)
                      self.assertEqual(original[start:stop], piece)

          # Writes several frames back to back and reads them through one
          # reader created with read_across_frames=True; the output must
          # equal the concatenation of all inputs.
          @hypothesis.settings(
              suppress_health_check=[hypothesis.HealthCheck.large_base_example])
          @hypothesis.given(
              originals=strategies.data(),
              frame_count=strategies.integers(min_value=2, max_value=10),
              level=strategies.integers(min_value=1, max_value=5),
              source_read_size=strategies.integers(1, 1048576),
              read_sizes=strategies.data())
          def test_multiple_frames(
                  self, originals, frame_count, level, source_read_size,
                  read_sizes):
              compressor = zstd.ZstdCompressor(level=level)
              expected = io.BytesIO()
              compressed = io.BytesIO()
              stream = compressor.stream_writer(compressed)

              for _ in range(frame_count):
                  payload = originals.draw(
                      strategies.sampled_from(random_input_data()))
                  expected.write(payload)
                  stream.write(payload)
                  # One FLUSH_FRAME flush per drawn input.
                  stream.flush(zstd.FLUSH_FRAME)

              decompressor = zstd.ZstdDecompressor()
              compressed.seek(0)
              reader = decompressor.stream_reader(
                  compressed, read_size=source_read_size,
                  read_across_frames=True)

              pieces = []
              while True:
                  wanted = read_sizes.draw(strategies.integers(-1, 16384))
                  piece = reader.read(wanted)
                  # An empty result ends the loop only when a non-zero size
                  # was requested.
                  if wanted and not piece:
                      break
                  pieces.append(piece)

              self.assertEqual(expected.getvalue(), b''.join(pieces))

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
      @make_cffi
      class TestDecompressor_stream_writer_fuzzing(unittest.TestCase):
          """Fuzzing of ``ZstdDecompressor.stream_writer()``.

          Skipped unless ``ZSTD_SLOW_TESTS`` is present in the environment.
          """

          # Feeds a compressed frame to the decompressing writer in pieces of
          # drawn size (1..4096) and checks what arrives at the destination.
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              write_size=strategies.integers(min_value=1, max_value=8192),
              input_sizes=strategies.data())
          def test_write_size_variance(
                  self, original, level, write_size, input_sizes):
              frame = zstd.ZstdCompressor(level=level).compress(original)
              decompressor = zstd.ZstdDecompressor()

              compressed = io.BytesIO(frame)
              # NonClosingBytesIO comes from the local ``common`` module; its
              # value is read after the ``with`` block has exited.
              sink = NonClosingBytesIO()

              with decompressor.stream_writer(
                      sink, write_size=write_size) as writer:
                  while True:
                      size = input_sizes.draw(strategies.integers(1, 4096))
                      piece = compressed.read(size)
                      if not piece:
                          break
                      writer.write(piece)

              self.assertEqual(sink.getvalue(), original)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
      @make_cffi
      class TestDecompressor_copy_stream_fuzzing(unittest.TestCase):
          """Fuzzing of ``ZstdDecompressor.copy_stream()``.

          Skipped unless ``ZSTD_SLOW_TESTS`` is present in the environment.
          """

          # copy_stream() must reproduce the original data for any drawn
          # combination of read_size and write_size (each 1..8192).
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              read_size=strategies.integers(min_value=1, max_value=8192),
              write_size=strategies.integers(min_value=1, max_value=8192))
          def test_read_write_size_variance(
                  self, original, level, read_size, write_size):
              compressed = io.BytesIO(
                  zstd.ZstdCompressor(level=level).compress(original))
              output = io.BytesIO()

              decompressor = zstd.ZstdDecompressor()
              decompressor.copy_stream(
                  compressed, output,
                  read_size=read_size, write_size=write_size)

              self.assertEqual(output.getvalue(), original)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
      @make_cffi
      class TestDecompressor_decompressobj_fuzzing(unittest.TestCase):
          """Fuzzing of ``ZstdDecompressor.decompressobj()``.

          Skipped unless ``ZSTD_SLOW_TESTS`` is present in the environment.
          """

          # Feeds the compressed frame to decompress() in pieces of drawn
          # size (1..4096) and joins the returned outputs.
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              chunk_sizes=strategies.data())
          def test_random_input_sizes(self, original, level, chunk_sizes):
              compressed = io.BytesIO(
                  zstd.ZstdCompressor(level=level).compress(original))
              decompressobj = zstd.ZstdDecompressor().decompressobj()

              outputs = []
              while True:
                  size = chunk_sizes.draw(strategies.integers(1, 4096))
                  piece = compressed.read(size)
                  if not piece:
                      break
                  outputs.append(decompressobj.decompress(piece))

              self.assertEqual(b''.join(outputs), original)

          # Same as test_random_input_sizes, with the decompressobj created
          # using a drawn write_size of up to four times
          # DECOMPRESSION_RECOMMENDED_OUTPUT_SIZE.
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              write_size=strategies.integers(
                  min_value=1,
                  max_value=4 * zstd.DECOMPRESSION_RECOMMENDED_OUTPUT_SIZE),
              chunk_sizes=strategies.data())
          def test_random_output_sizes(
                  self, original, level, write_size, chunk_sizes):
              compressed = io.BytesIO(
                  zstd.ZstdCompressor(level=level).compress(original))
              decompressobj = zstd.ZstdDecompressor().decompressobj(
                  write_size=write_size)

              outputs = []
              while True:
                  size = chunk_sizes.draw(strategies.integers(1, 4096))
                  piece = compressed.read(size)
                  if not piece:
                      break
                  outputs.append(decompressobj.decompress(piece))

              self.assertEqual(b''.join(outputs), original)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
      @make_cffi
      class TestDecompressor_read_to_iter_fuzzing(unittest.TestCase):
          """Fuzzing of ``ZstdDecompressor.read_to_iter()``.

          Skipped unless ``ZSTD_SLOW_TESTS`` is present in the environment.
          """

          # The chunks yielded by read_to_iter() must join back into the
          # original data for any drawn read_size/write_size (each 1..4096).
          @hypothesis.given(
              original=strategies.sampled_from(random_input_data()),
              level=strategies.integers(min_value=1, max_value=5),
              read_size=strategies.integers(min_value=1, max_value=4096),
              write_size=strategies.integers(min_value=1, max_value=4096))
          def test_read_write_size_variance(
                  self, original, level, read_size, write_size):
              compressed = io.BytesIO(
                  zstd.ZstdCompressor(level=level).compress(original))
              decompressor = zstd.ZstdDecompressor()

              pieces = decompressor.read_to_iter(
                  compressed, read_size=read_size, write_size=write_size)

              self.assertEqual(b''.join(pieces), original)

      @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
      class TestDecompressor_multi_decompress_to_buffer_fuzzing(unittest.TestCase):
          """Fuzzing of ``ZstdDecompressor.multi_decompress_to_buffer()``.

          Skipped unless ``ZSTD_SLOW_TESTS`` is present in the environment.
          """

          # Compresses a drawn list of inputs with multi_compress_to_buffer()
          # and checks that multi_decompress_to_buffer() returns them in
          # order, both when given the compressor's buffer collection and
          # when given a plain list of frame bytes.
          #
          # original: list of 1..1024 inputs; the first one doubles as the
          #           compression dictionary when use_dict is true.
          # threads:  thread count (1..8) handed to the decompressor.
          # use_dict: whether compressor and decompressor share a dictionary.
          @hypothesis.given(
              original=strategies.lists(
                  strategies.sampled_from(random_input_data()),
                  min_size=1, max_size=1024),
              threads=strategies.integers(min_value=1, max_value=8),
              use_dict=strategies.booleans())
          def test_data_equivalence(self, original, threads, use_dict):
              kwargs = {}
              if use_dict:
                  kwargs['dict_data'] = zstd.ZstdCompressionDict(original[0])

              cctx = zstd.ZstdCompressor(level=1,
                                         write_content_size=True,
                                         write_checksum=True,
                                         **kwargs)

              # Not every backend object exposes the multi-buffer API.
              if not hasattr(cctx, 'multi_compress_to_buffer'):
                  self.skipTest('multi_compress_to_buffer not available')

              frames_buffer = cctx.multi_compress_to_buffer(original, threads=-1)

              dctx = zstd.ZstdDecompressor(**kwargs)

              # The drawn ``threads`` value used to be ignored, so the thread
              # count of the decompressor was never varied.  It is now passed
              # to both decompression calls.
              result = dctx.multi_decompress_to_buffer(frames_buffer,
                                                       threads=threads)

              self.assertEqual(len(result), len(original))
              for frame, expected in zip(result, original):
                  self.assertEqual(frame.tobytes(), expected)

              # Repeat with the frames supplied as a plain list of bytes.
              frames_list = [f.tobytes() for f in frames_buffer]
              result = dctx.multi_decompress_to_buffer(frames_list,
                                                       threads=threads)

              self.assertEqual(len(result), len(original))
              for frame, expected in zip(result, original):
                  self.assertEqual(frame.tobytes(), expected)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				import io
				import os
				import unittest

				try:
				import hypothesis
				import hypothesis.strategies as strategies
				except ImportError:
				raise unittest.SkipTest('hypothesis not available')

				import zstandard as zstd

				from . common import (
				make_cffi,
				NonClosingBytesIO,
				random_input_data,
				)


				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_stream_reader_fuzzing(unittest.TestCase):
				# File-object source; every read() asks for a freshly drawn size.
				@hypothesis.settings(
				    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(
				    original=strategies.sampled_from(random_input_data()),
				    level=strategies.integers(min_value=1, max_value=5),
				    streaming=strategies.booleans(),
				    source_read_size=strategies.integers(1, 1048576),
				    read_sizes=strategies.data())
				def test_stream_source_read_variance(
				        self, original, level, streaming, source_read_size,
				        read_sizes):
				    compressor = zstd.ZstdCompressor(level=level)

				    if not streaming:
				        source = io.BytesIO(compressor.compress(original))
				    else:
				        source = io.BytesIO()
				        stream = compressor.stream_writer(source)
				        stream.write(original)
				        stream.flush(zstd.FLUSH_FRAME)
				        source.seek(0)

				    decompressor = zstd.ZstdDecompressor()
				    pieces = []

				    with decompressor.stream_reader(
				            source, read_size=source_read_size) as reader:
				        while True:
				            wanted = read_sizes.draw(strategies.integers(-1, 131072))
				            piece = reader.read(wanted)
				            # An empty result ends the loop only when a non-zero
				            # size was requested.
				            if wanted and not piece:
				                break
				            pieces.append(piece)

				    self.assertEqual(b''.join(pieces), original)

				# Same round trip as test_stream_source_read_variance, but every
				# read() uses one constant size and the reader is not used as a
				# context manager.
				@hypothesis.settings(
				    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(
				    original=strategies.sampled_from(random_input_data()),
				    level=strategies.integers(min_value=1, max_value=5),
				    streaming=strategies.booleans(),
				    source_read_size=strategies.integers(1, 1048576),
				    read_size=strategies.integers(-1, 131072))
				def test_stream_source_read_size(
				        self, original, level, streaming, source_read_size,
				        read_size):
				    # The loop below can only exit for a non-zero read_size, so a
				    # drawn 0 is replaced by 1.
				    read_size = read_size or 1

				    compressor = zstd.ZstdCompressor(level=level)

				    if not streaming:
				        source = io.BytesIO(compressor.compress(original))
				    else:
				        source = io.BytesIO()
				        stream = compressor.stream_writer(source)
				        stream.write(original)
				        stream.flush(zstd.FLUSH_FRAME)
				        source.seek(0)

				    decompressor = zstd.ZstdDecompressor()
				    reader = decompressor.stream_reader(
				        source, read_size=source_read_size)

				    pieces = []
				    while True:
				        piece = reader.read(read_size)
				        if read_size and not piece:
				            break
				        pieces.append(piece)

				    self.assertEqual(b''.join(pieces), original)

				# The compressed frame is handed to stream_reader() as a bytes
				# object instead of a file object; read sizes vary per call.
				@hypothesis.settings(
				    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(
				    original=strategies.sampled_from(random_input_data()),
				    level=strategies.integers(min_value=1, max_value=5),
				    streaming=strategies.booleans(),
				    source_read_size=strategies.integers(1, 1048576),
				    read_sizes=strategies.data())
				def test_buffer_source_read_variance(
				        self, original, level, streaming, source_read_size,
				        read_sizes):
				    compressor = zstd.ZstdCompressor(level=level)

				    if not streaming:
				        frame = compressor.compress(original)
				    else:
				        sink = io.BytesIO()
				        stream = compressor.stream_writer(sink)
				        stream.write(original)
				        stream.flush(zstd.FLUSH_FRAME)
				        frame = sink.getvalue()

				    decompressor = zstd.ZstdDecompressor()
				    pieces = []

				    with decompressor.stream_reader(
				            frame, read_size=source_read_size) as reader:
				        while True:
				            wanted = read_sizes.draw(strategies.integers(-1, 131072))
				            piece = reader.read(wanted)
				            # An empty result ends the loop only when a non-zero
				            # size was requested.
				            if wanted and not piece:
				                break
				            pieces.append(piece)

				    self.assertEqual(b''.join(pieces), original)

				# Same round trip as test_buffer_source_read_variance, but every
				# read() uses one constant size and the reader is not used as a
				# context manager.
				@hypothesis.settings(
				    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(
				    original=strategies.sampled_from(random_input_data()),
				    level=strategies.integers(min_value=1, max_value=5),
				    streaming=strategies.booleans(),
				    source_read_size=strategies.integers(1, 1048576),
				    read_size=strategies.integers(-1, 131072))
				def test_buffer_source_constant_read_size(
				        self, original, level, streaming, source_read_size,
				        read_size):
				    # The loop below can only exit for a non-zero read_size, so a
				    # drawn 0 is replaced by -1.
				    read_size = read_size or -1

				    compressor = zstd.ZstdCompressor(level=level)

				    if not streaming:
				        frame = compressor.compress(original)
				    else:
				        sink = io.BytesIO()
				        stream = compressor.stream_writer(sink)
				        stream.write(original)
				        stream.flush(zstd.FLUSH_FRAME)
				        frame = sink.getvalue()

				    decompressor = zstd.ZstdDecompressor()
				    reader = decompressor.stream_reader(
				        frame, read_size=source_read_size)

				    pieces = []
				    while True:
				        piece = reader.read(read_size)
				        if read_size and not piece:
				            break
				        pieces.append(piece)

				    self.assertEqual(b''.join(pieces), original)

				# A single readall() call must return the complete original data.
				@hypothesis.settings(
				    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(
				    original=strategies.sampled_from(random_input_data()),
				    level=strategies.integers(min_value=1, max_value=5),
				    streaming=strategies.booleans(),
				    source_read_size=strategies.integers(1, 1048576))
				def test_stream_source_readall(
				        self, original, level, streaming, source_read_size):
				    compressor = zstd.ZstdCompressor(level=level)

				    if not streaming:
				        source = io.BytesIO(compressor.compress(original))
				    else:
				        source = io.BytesIO()
				        stream = compressor.stream_writer(source)
				        stream.write(original)
				        stream.flush(zstd.FLUSH_FRAME)
				        source.seek(0)

				    decompressor = zstd.ZstdDecompressor()
				    reader = decompressor.stream_reader(
				        source, read_size=source_read_size)

				    self.assertEqual(reader.readall(), original)

				# Like test_stream_source_read_variance, but drains the reader
				# through read1() instead of read().
				@hypothesis.settings(
				    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(
				    original=strategies.sampled_from(random_input_data()),
				    level=strategies.integers(min_value=1, max_value=5),
				    streaming=strategies.booleans(),
				    source_read_size=strategies.integers(1, 1048576),
				    read_sizes=strategies.data())
				def test_stream_source_read1_variance(
				        self, original, level, streaming, source_read_size,
				        read_sizes):
				    compressor = zstd.ZstdCompressor(level=level)

				    if not streaming:
				        source = io.BytesIO(compressor.compress(original))
				    else:
				        source = io.BytesIO()
				        stream = compressor.stream_writer(source)
				        stream.write(original)
				        stream.flush(zstd.FLUSH_FRAME)
				        source.seek(0)

				    decompressor = zstd.ZstdDecompressor()
				    pieces = []

				    with decompressor.stream_reader(
				            source, read_size=source_read_size) as reader:
				        while True:
				            wanted = read_sizes.draw(strategies.integers(-1, 131072))
				            piece = reader.read1(wanted)
				            # An empty result ends the loop only when a non-zero
				            # size was requested.
				            if wanted and not piece:
				                break
				            pieces.append(piece)

				    self.assertEqual(b''.join(pieces), original)

				@hypothesis.settings(
				    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(original=strategies.sampled_from(random_input_data()),
				                  level=strategies.integers(min_value=1, max_value=5),
				                  streaming=strategies.booleans(),
				                  source_read_size=strategies.integers(1, 1048576),
				                  read_sizes=strategies.data())
				def test_stream_source_readinto1_variance(self, original, level, streaming,
				                                          source_read_size, read_sizes):
				    # Decompress with repeated readinto1() calls into freshly sized
				    # buffers (sizes drawn from 1..131072) and check the collected
				    # bytes equal ``original``.
				    compressor = zstd.ZstdCompressor(level=level)

				    if not streaming:
				        source = io.BytesIO(compressor.compress(original))
				    else:
				        source = io.BytesIO()
				        stream = compressor.stream_writer(source)
				        stream.write(original)
				        stream.flush(zstd.FLUSH_FRAME)
				        source.seek(0)

				    decompressor = zstd.ZstdDecompressor()
				    size_strategy = strategies.integers(1, 131072)

				    collected = bytearray()
				    with decompressor.stream_reader(
				            source, read_size=source_read_size) as reader:
				        while True:
				            scratch = bytearray(read_sizes.draw(size_strategy))
				            filled = reader.readinto1(scratch)

				            # A zero count is treated as end of stream.
				            if not filled:
				                break

				            # Keep only the portion of the buffer that was written.
				            collected += scratch[:filled]

				    self.assertEqual(bytes(collected), original)

				@hypothesis.settings(
				    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(
				    original=strategies.sampled_from(random_input_data()),
				    level=strategies.integers(min_value=1, max_value=5),
				    source_read_size=strategies.integers(1, 1048576),
				    seek_amounts=strategies.data(),
				    read_sizes=strategies.data())
				def test_relative_seeks(self, original, level, source_read_size, seek_amounts,
				                        read_sizes):
				    # Alternate relative forward seeks (0..16384) and reads (1..16384)
				    # on a stream reader, checking each chunk read against the slice
				    # of ``original`` at the offset reported by tell().
				    frame = zstd.ZstdCompressor(level=level).compress(original)
				    decompressor = zstd.ZstdDecompressor()

				    seek_strategy = strategies.integers(0, 16384)
				    read_strategy = strategies.integers(1, 16384)

				    with decompressor.stream_reader(
				            frame, read_size=source_read_size) as reader:
				        while True:
				            reader.seek(seek_amounts.draw(seek_strategy), os.SEEK_CUR)

				            # Capture the position before reading so the expected
				            # slice can be taken from the uncompressed input.
				            start = reader.tell()
				            piece = reader.read(read_sizes.draw(read_strategy))

				            if not piece:
				                break

				            expected = original[start:start + len(piece)]
				            self.assertEqual(expected, piece)

				@hypothesis.settings(
				    suppress_health_check=[hypothesis.HealthCheck.large_base_example])
				@hypothesis.given(
				    originals=strategies.data(),
				    frame_count=strategies.integers(min_value=2, max_value=10),
				    level=strategies.integers(min_value=1, max_value=5),
				    source_read_size=strategies.integers(1, 1048576),
				    read_sizes=strategies.data())
				def test_multiple_frames(self, originals, frame_count, level,
				                         source_read_size, read_sizes):
				    # Write ``frame_count`` inputs through one stream writer, flushing
				    # with FLUSH_FRAME after each, then read everything back through
				    # a stream reader created with read_across_frames=True and compare
				    # against the concatenated uncompressed inputs.
				    compressor = zstd.ZstdCompressor(level=level)
				    expected = io.BytesIO()
				    compressed = io.BytesIO()
				    writer = compressor.stream_writer(compressed)

				    for _ in range(frame_count):
				        payload = originals.draw(
				            strategies.sampled_from(random_input_data()))
				        expected.write(payload)
				        writer.write(payload)
				        writer.flush(zstd.FLUSH_FRAME)

				    decompressor = zstd.ZstdDecompressor()
				    compressed.seek(0)
				    reader = decompressor.stream_reader(compressed,
				                                        read_size=source_read_size,
				                                        read_across_frames=True)

				    pieces = []
				    while True:
				        requested = read_sizes.draw(strategies.integers(-1, 16384))
				        piece = reader.read(requested)

				        # Stop on an empty result unless the request itself was for
				        # zero bytes.
				        if requested and not piece:
				            break

				        pieces.append(piece)

				    self.assertEqual(expected.getvalue(), b''.join(pieces))


				# Fuzz test for ZstdDecompressor.stream_writer(); skipped unless the
				# ZSTD_SLOW_TESTS environment variable is set.
				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_stream_writer_fuzzing(unittest.TestCase):
				    @hypothesis.given(original=strategies.sampled_from(random_input_data()),
				                      level=strategies.integers(min_value=1, max_value=5),
				                      write_size=strategies.integers(min_value=1, max_value=8192),
				                      input_sizes=strategies.data())
				    def test_write_size_variance(self, original, level, write_size, input_sizes):
				        # Feed a compressed frame to a decompressing stream writer in
				        # pieces of drawn size (1..4096) and check that the destination
				        # ends up holding ``original``.
				        frame = zstd.ZstdCompressor(level=level).compress(original)

				        decompressor = zstd.ZstdDecompressor()
				        compressed = io.BytesIO(frame)
				        sink = NonClosingBytesIO()
				        size_strategy = strategies.integers(1, 4096)

				        with decompressor.stream_writer(sink, write_size=write_size) as writer:
				            while True:
				                piece = compressed.read(input_sizes.draw(size_strategy))
				                if not piece:
				                    break

				                writer.write(piece)

				        self.assertEqual(sink.getvalue(), original)


				# Fuzz test for ZstdDecompressor.copy_stream(); skipped unless the
				# ZSTD_SLOW_TESTS environment variable is set.
				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_copy_stream_fuzzing(unittest.TestCase):
				    @hypothesis.given(original=strategies.sampled_from(random_input_data()),
				                      level=strategies.integers(min_value=1, max_value=5),
				                      read_size=strategies.integers(min_value=1, max_value=8192),
				                      write_size=strategies.integers(min_value=1, max_value=8192))
				    def test_read_write_size_variance(self, original, level, read_size, write_size):
				        # Decompress a frame from one BytesIO into another with
				        # copy_stream() under varying read/write sizes and verify the
				        # output matches ``original``.
				        frame = zstd.ZstdCompressor(level=level).compress(original)

				        compressed = io.BytesIO(frame)
				        output = io.BytesIO()

				        decompressor = zstd.ZstdDecompressor()
				        decompressor.copy_stream(compressed, output,
				                                 read_size=read_size,
				                                 write_size=write_size)

				        self.assertEqual(output.getvalue(), original)


				# Fuzz tests for ZstdDecompressor.decompressobj(); skipped unless the
				# ZSTD_SLOW_TESTS environment variable is set.
				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_decompressobj_fuzzing(unittest.TestCase):
				    @hypothesis.given(original=strategies.sampled_from(random_input_data()),
				                      level=strategies.integers(min_value=1, max_value=5),
				                      chunk_sizes=strategies.data())
				    def test_random_input_sizes(self, original, level, chunk_sizes):
				        # Feed a compressed frame to a decompression object in pieces
				        # of drawn size (1..4096) and check the joined output equals
				        # ``original``.
				        frame = zstd.ZstdCompressor(level=level).compress(original)
				        compressed = io.BytesIO(frame)

				        dobj = zstd.ZstdDecompressor().decompressobj()
				        size_strategy = strategies.integers(1, 4096)

				        def next_piece():
				            return compressed.read(chunk_sizes.draw(size_strategy))

				        # iter() with a sentinel stops at the first empty read.
				        pieces = [dobj.decompress(piece)
				                  for piece in iter(next_piece, b'')]

				        self.assertEqual(b''.join(pieces), original)

				    @hypothesis.given(original=strategies.sampled_from(random_input_data()),
				                      level=strategies.integers(min_value=1, max_value=5),
				                      write_size=strategies.integers(min_value=1,
				                                                     max_value=4 * zstd.DECOMPRESSION_RECOMMENDED_OUTPUT_SIZE),
				                      chunk_sizes=strategies.data())
				    def test_random_output_sizes(self, original, level, write_size, chunk_sizes):
				        # Same as test_random_input_sizes, but the decompression object
				        # is created with a drawn ``write_size``.
				        frame = zstd.ZstdCompressor(level=level).compress(original)
				        compressed = io.BytesIO(frame)

				        dobj = zstd.ZstdDecompressor().decompressobj(write_size=write_size)
				        size_strategy = strategies.integers(1, 4096)

				        def next_piece():
				            return compressed.read(chunk_sizes.draw(size_strategy))

				        # iter() with a sentinel stops at the first empty read.
				        pieces = [dobj.decompress(piece)
				                  for piece in iter(next_piece, b'')]

				        self.assertEqual(b''.join(pieces), original)


				# Fuzz test for ZstdDecompressor.read_to_iter(); skipped unless the
				# ZSTD_SLOW_TESTS environment variable is set.
				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				@make_cffi
				class TestDecompressor_read_to_iter_fuzzing(unittest.TestCase):
				    @hypothesis.given(original=strategies.sampled_from(random_input_data()),
				                      level=strategies.integers(min_value=1, max_value=5),
				                      read_size=strategies.integers(min_value=1, max_value=4096),
				                      write_size=strategies.integers(min_value=1, max_value=4096))
				    def test_read_write_size_variance(self, original, level, read_size, write_size):
				        # Iterate decompressed chunks from read_to_iter() under varying
				        # read/write sizes and check they join back into ``original``.
				        frame = zstd.ZstdCompressor(level=level).compress(original)
				        compressed = io.BytesIO(frame)

				        decompressor = zstd.ZstdDecompressor()
				        pieces = decompressor.read_to_iter(compressed,
				                                           read_size=read_size,
				                                           write_size=write_size)

				        # join() drains the iterator, so no intermediate list is needed.
				        self.assertEqual(b''.join(pieces), original)


				# Fuzz test for ZstdDecompressor.multi_decompress_to_buffer(); skipped
				# unless the ZSTD_SLOW_TESTS environment variable is set.
				@unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set')
				class TestDecompressor_multi_decompress_to_buffer_fuzzing(unittest.TestCase):
				    @hypothesis.given(original=strategies.lists(strategies.sampled_from(random_input_data()),
				                                                min_size=1, max_size=1024),
				                      threads=strategies.integers(min_value=1, max_value=8),
				                      use_dict=strategies.booleans())
				    def test_data_equivalence(self, original, threads, use_dict):
				        # Compress a list of inputs with multi_compress_to_buffer(), then
				        # decompress them with multi_decompress_to_buffer() using the
				        # drawn ``threads`` count, and check every output equals its
				        # input. The decompression is exercised twice: once with the
				        # buffer collection returned by the compressor and once with a
				        # plain list of bytes.
				        kwargs = {}
				        if use_dict:
				            # The first input doubles as the dictionary content, shared
				            # by the compressor and the decompressor.
				            kwargs['dict_data'] = zstd.ZstdCompressionDict(original[0])

				        cctx = zstd.ZstdCompressor(level=1,
				                                   write_content_size=True,
				                                   write_checksum=True,
				                                   **kwargs)

				        if not hasattr(cctx, 'multi_compress_to_buffer'):
				            self.skipTest('multi_compress_to_buffer not available')

				        frames_buffer = cctx.multi_compress_to_buffer(original, threads=-1)

				        dctx = zstd.ZstdDecompressor(**kwargs)
				        frames_list = [f.tobytes() for f in frames_buffer]

				        for frames in (frames_buffer, frames_list):
				            # Pass the fuzzed thread count through; previously it was
				            # drawn but never used, so only the default was exercised.
				            result = dctx.multi_decompress_to_buffer(frames,
				                                                     threads=threads)

				            self.assertEqual(len(result), len(original))
				            for frame, expected in zip(result, original):
				                self.assertEqual(frame.tobytes(), expected)