upstream/ipython Commit - r24973:7044ff68

Add normalize parameter to Audio.

Matan Gover -

r24973:7044ff68

parent child

IPython/lib/display.py

0 +27 -10

                  autoplay : bool
                      Set to True if the audio should immediately start playing.
                      Default is `False`.
+                 normalize : bool
+                     Whether audio should be normalized (rescaled) to the maximum possible
+                     range. Default is `True`. When set to `False`, `data` must be between
+                     -1 and 1 (inclusive), otherwise an error is raised.
+                     Applies only when `data` is a list or array of samples; other types of
+                     audio are never normalized.
                  Examples
                  --------
                  """
                  _read_flags = 'rb'
-                 def __init__(self, data=None, filename=None, url=None, embed=None, rate=None, autoplay=False):
+                 def __init__(self, data=None, filename=None, url=None, embed=None, rate=None, autoplay=False, normalize=True):
                      if filename is None and url is None and data is None:
                          raise ValueError("No audio data found. Expecting filename, url, or data.")
                      if embed is False and url is None:
                      if self.data is not None and not isinstance(self.data, bytes):
                          if rate is None:
                              raise ValueError("rate must be specified when data is a numpy array or list of audio samples.")
-                         self.data = Audio._make_wav(data, rate)
+                         self.data = Audio._make_wav(data, rate, normalize)
                  def reload(self):
                      """Reload the raw data from file or URL."""
                          self.mimetype = "audio/wav"
                  @staticmethod
-                 def _make_wav(data, rate):
+                 def _make_wav(data, rate, normalize):
                      """ Transform a numpy array to a PCM bytestring """
                      import struct
                      from io import BytesIO
                      import wave
                      try:
-                         scaled, nchan = Audio._validate_and_normalize_with_numpy(data)
+                         scaled, nchan = Audio._validate_and_normalize_with_numpy(data, normalize)
                      except ImportError:
-                         scaled, nchan = Audio._validate_and_normalize_without_numpy(data)
+                         scaled, nchan = Audio._validate_and_normalize_without_numpy(data, normalize)
                      fp = BytesIO()
                      waveobj = wave.open(fp,mode='wb')
                      return val
                  @staticmethod
-                 def _validate_and_normalize_with_numpy(data):
+                 def _validate_and_normalize_with_numpy(data, normalize):
                      import numpy as np
                      data = np.array(data, dtype=float)
                          data = data.T.ravel()
                      else:
                          raise ValueError('Array audio input must be a 1D or 2D array')
-                     scaled = np.int16(data/np.max(np.abs(data))*32767).tolist()
+                     max_abs_value = np.max(np.abs(data))
+                     normalization_factor = Audio._get_normalization_factor(max_abs_value, normalize)
+                     scaled = np.int16(data / normalization_factor * 32767).tolist()
                      return scaled, nchan
                  @staticmethod
-                 def _validate_and_normalize_without_numpy(data):
+                 def _validate_and_normalize_without_numpy(data, normalize):
                      try:
-                         maxabsvalue = float(max([abs(x) for x in data]))
+                         max_abs_value = float(max([abs(x) for x in data]))
                      except TypeError:
                          raise TypeError('Only lists of mono audio are '
                              'supported if numpy is not installed')
-                     scaled = [int(x/maxabsvalue*32767) for x in data]
+                     normalization_factor = Audio._get_normalization_factor(max_abs_value, normalize)
+                     scaled = [int(x / normalization_factor * 32767) for x in data]
                      nchan = 1
                      return scaled, nchan
+                 @staticmethod
+                 def _get_normalization_factor(max_abs_value, normalize):
+                     if not normalize and max_abs_value > 1:
+                         raise ValueError('Audio data must be between -1 and 1 when normalize=False.')
+                     return max_abs_value if normalize else 1
                  def _data_and_metadata(self):
                      """shortcut for returning metadata with url information, if defined"""
                      md = {}

IPython/lib/tests/test_display.py

0 +63 -19

		@@ -19,7 +19,10 b' try:'
19	19	import pathlib
20	20	except ImportError:
21	21	pass
22		from unittest import mock
	22	from unittest import TestCase, mock
	23	import struct
	24	import wave
	25	from io import BytesIO
23	26
24	27	# Third-party imports
25	28	import nose.tools as nt
		@@ -184,25 +187,66 b' def test_audio_from_file():'
184	187	path = pjoin(dirname(__file__), 'test.wav')
185	188	display.Audio(filename=path)
186	189
187		def test_audio_from_numpy_array():
188		display.Audio(get_test_tone(), rate=44100)
189
190		def test_audio_from_list_without_numpy():
191		# Simulate numpy not installed.
192		with mock.patch('numpy.array', side_effect=ImportError):
193		display.Audio(list(get_test_tone()), rate=44100)
194
195		def test_audio_from_list_without_numpy_raises_for_nested_list():
196		# Simulate numpy not installed.
197		with mock.patch('numpy.array', side_effect=ImportError):
	190	class TestAudioDataWithNumpy(TestCase):
	191	def test_audio_from_numpy_array(self):
	192	test_tone = get_test_tone()
	193	audio = display.Audio(test_tone, rate=44100)
	194	nt.assert_equal(len(read_wav(audio.data)), len(test_tone))
	195
	196	def test_audio_from_list(self):
	197	test_tone = get_test_tone()
	198	audio = display.Audio(list(test_tone), rate=44100)
	199	nt.assert_equal(len(read_wav(audio.data)), len(test_tone))
	200
	201	def test_audio_from_numpy_array_without_rate_raises(self):
	202	nt.assert_raises(ValueError, display.Audio, get_test_tone())
	203
	204	def test_audio_data_normalization(self):
	205	expected_max_value = numpy.iinfo(numpy.int16).max
	206	for scale in [1, 0.5, 2]:
	207	audio = display.Audio(get_test_tone(scale), rate=44100)
	208	actual_max_value = numpy.max(numpy.abs(read_wav(audio.data)))
	209	nt.assert_equal(actual_max_value, expected_max_value)
	210
	211	def test_audio_data_without_normalization(self):
	212	max_int16 = numpy.iinfo(numpy.int16).max
	213	for scale in [1, 0.5, 0.2]:
	214	test_tone = get_test_tone(scale)
	215	test_tone_max_abs = numpy.max(numpy.abs(test_tone))
	216	expected_max_value = int(max_int16 * test_tone_max_abs)
	217	audio = display.Audio(test_tone, rate=44100, normalize=False)
	218	actual_max_value = numpy.max(numpy.abs(read_wav(audio.data)))
	219	nt.assert_equal(actual_max_value, expected_max_value)
	220
	221	def test_audio_data_without_normalization_raises_for_invalid_data(self):
	222	nt.assert_raises(
	223	ValueError,
	224	lambda: display.Audio([1.001], rate=44100, normalize=False))
	225	nt.assert_raises(
	226	ValueError,
	227	lambda: display.Audio([-1.001], rate=44100, normalize=False))
	228
	229	def simulate_numpy_not_installed():
	230	return mock.patch('numpy.array', mock.MagicMock(side_effect=ImportError))
	231
	232	@simulate_numpy_not_installed()
	233	class TestAudioDataWithoutNumpy(TestAudioDataWithNumpy):
	234	# All tests from `TestAudioDataWithNumpy` are inherited.
	235
	236	def test_audio_raises_for_nested_list(self):
198	237	stereo_signal = [list(get_test_tone())] * 2
199		nt.assert_raises(TypeError, lambda: display.Audio(stereo_signal, rate=44100))
200
201		def test_audio_from_numpy_array_without_rate_raises():
202		nt.assert_raises(ValueError, display.Audio, get_test_tone())
203
204		def get_test_tone():
205		return numpy.sin(2 * numpy.pi * 440 * numpy.linspace(0, 1, 44100))
	238	nt.assert_raises(
	239	TypeError,
	240	lambda: display.Audio(stereo_signal, rate=44100))
	241
	242	def get_test_tone(scale=1):
	243	return numpy.sin(2 * numpy.pi * 440 * numpy.linspace(0, 1, 44100)) * scale
	244
	245	def read_wav(data):
	246	with wave.open(BytesIO(data)) as wave_file:
	247	wave_data = wave_file.readframes(wave_file.getnframes())
	248	num_samples = wave_file.getnframes() * wave_file.getnchannels()
	249	return struct.unpack('<%sh' % num_samples, wave_data)
206	250
207	251	def test_code_from_file():
208	252	c = display.Code(filename=__file__)

General Comments 0

Write
Preview

You need to be logged in to leave comments. Log in now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Go to home page
g g	Go to my private gists page
g G	Go to my public gists page
g 0-9	Go to bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Go to summary page
g c	Go to changelog page
g f	Go to files page
g F	Go to files page with file search activated
g p	Go to pull requests page
g o	Go to repository settings
g O	Go to repository access permissions settings
t s	Toggle sidebar on some pages