upstream/ipython Commit - r8650:5aa788d5

remove abspath in conversion process

Matthias BUSSONNIER -

r8650:5aa788d5

parent child

converters/base.py

0 +1 -1

             from __future__ import print_function, absolute_import
             from converters.utils import remove_fake_files_url
             # Stdlib
             import codecs
             import io
             import logging
             import os
             import pprint
             from types import FunctionType
             # From IPython
             from IPython.nbformat import current as nbformat
             # local
             #-----------------------------------------------------------------------------
             # Class declarations
             #-----------------------------------------------------------------------------
             class ConversionException(Exception):
                 """Exception type declared for the converters; adds nothing to Exception."""
             class DocStringInheritor(type):
                 """
                 Metaclass that fills in missing method docstrings from base classes.
                 For every plain function in the new class body that has no docstring
                 of its own, each base is asked (in order) for an attribute with the
                 same name; the first non-empty docstring found is copied onto the new
                 function.  A function that already documents itself is left untouched.
                 Based on a recipe by Paul McGuire
                 (http://groups.google.com/group/comp.lang.python/msg/26f7b4fcb4d66c95),
                 itself following Michael Foord's metaclass tutorial
                 (http://www.voidspace.org.uk/python/articles/metaclasses.shtml).
                 """
                 def __new__(meta, classname, bases, classDict):
                     """Build the class after propagating inherited docstrings.
                     Parameters
                     ----------
                     meta : the metaclass itself
                     classname : name of the class being created
                     bases : tuple of base classes
                     classDict : namespace of the class body
                     Returns
                     -------
                     The newly created class.
                     """
                     for attributeName, attribute in classDict.items():
                         if not isinstance(attribute, FunctionType):
                             continue
                         # Never overwrite documentation the subclass wrote itself.
                         if attribute.__doc__:
                             continue
                         # look through bases for matching function by name
                         for baseclass in bases:
                             if not hasattr(baseclass, attributeName):
                                 continue
                             inherited_doc = getattr(baseclass, attributeName).__doc__
                             if inherited_doc:
                                 attribute.__doc__ = inherited_doc
                                 break
                     # Hand type() its own copy of the namespace, as the original did.
                     return type.__new__(meta, classname, bases, dict(classDict))
             class Converter(object):
                 # Base class for notebook converters: conversion is driven by
                 # convert()/render(), which dispatch to render_* methods.
                 # Python 2 metaclass hook: the class is created by DocStringInheritor.
                 __metaclass__ = DocStringInheritor
                 # Encoding used by save() (when none is passed) and by _new_figure()
                 # for non-binary figures.
                 default_encoding = 'utf-8'
                 # Output file extension; save() appends it to outbase after a dot.
                 extension = str()
                 # Number of figures written so far; used to number figure file names.
                 figures_counter = 0
                 # Path of the input notebook, set in __init__.
                 infile = str()
                 # Directory part of infile, set in __init__.
                 infile_dir = str()
                 # File name of infile without directory or extension, set in __init__.
                 infile_root = str()
                 # Directory receiving extracted figures ('<infile_root>_files').
                 files_dir = str()
                 # NOTE(review): not read in the visible code; presumably consumed by
                 # subclasses -- confirm.
                 with_preamble = True
                 # NOTE(review): not read in the visible code; presumably consumed by
                 # subclasses -- confirm.
                 user_preamble = None
                 # Result of the last convert() call, stored by render().
                 output = unicode()
                 # NOTE(review): not read in the visible code; presumably consumed by
                 # subclasses -- confirm.
                 raw_as_verbatim = False
                 def __init__(self, infile):
                     """Record the input path and prepare the figures directory.
                     Splits ``infile`` into its directory and extension-less root name,
                     creates the ``<root>_files`` directory next to the input file if
                     it does not exist yet, and stores the derived paths on the
                     instance (``infile_dir``, ``infile_root``, ``files_dir``,
                     ``outbase``).
                     Parameters
                     ----------
                     infile : string
                       Path of the notebook file to convert.
                     """
                     self.infile = infile
                     self.infile_dir, infile_root = os.path.split(infile)
                     infile_root = os.path.splitext(infile_root)[0]
                     files_dir = os.path.join(self.infile_dir, infile_root + '_files')
                     if not os.path.isdir(files_dir):
                         os.mkdir(files_dir)
                     self.infile_root = infile_root
-                    self.files_dir = os.path.abspath(files_dir)
+                    self.files_dir = files_dir
                     # Output path without extension; save() appends '.' + extension.
                     self.outbase = os.path.join(self.infile_dir, infile_root)
                 def __del__(self):
                     if os.path.isdir(self.files_dir) and not os.listdir(self.files_dir):
                         os.rmdir(self.files_dir)
                 def dispatch(self, cell_type):
                     """return cell_type dependent render method,  for example render_code
                     """
                     return getattr(self, 'render_' + cell_type, self.render_unknown)
                 def dispatch_display_format(self, format):
                     """return output_type dependent render method,  for example render_output_text
                     """
                     return getattr(self, 'render_display_format_' + format, self.render_unknown_display)
                 def convert(self, cell_separator='\n'):
                     """
                     Generic method to converts notebook to a string representation.
                     This is accomplished by dispatching on the cell_type, so subclasses of
                     Convereter class do not need to re-implement this method, but just
                     need implementation for the methods that will be dispatched.
                     Parameters
                     ----------
                     cell_separator : string
                       Character or string to join cells with. Default is "\n"
                     Returns
                     -------
                     out : string
                     """
                     lines = []
                     lines.extend(self.optional_header())
                     lines.extend(self.main_body(cell_separator))
                     lines.extend(self.optional_footer())
                     return u'\n'.join(lines)
                 def main_body(self, cell_separator='\n'):
                     converted_cells = []
                     for worksheet in self.nb.worksheets:
                         for cell in worksheet.cells:
                             #print(cell.cell_type)  # dbg
                             conv_fn = self.dispatch(cell.cell_type)
                             if cell.cell_type in ('markdown', 'raw'):
                                 remove_fake_files_url(cell)
                             converted_cells.append('\n'.join(conv_fn(cell)))
                     cell_lines = cell_separator.join(converted_cells).split('\n')
                     return cell_lines
                 def render(self):
                     """Read (if not done yet), convert, and save self.infile.
                     Returns whatever save() returns.
                     """
                     already_loaded = hasattr(self, 'nb')
                     if not already_loaded:
                         self.read()
                     converted = self.convert()
                     self.output = converted
                     # Sanity check: the converted document must be a unicode string.
                     assert(type(self.output) == unicode)
                     return self.save()
                 def read(self):
                     """Parse the notebook at self.infile (JSON format) into self.nb."""
                     with open(self.infile) as notebook_file:
                         self.nb = nbformat.read(notebook_file, 'json')
                 def save(self, outfile=None, encoding=None):
                     "read and parse notebook into self.nb"
                     if outfile is None:
                         outfile = self.outbase + '.' + self.extension
                     if encoding is None:
                         encoding = self.default_encoding
                     with io.open(outfile, 'w', encoding=encoding) as f:
                         f.write(self.output)
                     return os.path.abspath(outfile)
                 def optional_header(self):
                     """
                     Optional header to insert at the top of the converted notebook
                     Returns a list
                     """
                     return []
                 def optional_footer(self):
                     """
                     Optional footer to insert at the end of the converted notebook
                     Returns a list
                     """
                     return []
                 def _new_figure(self, data, fmt):
                     """Create a new figure file in the given format.
                     Returns a path relative to the input file.
                     """
                     figname = '%s_fig_%02i.%s' % (self.infile_root,
                                                   self.figures_counter, fmt)
                     self.figures_counter += 1
                     fullname = os.path.join(self.files_dir, figname)
                     # Binary files are base64-encoded, SVG is already XML
                     if fmt in ('png', 'jpg', 'pdf'):
                         data = data.decode('base64')
                         fopen = lambda fname: open(fname, 'wb')
                     else:
                         fopen = lambda fname: codecs.open(fname, 'wb', self.default_encoding)
                     with fopen(fullname) as f:
                         f.write(data)
                     return fullname
                 def render_heading(self, cell):
                     """convert a heading cell
                     Returns list."""
                     raise NotImplementedError
                 def render_code(self, cell):
                     """Convert a code cell
                     Returns list."""
                     raise NotImplementedError
                 def render_markdown(self, cell):
                     """convert a markdown cell
                     Returns list."""
                     raise NotImplementedError
                 def _img_lines(self, img_file):
                     """Return list of lines to include an image file."""
                     # Note: subclasses may choose to implement format-specific _FMT_lines
                     # methods if they so choose (FMT in {png, svg, jpg, pdf}).
                     raise NotImplementedError
                 def render_display_data(self, output):
                     """convert display data from the output of a code cell
                     Returns list.
                     """
                     lines = []
                     for fmt in output.keys():
                         if fmt in ['png', 'svg', 'jpg', 'pdf']:
                             img_file = self._new_figure(output[fmt], fmt)
                             # Subclasses can have format-specific render functions (e.g.,
                             # latex has to auto-convert all SVG to PDF first).
                             lines_fun = getattr(self, '_%s_lines' % fmt, None)
                             if not lines_fun:
                                 lines_fun = self._img_lines
                             lines.extend(lines_fun(img_file))
                         elif fmt != 'output_type':
                             conv_fn = self.dispatch_display_format(fmt)
                             lines.extend(conv_fn(output))
                     return lines
                 def render_raw(self, cell):
                     """convert a cell with raw text
                     Returns list."""
                     raise NotImplementedError
                 def render_unknown(self, cell):
                     """Render cells of unkown type
                     Returns list."""
                     data = pprint.pformat(cell)
                     logging.warning('Unknown cell: %s' % cell.cell_type)
                     return self._unknown_lines(data)
                 def render_unknown_display(self, output, type):
                     """Render cells of unkown type
                     Returns list."""
                     data = pprint.pformat(output)
                     logging.warning('Unknown output: %s' % output.output_type)
                     return self._unknown_lines(data)
                 def render_stream(self, output):
                     """render the stream part of an output
                     Returns list.
                     Identical to render_display_format_text
                     """
                     return self.render_display_format_text(output)
                 def render_pyout(self, output):
                     """convert pyout part of a code cell
                     Returns list."""
                     raise NotImplementedError
                 def render_pyerr(self, output):
                     """convert pyerr part of a code cell
                     Returns list."""
                     raise NotImplementedError
                 def _unknown_lines(self, data):
                     """Return list of lines for an unknown cell.
                     Parameters
                     ----------
                     data : str
                       The content of the unknown data as a single string.
                     """
                     raise NotImplementedError
                 # These are the possible format types in an output node
                 def render_display_format_text(self, output):
                     """render the text part of an output
                     Returns list.
                     """
                     raise NotImplementedError
                 def render_display_format_html(self, output):
                     """render the html part of an output
                     Returns list.
                     """
                     raise NotImplementedError
                 def render_display_format_latex(self, output):
                     """render the latex part of an output
                     Returns list.
                     """
                     raise NotImplementedError
                 def render_display_format_json(self, output):
                     """render the json part of an output
                     Returns list.
                     """
                     raise NotImplementedError
                 def render_display_format_javascript(self, output):
                     """render the javascript part of an output
                     Returns list.
                     """
                     raise NotImplementedError

tests/ipynbref/IntroNumPy.orig.md

0 +10 -10

             # An Introduction to the Scientific Python Ecosystem
             While the Python language is an excellent tool for general-purpose programming, with a highly readable syntax, rich and powerful data types (strings, lists, sets, dictionaries, arbitrary length integers, etc) and a very comprehensive standard library, it was not designed specifically for mathematical and scientific computing.  Neither the language nor its standard library have facilities for the efficient representation of multidimensional datasets, tools for linear algebra and general matrix manipulations (an essential building block of virtually all technical computing), nor any data visualization facilities.
             In particular, Python lists are very flexible containers that can be nested arbitrarily deep and which can hold any Python object in them, but they are poorly suited to represent efficiently common mathematical constructs like vectors and matrices.  In contrast, much of our modern heritage of scientific computing has been built on top of libraries written in the Fortran language, which has native support for vectors and matrices as well as a library of mathematical functions that can efficiently operate on entire arrays at once.
             ## Scientific Python: a collaboration of projects built by scientists
             The scientific community has developed a set of related Python libraries that provide powerful array facilities, linear algebra, numerical algorithms, data visualization and more.  In this appendix, we will briefly outline the tools most frequently used for this purpose, that make "Scientific Python" something far more powerful than the Python language alone.
             For reasons of space, we can only describe in some detail the central Numpy library, but below we provide links to the websites of each project where you can read their documentation in more detail.
             First, let's look at an overview of the basic tools that most scientists use in daily research with Python.  The core of this ecosystem is composed of:
             * Numpy: the basic library that most others depend on, it provides a powerful array type that can represent multidimensional datasets of many different kinds and that supports arithmetic operations. Numpy also provides a library of common mathematical functions, basic linear algebra, random number generation and Fast Fourier Transforms.  Numpy can be found at [numpy.scipy.org](http://numpy.scipy.org)
             * Scipy: a large collection of numerical algorithms that operate on numpy arrays and provide facilities for many common tasks in scientific computing, including dense and sparse linear algebra support, optimization, special functions, statistics, n-dimensional image processing, signal processing and more. Scipy can be found at [scipy.org](http://scipy.org).
             * Matplotlib: a data visualization library with a strong focus on producing high-quality output, it supports a variety of common scientific plot types in two and three dimensions, with precise control over the final output and format for publication-quality results.  Matplotlib can also be controlled interactively allowing graphical manipulation of your data (zooming, panning, etc) and can be used with most modern user interface toolkits.  It can be found at [matplotlib.sf.net](http://matplotlib.sf.net).
             * IPython: while not strictly scientific in nature, IPython is the interactive environment in which many scientists spend their time.  IPython provides a powerful Python shell that integrates tightly with Matplotlib and with easy access to the files and operating system, and which can execute in a terminal or in a graphical Qt console. IPython also has a web-based notebook interface that can combine code with text, mathematical expressions, figures and multimedia.  It can be found at [ipython.org](http://ipython.org).
             While each of these tools can be installed separately, in our opinion the most convenient way today of accessing them (especially on Windows and Mac computers) is to install the [Free Edition of the Enthought Python Distribution](http://www.enthought.com/products/epd_free.php) which contains all the above.  Other free alternatives on Windows (but not on Macs) are [Python(x,y)](http://code.google.com/p/pythonxy) and [ Christoph Gohlke's packages page](http://www.lfd.uci.edu/~gohlke/pythonlibs).
             These four 'core' libraries are in practice complemented by a number of other tools for more specialized work.  We will briefly list here the ones that we think are the most commonly needed:
             * Sympy: a symbolic manipulation tool that turns a Python session into a computer algebra system.  It integrates with the IPython notebook, rendering results in properly typeset mathematical notation.  [sympy.org](http://sympy.org).
             * Mayavi: sophisticated 3d data visualization; [code.enthought.com/projects/mayavi](http://code.enthought.com/projects/mayavi).
             * Cython: a bridge language between Python and C, useful both to optimize performance bottlenecks in Python and to access C libraries directly; [cython.org](http://cython.org).
             * Pandas: high-performance data structures and data analysis tools, with powerful data alignment and structural manipulation capabilities; [pandas.pydata.org](http://pandas.pydata.org).
             * Statsmodels: statistical data exploration and model estimation; [statsmodels.sourceforge.net](http://statsmodels.sourceforge.net).
             * Scikit-learn: general purpose machine learning algorithms with a common interface; [scikit-learn.org](http://scikit-learn.org).
             * Scikits-image: image processing toolbox; [scikits-image.org](http://scikits-image.org).
             * NetworkX: analysis of complex networks (in the graph theoretical sense); [networkx.lanl.gov](http://networkx.lanl.gov).
             * PyTables: management of hierarchical datasets using the industry-standard HDF5 format; [www.pytables.org](http://www.pytables.org).
             Beyond these, for any specific problem you should look on the internet first, before starting to write code from scratch.  There's a good chance that someone, somewhere, has written an open source library that you can use for part or all of your problem.
             ## A note about the examples below
             In all subsequent examples, you will see blocks of input code, followed by the results of the code if the code generated output.  This output may include text, graphics and other result objects.  These blocks of input can be pasted into your interactive IPython session or notebook for you to execute.  In the print version of this document, a thin vertical bar on the left of the blocks of input and output shows which blocks go together.
             If you are reading this text as an actual IPython notebook, you can press `Shift-Enter` or use the 'play' button on the toolbar (right-pointing triangle) to execute each block of code, known as a 'cell' in IPython:
             <div class="highlight"><pre><span class="c"># This is a block of code, below you&#39;ll see its output</span>
             <span class="k">print</span> <span class="s">&quot;Welcome to the world of scientific computing with Python!&quot;</span>
             </pre></div>
                 Welcome to the world of scientific computing with Python!
             # Motivation: the trapezoidal rule
             In subsequent sections we'll provide a basic introduction to the nuts and bolts of the basic scientific python tools; but we'll first motivate it with a brief example that illustrates what you can do in a few lines with these tools.  For this, we will use the simple problem of approximating a definite integral with the trapezoid rule:
             $$
             \int_{a}^{b} f(x)\, dx \approx \frac{1}{2} \sum_{k=1}^{N} \left( x_{k} - x_{k-1} \right) \left( f(x_{k}) + f(x_{k-1}) \right).
             $$
             Our task will be to compute this formula for a function such as:
             $$
             f(x) = (x-3)(x-5)(x-7)+85
             $$
             integrated between $a=1$ and $b=9$.
             First, we define the function and sample it evenly between 0 and 10 at 200 points:
             <div class="highlight"><pre><span class="k">def</span> <span class="nf">f</span><span class="p">(</span><span class="n">x</span><span class="p">):</span>
                 <span class="k">return</span> <span class="p">(</span><span class="n">x</span><span class="o">-</span><span class="mi">3</span><span class="p">)</span><span class="o">*</span><span class="p">(</span><span class="n">x</span><span class="o">-</span><span class="mi">5</span><span class="p">)</span><span class="o">*</span><span class="p">(</span><span class="n">x</span><span class="o">-</span><span class="mi">7</span><span class="p">)</span><span class="o">+</span><span class="mi">85</span>
             <span class="kn">import</span> <span class="nn">numpy</span> <span class="kn">as</span> <span class="nn">np</span>
             <span class="n">x</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">linspace</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="mi">10</span><span class="p">,</span> <span class="mi">200</span><span class="p">)</span>
             <span class="n">y</span> <span class="o">=</span> <span class="n">f</span><span class="p">(</span><span class="n">x</span><span class="p">)</span>
             </pre></div>
             We select $a$ and $b$, our integration limits, and we take only a few points in that region to illustrate the error behavior of the trapezoid approximation:
             <div class="highlight"><pre><span class="n">a</span><span class="p">,</span> <span class="n">b</span> <span class="o">=</span> <span class="mi">1</span><span class="p">,</span> <span class="mi">9</span>
             <span class="n">xint</span> <span class="o">=</span> <span class="n">x</span><span class="p">[</span><span class="n">logical_and</span><span class="p">(</span><span class="n">x</span><span class="o">&gt;=</span><span class="n">a</span><span class="p">,</span> <span class="n">x</span><span class="o">&lt;=</span><span class="n">b</span><span class="p">)][::</span><span class="mi">30</span><span class="p">]</span>
             <span class="n">yint</span> <span class="o">=</span> <span class="n">y</span><span class="p">[</span><span class="n">logical_and</span><span class="p">(</span><span class="n">x</span><span class="o">&gt;=</span><span class="n">a</span><span class="p">,</span> <span class="n">x</span><span class="o">&lt;=</span><span class="n">b</span><span class="p">)][::</span><span class="mi">30</span><span class="p">]</span>
             </pre></div>
             Let's plot both the function and the area below it in the trapezoid approximation:
             <div class="highlight"><pre><span class="kn">import</span> <span class="nn">matplotlib.pyplot</span> <span class="kn">as</span> <span class="nn">plt</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">plot</span><span class="p">(</span><span class="n">x</span><span class="p">,</span> <span class="n">y</span><span class="p">,</span> <span class="n">lw</span><span class="o">=</span><span class="mi">2</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">axis</span><span class="p">([</span><span class="mi">0</span><span class="p">,</span> <span class="mi">10</span><span class="p">,</span> <span class="mi">0</span><span class="p">,</span> <span class="mi">140</span><span class="p">])</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">fill_between</span><span class="p">(</span><span class="n">xint</span><span class="p">,</span> <span class="mi">0</span><span class="p">,</span> <span class="n">yint</span><span class="p">,</span> <span class="n">facecolor</span><span class="o">=</span><span class="s">&#39;gray&#39;</span><span class="p">,</span> <span class="n">alpha</span><span class="o">=</span><span class="mf">0.4</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">text</span><span class="p">(</span><span class="mf">0.5</span> <span class="o">*</span> <span class="p">(</span><span class="n">a</span> <span class="o">+</span> <span class="n">b</span><span class="p">),</span> <span class="mi">30</span><span class="p">,</span><span class="s">r&quot;$\int_a^b f(x)dx$&quot;</span><span class="p">,</span> <span class="n">horizontalalignment</span><span class="o">=</span><span class="s">&#39;center&#39;</span><span class="p">,</span> <span class="n">fontsize</span><span class="o">=</span><span class="mi">20</span><span class="p">);</span>
             </pre></div>
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_00.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_00.svg)
             Compute the integral both at high accuracy and with the trapezoid approximation
             <div class="highlight"><pre><span class="kn">from</span> <span class="nn">scipy.integrate</span> <span class="kn">import</span> <span class="n">quad</span><span class="p">,</span> <span class="n">trapz</span>
             <span class="n">integral</span><span class="p">,</span> <span class="n">error</span> <span class="o">=</span> <span class="n">quad</span><span class="p">(</span><span class="n">f</span><span class="p">,</span> <span class="mi">1</span><span class="p">,</span> <span class="mi">9</span><span class="p">)</span>
             <span class="n">trap_integral</span> <span class="o">=</span> <span class="n">trapz</span><span class="p">(</span><span class="n">yint</span><span class="p">,</span> <span class="n">xint</span><span class="p">)</span>
             <span class="k">print</span> <span class="s">&quot;The integral is: </span><span class="si">%g</span><span class="s"> +/- </span><span class="si">%.1e</span><span class="s">&quot;</span> <span class="o">%</span> <span class="p">(</span><span class="n">integral</span><span class="p">,</span> <span class="n">error</span><span class="p">)</span>
             <span class="k">print</span> <span class="s">&quot;The trapezoid approximation with&quot;</span><span class="p">,</span> <span class="nb">len</span><span class="p">(</span><span class="n">xint</span><span class="p">),</span> <span class="s">&quot;points is:&quot;</span><span class="p">,</span> <span class="n">trap_integral</span>
             <span class="k">print</span> <span class="s">&quot;The absolute error is:&quot;</span><span class="p">,</span> <span class="nb">abs</span><span class="p">(</span><span class="n">integral</span> <span class="o">-</span> <span class="n">trap_integral</span><span class="p">)</span>
             </pre></div>
                 The integral is: 680 +/- 7.5e-12
                 The trapezoid approximation with 6 points is: 621.286411141
                 The absolute error is: 58.7135888589
             This simple example showed us how, combining the numpy, scipy and matplotlib libraries we can provide an illustration of a standard method in elementary calculus with just a few lines of code.  We will now discuss with more detail the basic usage of these tools.
             # NumPy arrays: the right data structure for scientific computing
             ## Basics of Numpy arrays
             We now turn our attention to the Numpy library, which forms the base layer for the entire 'scipy ecosystem'.  Once you have installed numpy, you can import it as
             <div class="highlight"><pre><span class="kn">import</span> <span class="nn">numpy</span>
             </pre></div>
             though in this book we will use the common shorthand
             <div class="highlight"><pre><span class="kn">import</span> <span class="nn">numpy</span> <span class="kn">as</span> <span class="nn">np</span>
             </pre></div>
             As mentioned above, the main object provided by numpy is a powerful array.  We'll start by exploring how the numpy array differs from Python lists.  We start by creating a simple list and an array with the same contents of the list:
             <div class="highlight"><pre><span class="n">lst</span> <span class="o">=</span> <span class="p">[</span><span class="mi">10</span><span class="p">,</span> <span class="mi">20</span><span class="p">,</span> <span class="mi">30</span><span class="p">,</span> <span class="mi">40</span><span class="p">]</span>
             <span class="n">arr</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">([</span><span class="mi">10</span><span class="p">,</span> <span class="mi">20</span><span class="p">,</span> <span class="mi">30</span><span class="p">,</span> <span class="mi">40</span><span class="p">])</span>
             </pre></div>
             Elements of a one-dimensional array are accessed with the same syntax as a list:
             <div class="highlight"><pre><span class="n">lst</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span>
             </pre></div>
             <pre>
             </pre>
             <div class="highlight"><pre><span class="n">arr</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span>
             </pre></div>
             <pre>
             </pre>
             <div class="highlight"><pre><span class="n">arr</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">]</span>
             </pre></div>
             <pre>
             </pre>
             <div class="highlight"><pre><span class="n">arr</span><span class="p">[</span><span class="mi">2</span><span class="p">:]</span>
             </pre></div>
             <pre>
                 array([30, 40])
             </pre>
             The first difference to note between lists and arrays is that arrays are *homogeneous*; i.e. all elements of an array must be of the same type.  In contrast, lists can contain elements of arbitrary type. For example, we can change the last element in our list above to be a string:
             <div class="highlight"><pre><span class="n">lst</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">]</span> <span class="o">=</span> <span class="s">&#39;a string inside a list&#39;</span>
             <span class="n">lst</span>
             </pre></div>
             <pre>
                 [10, 20, 30, 'a string inside a list']
             </pre>
             but the same can not be done with an array, as we get an error message:
             <div class="highlight"><pre><span class="n">arr</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">]</span> <span class="o">=</span> <span class="s">&#39;a string inside an array&#39;</span>
             </pre></div>
                 ---------------------------------------------------------------------------
                 ValueError                                Traceback (most recent call last)
                 /home/fperez/teach/book-math-labtool/<ipython-input-13-29c0bfa5fa8a> in <module>()
                 ----> 1 arr[-1] = 'a string inside an array'
                 ValueError: invalid literal for long() with base 10: 'a string inside an array'
             The information about the type of an array is contained in its *dtype* attribute:
             <div class="highlight"><pre><span class="n">arr</span><span class="o">.</span><span class="n">dtype</span>
             </pre></div>
             <pre>
                 dtype('int32')
             </pre>
             Once an array has been created, its dtype is fixed and it can only store elements of the same type.  For this example where the dtype is integer, if we store a floating point number it will be automatically converted into an integer:
             <div class="highlight"><pre><span class="n">arr</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">]</span> <span class="o">=</span> <span class="mf">1.234</span>
             <span class="n">arr</span>
             </pre></div>
             <pre>
                 array([10, 20, 30,  1])
             </pre>
             Above we created an array from an existing list; let us now see other ways in which we can create arrays, which we'll illustrate next.  A common need is to have an array initialized with a constant value, and very often this value is 0 or 1 (suitable as starting value for additive and multiplicative loops respectively); `zeros` creates arrays of all zeros, with any desired dtype:
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">zeros</span><span class="p">(</span><span class="mi">5</span><span class="p">,</span> <span class="nb">float</span><span class="p">)</span>
             </pre></div>
             <pre>
                 array([ 0.,  0.,  0.,  0.,  0.])
             </pre>
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">zeros</span><span class="p">(</span><span class="mi">3</span><span class="p">,</span> <span class="nb">int</span><span class="p">)</span>
             </pre></div>
             <pre>
                 array([0, 0, 0])
             </pre>
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">zeros</span><span class="p">(</span><span class="mi">3</span><span class="p">,</span> <span class="nb">complex</span><span class="p">)</span>
             </pre></div>
             <pre>
                 array([ 0.+0.j,  0.+0.j,  0.+0.j])
             </pre>
             and similarly for `ones`:
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;5 ones:&#39;</span><span class="p">,</span> <span class="n">np</span><span class="o">.</span><span class="n">ones</span><span class="p">(</span><span class="mi">5</span><span class="p">)</span>
             </pre></div>
                 5 ones: [ 1.  1.  1.  1.  1.]
             If we want an array initialized with an arbitrary value, we can create an empty array and then use the fill method to put the value we want into the array:
             <div class="highlight"><pre><span class="n">a</span> <span class="o">=</span> <span class="n">empty</span><span class="p">(</span><span class="mi">4</span><span class="p">)</span>
             <span class="n">a</span><span class="o">.</span><span class="n">fill</span><span class="p">(</span><span class="mf">5.5</span><span class="p">)</span>
             <span class="n">a</span>
             </pre></div>
             <pre>
                 array([ 5.5,  5.5,  5.5,  5.5])
             </pre>
             Numpy also offers the `arange` function, which works like the builtin `range` but returns an array instead of a list:
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">arange</span><span class="p">(</span><span class="mi">5</span><span class="p">)</span>
             </pre></div>
             <pre>
                 array([0, 1, 2, 3, 4])
             </pre>
             and the `linspace` and `logspace` functions to create linearly and logarithmically-spaced grids respectively, with a fixed number of points and including both ends of the specified interval:
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&quot;A linear grid between 0 and 1:&quot;</span><span class="p">,</span> <span class="n">np</span><span class="o">.</span><span class="n">linspace</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="mi">1</span><span class="p">,</span> <span class="mi">5</span><span class="p">)</span>
             <span class="k">print</span> <span class="s">&quot;A logarithmic grid between 10**1 and 10**4: &quot;</span><span class="p">,</span> <span class="n">np</span><span class="o">.</span><span class="n">logspace</span><span class="p">(</span><span class="mi">1</span><span class="p">,</span> <span class="mi">4</span><span class="p">,</span> <span class="mi">4</span><span class="p">)</span>
             </pre></div>
                 A linear grid between 0 and 1: [ 0.    0.25  0.5   0.75  1.  ]
                 A logarithmic grid between 10**1 and 10**4:  [    10.    100.   1000.  10000.]
             Finally, it is often useful to create arrays with random numbers that follow a specific distribution.  The `np.random` module contains a number of functions that can be used to this effect, for example this will produce an array of 5 random samples taken from a standard normal distribution (0 mean and variance 1):
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">random</span><span class="o">.</span><span class="n">randn</span><span class="p">(</span><span class="mi">5</span><span class="p">)</span>
             </pre></div>
             <pre>
                 array([-0.08633343, -0.67375434,  1.00589536,  0.87081651,  1.65597822])
             </pre>
             whereas this will also give 5 samples, but from a normal distribution with a mean of 10 and a standard deviation of 3:
             <div class="highlight"><pre><span class="n">norm10</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">random</span><span class="o">.</span><span class="n">normal</span><span class="p">(</span><span class="mi">10</span><span class="p">,</span> <span class="mi">3</span><span class="p">,</span> <span class="mi">5</span><span class="p">)</span>
             <span class="n">norm10</span>
             </pre></div>
             <pre>
                 array([  8.94879575,   5.53038269,   8.24847281,  12.14944165,  11.56209294])
             </pre>
             ## Indexing with other arrays
             Above we saw how to index arrays with single numbers and slices, just like Python lists.  But arrays allow for a more sophisticated kind of indexing which is very powerful: you can index an array with another array, and in particular with an array of boolean values.  This is particularly useful to extract information from an array that matches a certain condition.
             Consider for example that in the array `norm10` we want to replace all values above 9 with the value 0.  We can do so by first finding the *mask* that indicates where this condition is true or false:
             <div class="highlight"><pre><span class="n">mask</span> <span class="o">=</span> <span class="n">norm10</span> <span class="o">&gt;</span> <span class="mi">9</span>
             <span class="n">mask</span>
             </pre></div>
             <pre>
                 array([False, False, False,  True,  True], dtype=bool)
             </pre>
             Now that we have this mask, we can use it to either read those values or to reset them to 0:
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;Values above 9:&#39;</span><span class="p">,</span> <span class="n">norm10</span><span class="p">[</span><span class="n">mask</span><span class="p">]</span>
             </pre></div>
                 Values above 9: [ 12.14944165  11.56209294]
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;Resetting all values above 9 to 0...&#39;</span>
             <span class="n">norm10</span><span class="p">[</span><span class="n">mask</span><span class="p">]</span> <span class="o">=</span> <span class="mi">0</span>
             <span class="k">print</span> <span class="n">norm10</span>
             </pre></div>
                 Resetting all values above 9 to 0...
                 [ 8.94879575  5.53038269  8.24847281  0.          0.        ]
             ## Arrays with more than one dimension
             Up until now all our examples have used one-dimensional arrays.  But Numpy can create arrays of arbitrary dimensions, and all the methods illustrated in the previous section work with more than one dimension.  For example, a list of lists can be used to initialize a two dimensional array:
             <div class="highlight"><pre><span class="n">lst2</span> <span class="o">=</span> <span class="p">[[</span><span class="mi">1</span><span class="p">,</span> <span class="mi">2</span><span class="p">],</span> <span class="p">[</span><span class="mi">3</span><span class="p">,</span> <span class="mi">4</span><span class="p">]]</span>
             <span class="n">arr2</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">([[</span><span class="mi">1</span><span class="p">,</span> <span class="mi">2</span><span class="p">],</span> <span class="p">[</span><span class="mi">3</span><span class="p">,</span> <span class="mi">4</span><span class="p">]])</span>
             <span class="n">arr2</span>
             </pre></div>
             <pre>
                 array([[1, 2],
                        [3, 4]])
             </pre>
             With two-dimensional arrays we start seeing the power of numpy: while a nested list can be indexed using repeatedly the `[ ]` operator, multidimensional arrays support a much more natural indexing syntax with a single `[ ]` and a set of indices separated by commas:
             <div class="highlight"><pre><span class="k">print</span> <span class="n">lst2</span><span class="p">[</span><span class="mi">0</span><span class="p">][</span><span class="mi">1</span><span class="p">]</span>
             <span class="k">print</span> <span class="n">arr2</span><span class="p">[</span><span class="mi">0</span><span class="p">,</span><span class="mi">1</span><span class="p">]</span>
             </pre></div>
             Most of the array creation functions listed above can be used with more than one dimension, for example:
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">zeros</span><span class="p">((</span><span class="mi">2</span><span class="p">,</span><span class="mi">3</span><span class="p">))</span>
             </pre></div>
             <pre>
                 array([[ 0.,  0.,  0.],
                        [ 0.,  0.,  0.]])
             </pre>
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">random</span><span class="o">.</span><span class="n">normal</span><span class="p">(</span><span class="mi">10</span><span class="p">,</span> <span class="mi">3</span><span class="p">,</span> <span class="p">(</span><span class="mi">2</span><span class="p">,</span> <span class="mi">4</span><span class="p">))</span>
             </pre></div>
             <pre>
                 array([[ 11.26788826,   4.29619866,  11.09346496,   9.73861307],
                        [ 10.54025996,   9.5146268 ,  10.80367214,  13.62204505]])
             </pre>
             In fact, the shape of an array can be changed at any time, as long as the total number of elements is unchanged.  For example, if we want a 2x4 array with numbers increasing from 0, the easiest way to create it is:
             <div class="highlight"><pre><span class="n">arr</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">arange</span><span class="p">(</span><span class="mi">8</span><span class="p">)</span><span class="o">.</span><span class="n">reshape</span><span class="p">(</span><span class="mi">2</span><span class="p">,</span><span class="mi">4</span><span class="p">)</span>
             <span class="k">print</span> <span class="n">arr</span>
             </pre></div>
                 [[0 1 2 3]
                  [4 5 6 7]]
             With multidimensional arrays, you can also use slices, and you can mix and match slices and single indices in the different dimensions (using the same array as above):
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;Slicing in the second row:&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="p">[</span><span class="mi">1</span><span class="p">,</span> <span class="mi">2</span><span class="p">:</span><span class="mi">4</span><span class="p">]</span>
             <span class="k">print</span> <span class="s">&#39;All rows, third column   :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="p">[:,</span> <span class="mi">2</span><span class="p">]</span>
             </pre></div>
                 Slicing in the second row: [6 7]
                 All rows, third column   : [2 6]
             If you only provide one index, then you will get an array with one less dimension containing that row:
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;First row:  &#39;</span><span class="p">,</span> <span class="n">arr</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span>
             <span class="k">print</span> <span class="s">&#39;Second row: &#39;</span><span class="p">,</span> <span class="n">arr</span><span class="p">[</span><span class="mi">1</span><span class="p">]</span>
             </pre></div>
                 First row:   [0 1 2 3]
                 Second row:  [4 5 6 7]
             Now that we have seen how to create arrays with more than one dimension, it's a good idea to look at some of the most useful properties and methods that arrays have.  The following provide basic information about the size, shape and data in the array:
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;Data type                :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">dtype</span>
             <span class="k">print</span> <span class="s">&#39;Total number of elements :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">size</span>
             <span class="k">print</span> <span class="s">&#39;Number of dimensions     :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">ndim</span>
             <span class="k">print</span> <span class="s">&#39;Shape (dimensionality)   :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">shape</span>
             <span class="k">print</span> <span class="s">&#39;Memory used (in bytes)   :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">nbytes</span>
             </pre></div>
                 Data type                : int32
                 Total number of elements : 8
                 Number of dimensions     : 2
                 Shape (dimensionality)   : (2, 4)
                 Memory used (in bytes)   : 32
             Arrays also have many useful methods, some especially useful ones are:
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;Minimum and maximum             :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">min</span><span class="p">(),</span> <span class="n">arr</span><span class="o">.</span><span class="n">max</span><span class="p">()</span>
             <span class="k">print</span> <span class="s">&#39;Sum and product of all elements :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">sum</span><span class="p">(),</span> <span class="n">arr</span><span class="o">.</span><span class="n">prod</span><span class="p">()</span>
             <span class="k">print</span> <span class="s">&#39;Mean and standard deviation     :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">mean</span><span class="p">(),</span> <span class="n">arr</span><span class="o">.</span><span class="n">std</span><span class="p">()</span>
             </pre></div>
                 Minimum and maximum             : 0 7
                 Sum and product of all elements : 28 0
                 Mean and standard deviation     : 3.5 2.29128784748
             For these methods, the above operations are all computed on all the elements of the array.  But for a multidimensional array, it's possible to do the computation along a single dimension, by passing the `axis` parameter; for example:
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;For the following array:</span><span class="se">\n</span><span class="s">&#39;</span><span class="p">,</span> <span class="n">arr</span>
             <span class="k">print</span> <span class="s">&#39;The sum of elements along the rows is    :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">sum</span><span class="p">(</span><span class="n">axis</span><span class="o">=</span><span class="mi">1</span><span class="p">)</span>
             <span class="k">print</span> <span class="s">&#39;The sum of elements along the columns is :&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">sum</span><span class="p">(</span><span class="n">axis</span><span class="o">=</span><span class="mi">0</span><span class="p">)</span>
             </pre></div>
                 For the following array:
                 [[0 1 2 3]
                  [4 5 6 7]]
                 The sum of elements along the rows is    : [ 6 22]
                 The sum of elements along the columns is : [ 4  6  8 10]
             As you can see in this example, the value of the `axis` parameter is the dimension which will be *consumed* once the operation has been carried out.  This is why, to sum the elements of each row, we use `axis=1`: the second dimension (of length 4) is consumed, leaving one value per row.
             This can be easily illustrated with an example that has more dimensions; we create an array with 4 dimensions and shape `(3,4,5,6)` and sum along the axis number 2 (i.e. the *third* axis, since in Python all counts are 0-based).  That consumes the dimension whose length was 5, leaving us with a new array that has shape `(3,4,6)`:
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">zeros</span><span class="p">((</span><span class="mi">3</span><span class="p">,</span><span class="mi">4</span><span class="p">,</span><span class="mi">5</span><span class="p">,</span><span class="mi">6</span><span class="p">))</span><span class="o">.</span><span class="n">sum</span><span class="p">(</span><span class="mi">2</span><span class="p">)</span><span class="o">.</span><span class="n">shape</span>
             </pre></div>
             <pre>
                 (3, 4, 6)
             </pre>
             Another widely used property of arrays is the `.T` attribute, which allows you to access the transpose of the array:
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;Array:</span><span class="se">\n</span><span class="s">&#39;</span><span class="p">,</span> <span class="n">arr</span>
             <span class="k">print</span> <span class="s">&#39;Transpose:</span><span class="se">\n</span><span class="s">&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="o">.</span><span class="n">T</span>
             </pre></div>
                 Array:
                 [[0 1 2 3]
                  [4 5 6 7]]
                 Transpose:
                 [[0 4]
                  [1 5]
                  [2 6]
                  [3 7]]
             We don't have time here to look at all the methods and properties of arrays, but here's a complete list.  Simply try exploring some of these in IPython to learn more, or read their description in the full Numpy documentation:
                 arr.T             arr.copy          arr.getfield      arr.put           arr.squeeze
                 arr.all           arr.ctypes        arr.imag          arr.ravel         arr.std
                 arr.any           arr.cumprod       arr.item          arr.real          arr.strides
                 arr.argmax        arr.cumsum        arr.itemset       arr.repeat        arr.sum
                 arr.argmin        arr.data          arr.itemsize      arr.reshape       arr.swapaxes
                 arr.argsort       arr.diagonal      arr.max           arr.resize        arr.take
                 arr.astype        arr.dot           arr.mean          arr.round         arr.tofile
                 arr.base          arr.dtype         arr.min           arr.searchsorted  arr.tolist
                 arr.byteswap      arr.dump          arr.nbytes        arr.setasflat     arr.tostring
                 arr.choose        arr.dumps         arr.ndim          arr.setfield      arr.trace
                 arr.clip          arr.fill          arr.newbyteorder  arr.setflags      arr.transpose
                 arr.compress      arr.flags         arr.nonzero       arr.shape         arr.var
                 arr.conj          arr.flat          arr.prod          arr.size          arr.view
                 arr.conjugate     arr.flatten       arr.ptp           arr.sort
             ## Operating with arrays
             Arrays support all regular arithmetic operators, and the numpy library also contains a complete collection of basic mathematical functions that operate on arrays.  It is important to remember that in general, all operations with arrays are applied *element-wise*, i.e., are applied to all the elements of the array at the same time.  Consider for example:
             <div class="highlight"><pre><span class="n">arr1</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">arange</span><span class="p">(</span><span class="mi">4</span><span class="p">)</span>
             <span class="n">arr2</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">arange</span><span class="p">(</span><span class="mi">10</span><span class="p">,</span> <span class="mi">14</span><span class="p">)</span>
             <span class="k">print</span> <span class="n">arr1</span><span class="p">,</span> <span class="s">&#39;+&#39;</span><span class="p">,</span> <span class="n">arr2</span><span class="p">,</span> <span class="s">&#39;=&#39;</span><span class="p">,</span> <span class="n">arr1</span><span class="o">+</span><span class="n">arr2</span>
             </pre></div>
                 [0 1 2 3] + [10 11 12 13] = [10 12 14 16]
             Importantly, you must remember that even the multiplication operator is by default applied element-wise, it is *not* the matrix multiplication from linear algebra (as is the case in Matlab, for example):
             <div class="highlight"><pre><span class="k">print</span> <span class="n">arr1</span><span class="p">,</span> <span class="s">&#39;*&#39;</span><span class="p">,</span> <span class="n">arr2</span><span class="p">,</span> <span class="s">&#39;=&#39;</span><span class="p">,</span> <span class="n">arr1</span><span class="o">*</span><span class="n">arr2</span>
             </pre></div>
                 [0 1 2 3] * [10 11 12 13] = [ 0 11 24 39]
             While this means that in principle arrays must always match in their dimensionality in order for an operation to be valid, numpy will *broadcast* dimensions when possible.  For example, suppose that you want to add the number 1.5 to `arr1`; the following would be a valid way to do it:
             <div class="highlight"><pre><span class="n">arr1</span> <span class="o">+</span> <span class="mf">1.5</span><span class="o">*</span><span class="n">np</span><span class="o">.</span><span class="n">ones</span><span class="p">(</span><span class="mi">4</span><span class="p">)</span>
             </pre></div>
             <pre>
                 array([ 1.5,  2.5,  3.5,  4.5])
             </pre>
             But thanks to numpy's broadcasting rules, the following is equally valid:
             <div class="highlight"><pre><span class="n">arr1</span> <span class="o">+</span> <span class="mf">1.5</span>
             </pre></div>
             <pre>
                 array([ 1.5,  2.5,  3.5,  4.5])
             </pre>
             In this case, numpy looked at both operands and saw that the first (`arr1`) was a one-dimensional array of length 4 and the second was a scalar, considered a zero-dimensional object. The broadcasting rules allow numpy to:
             * *create* new dimensions of length 1 (since this doesn't change the size of the array)
             * 'stretch' a dimension of length 1 that needs to be matched to a dimension of a different size.
             So in the above example, the scalar 1.5 is effectively:
             * first 'promoted' to a 1-dimensional array of length 1
             * then, this array is 'stretched' to length 4 to match the dimension of `arr1`.
             After these two operations are complete, the addition can proceed as now both operands are one-dimensional arrays of length 4.
             This broadcasting behavior is in practice enormously powerful, especially because when numpy broadcasts to create new dimensions or to 'stretch' existing ones, it doesn't actually replicate the data.  In the example above the operation is carried out *as if* the 1.5 was a 1-d array with 1.5 in all of its entries, but no actual array was ever created.  This can save lots of memory in cases when the arrays in question are large and can have significant performance implications.
             The general rule is: when operating on two arrays, NumPy compares their shapes element-wise. It starts with the trailing dimensions, and works its way forward, creating dimensions of length 1 as needed. Two dimensions are considered compatible when
             * they are equal to begin with, or
             * one of them is 1; in this case numpy will do the 'stretching' to make them equal.
             If these conditions are not met, a `ValueError: operands could not be broadcast together` exception is thrown, indicating that the arrays have incompatible shapes. The size of the resulting array is the maximum size along each dimension of the input arrays.
             This shows how the broadcasting rules work in several dimensions:
             <div class="highlight"><pre><span class="n">b</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">([</span><span class="mi">2</span><span class="p">,</span> <span class="mi">3</span><span class="p">,</span> <span class="mi">4</span><span class="p">,</span> <span class="mi">5</span><span class="p">])</span>
             <span class="k">print</span> <span class="n">arr</span><span class="p">,</span> <span class="s">&#39;</span><span class="se">\n\n</span><span class="s">+&#39;</span><span class="p">,</span> <span class="n">b</span> <span class="p">,</span> <span class="s">&#39;</span><span class="se">\n</span><span class="s">----------------</span><span class="se">\n</span><span class="s">&#39;</span><span class="p">,</span> <span class="n">arr</span> <span class="o">+</span> <span class="n">b</span>
             </pre></div>
                 [[0 1 2 3]
                  [4 5 6 7]]
                 + [2 3 4 5]
                 ----------------
                 [[ 2  4  6  8]
                  [ 6  8 10 12]]
             Now, how could you use broadcasting to, say, add `[4, 6]` along the rows to `arr` above?  Simply performing the direct addition will produce the error we previously mentioned:
             <div class="highlight"><pre><span class="n">c</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">([</span><span class="mi">4</span><span class="p">,</span> <span class="mi">6</span><span class="p">])</span>
             <span class="n">arr</span> <span class="o">+</span> <span class="n">c</span>
             </pre></div>
                 ---------------------------------------------------------------------------
                 ValueError                                Traceback (most recent call last)
                 /home/fperez/teach/book-math-labtool/<ipython-input-45-62aa20ac1980> in <module>()
                       1 c = np.array([4, 6])
                 ----> 2 arr + c
                 ValueError: operands could not be broadcast together with shapes (2,4) (2)
             According to the rules above, the array `c` would need to have a *trailing* dimension of 1 for the broadcasting to work.  It turns out that numpy allows you to 'inject' new dimensions anywhere into an array on the fly, by indexing it with the special object `np.newaxis`:
             <div class="highlight"><pre><span class="p">(</span><span class="n">c</span><span class="p">[:,</span> <span class="n">np</span><span class="o">.</span><span class="n">newaxis</span><span class="p">])</span><span class="o">.</span><span class="n">shape</span>
             </pre></div>
             <pre>
                 (2, 1)
             </pre>
             This is exactly what we need, and indeed it works:
             <div class="highlight"><pre><span class="n">arr</span> <span class="o">+</span> <span class="n">c</span><span class="p">[:,</span> <span class="n">np</span><span class="o">.</span><span class="n">newaxis</span><span class="p">]</span>
             </pre></div>
             <pre>
                 array([[ 4,  5,  6,  7],
                        [10, 11, 12, 13]])
             </pre>
             For the full broadcasting rules, please see the official Numpy docs, which describe them in detail and with more complex examples.
             As we mentioned before, Numpy ships with a full complement of mathematical functions that work on entire arrays, including logarithms, exponentials, trigonometric and hyperbolic trigonometric functions, etc.  Furthermore, scipy ships a rich special function library in the `scipy.special` module that includes Bessel, Airy, Fresnel, Laguerre and other classical special functions.  For example, sampling the sine function at 100 points between $0$ and $2\pi$ is as simple as:
             <div class="highlight"><pre><span class="n">x</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">linspace</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="mi">2</span><span class="o">*</span><span class="n">np</span><span class="o">.</span><span class="n">pi</span><span class="p">,</span> <span class="mi">100</span><span class="p">)</span>
             <span class="n">y</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">sin</span><span class="p">(</span><span class="n">x</span><span class="p">)</span>
             </pre></div>
             ## Linear algebra in numpy
             Numpy ships with a basic linear algebra library, and all arrays have a `dot` method whose behavior is that of the scalar dot product when its arguments are vectors (one-dimensional arrays) and the traditional matrix multiplication when one or both of its arguments are two-dimensional arrays:
             <div class="highlight"><pre><span class="n">v1</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">([</span><span class="mi">2</span><span class="p">,</span> <span class="mi">3</span><span class="p">,</span> <span class="mi">4</span><span class="p">])</span>
             <span class="n">v2</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">([</span><span class="mi">1</span><span class="p">,</span> <span class="mi">0</span><span class="p">,</span> <span class="mi">1</span><span class="p">])</span>
             <span class="k">print</span> <span class="n">v1</span><span class="p">,</span> <span class="s">&#39;.&#39;</span><span class="p">,</span> <span class="n">v2</span><span class="p">,</span> <span class="s">&#39;=&#39;</span><span class="p">,</span> <span class="n">v1</span><span class="o">.</span><span class="n">dot</span><span class="p">(</span><span class="n">v2</span><span class="p">)</span>
             </pre></div>
                 [2 3 4] . [1 0 1] = 6
             Here is a regular matrix-vector multiplication, note that the array `v1` should be viewed as a *column* vector in traditional linear algebra notation; numpy makes no distinction between row and column vectors and simply verifies that the dimensions match the required rules of matrix multiplication, in this case we have a $2 \times 3$ matrix multiplied by a 3-vector, which produces a 2-vector:
             <div class="highlight"><pre><span class="n">A</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">arange</span><span class="p">(</span><span class="mi">6</span><span class="p">)</span><span class="o">.</span><span class="n">reshape</span><span class="p">(</span><span class="mi">2</span><span class="p">,</span> <span class="mi">3</span><span class="p">)</span>
             <span class="k">print</span> <span class="n">A</span><span class="p">,</span> <span class="s">&#39;x&#39;</span><span class="p">,</span> <span class="n">v1</span><span class="p">,</span> <span class="s">&#39;=&#39;</span><span class="p">,</span> <span class="n">A</span><span class="o">.</span><span class="n">dot</span><span class="p">(</span><span class="n">v1</span><span class="p">)</span>
             </pre></div>
                 [[0 1 2]
                  [3 4 5]] x [2 3 4] = [11 38]
             For matrix-matrix multiplication, the same dimension-matching rules must be satisfied, e.g. consider the difference between $A \times A^T$:
             <div class="highlight"><pre><span class="k">print</span> <span class="n">A</span><span class="o">.</span><span class="n">dot</span><span class="p">(</span><span class="n">A</span><span class="o">.</span><span class="n">T</span><span class="p">)</span>
             </pre></div>
                 [[ 5 14]
                  [14 50]]
             and $A^T \times A$:
             <div class="highlight"><pre><span class="k">print</span> <span class="n">A</span><span class="o">.</span><span class="n">T</span><span class="o">.</span><span class="n">dot</span><span class="p">(</span><span class="n">A</span><span class="p">)</span>
             </pre></div>
                 [[ 9 12 15]
                  [12 17 22]
                  [15 22 29]]
             Furthermore, the `numpy.linalg` module includes additional functionality such as determinants, matrix norms, Cholesky, eigenvalue and singular value decompositions, etc.  For even more linear algebra tools, `scipy.linalg` contains the majority of the tools in the classic LAPACK libraries as well as functions to operate on sparse matrices.  We refer the reader to the Numpy and Scipy documentations for additional details on these.
             ## Reading and writing arrays to disk
             Numpy lets you read and write arrays into files in a number of ways.  In order to use these tools well, it is critical to understand the difference between a *text* and a *binary* file containing numerical data.  In a text file, the number $\pi$ could be written as "3.141592653589793", for example: a string of digits that a human can read, with in this case 15 decimal digits.  In contrast, that same number written to a binary file would be encoded as 8 characters (bytes) that are not readable by a human but which contain the exact same data that the variable `pi` had in the computer's memory.
             The tradeoffs between the two modes are thus:
             * Text mode: occupies more space, precision can be lost (if not all digits are written to disk), but is readable and editable by hand with a text editor.  Can *only* be used for one- and two-dimensional arrays.
             * Binary mode: compact and exact representation of the data in memory, can't be read or edited by hand.  Arrays of any size and dimensionality can be saved and read without loss of information.
             First, let's see how to read and write arrays in text mode.  The `np.savetxt` function saves an array to a text file, with options to control the precision, separators and even adding a header:
             <div class="highlight"><pre><span class="n">arr</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">arange</span><span class="p">(</span><span class="mi">10</span><span class="p">)</span><span class="o">.</span><span class="n">reshape</span><span class="p">(</span><span class="mi">2</span><span class="p">,</span> <span class="mi">5</span><span class="p">)</span>
             <span class="n">np</span><span class="o">.</span><span class="n">savetxt</span><span class="p">(</span><span class="s">&#39;test.out&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="p">,</span> <span class="n">fmt</span><span class="o">=</span><span class="s">&#39;</span><span class="si">%.2e</span><span class="s">&#39;</span><span class="p">,</span> <span class="n">header</span><span class="o">=</span><span class="s">&quot;My dataset&quot;</span><span class="p">)</span>
             <span class="o">!</span>cat test.out
             </pre></div>
                 # My dataset
                 0.00e+00 1.00e+00 2.00e+00 3.00e+00 4.00e+00
                 5.00e+00 6.00e+00 7.00e+00 8.00e+00 9.00e+00
             And this same type of file can then be read with the matching `np.loadtxt` function:
             <div class="highlight"><pre><span class="n">arr2</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">loadtxt</span><span class="p">(</span><span class="s">&#39;test.out&#39;</span><span class="p">)</span>
             <span class="k">print</span> <span class="n">arr2</span>
             </pre></div>
                 [[ 0.  1.  2.  3.  4.]
                  [ 5.  6.  7.  8.  9.]]
             For binary data, Numpy provides the `np.save` and `np.savez` routines.  The first saves a single array to a file with `.npy` extension, while the latter can be used to save a *group* of arrays into a single file with `.npz` extension.  The files created with these routines can then be read with the `np.load` function.
             Let us first see how to use the simpler `np.save` function to save a single array:
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">save</span><span class="p">(</span><span class="s">&#39;test.npy&#39;</span><span class="p">,</span> <span class="n">arr2</span><span class="p">)</span>
             <span class="c"># Now we read this back</span>
             <span class="n">arr2n</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">load</span><span class="p">(</span><span class="s">&#39;test.npy&#39;</span><span class="p">)</span>
             <span class="c"># Let&#39;s see if any element is non-zero in the difference.</span>
             <span class="c"># A value of True would be a problem.</span>
             <span class="k">print</span> <span class="s">&#39;Any differences?&#39;</span><span class="p">,</span> <span class="n">np</span><span class="o">.</span><span class="n">any</span><span class="p">(</span><span class="n">arr2</span><span class="o">-</span><span class="n">arr2n</span><span class="p">)</span>
             </pre></div>
                 Any differences? False
             Now let us see how the `np.savez` function works.  You give it a filename and either a sequence of arrays or a set of keywords.  In the first mode, the function will automatically name the saved arrays in the archive as `arr_0`, `arr_1`, etc:
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">savez</span><span class="p">(</span><span class="s">&#39;test.npz&#39;</span><span class="p">,</span> <span class="n">arr</span><span class="p">,</span> <span class="n">arr2</span><span class="p">)</span>
             <span class="n">arrays</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">load</span><span class="p">(</span><span class="s">&#39;test.npz&#39;</span><span class="p">)</span>
             <span class="n">arrays</span><span class="o">.</span><span class="n">files</span>
             </pre></div>
             <pre>
                 ['arr_1', 'arr_0']
             </pre>
             Alternatively, we can explicitly choose how to name the arrays we save:
             <div class="highlight"><pre><span class="n">np</span><span class="o">.</span><span class="n">savez</span><span class="p">(</span><span class="s">&#39;test.npz&#39;</span><span class="p">,</span> <span class="n">array1</span><span class="o">=</span><span class="n">arr</span><span class="p">,</span> <span class="n">array2</span><span class="o">=</span><span class="n">arr2</span><span class="p">)</span>
             <span class="n">arrays</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">load</span><span class="p">(</span><span class="s">&#39;test.npz&#39;</span><span class="p">)</span>
             <span class="n">arrays</span><span class="o">.</span><span class="n">files</span>
             </pre></div>
             <pre>
                 ['array2', 'array1']
             </pre>
             The object returned by `np.load` from an `.npz` file works like a dictionary, though you can also access its constituent files by attribute using its special `.f` field; this is best illustrated with an example with the `arrays` object from above:
             <div class="highlight"><pre><span class="k">print</span> <span class="s">&#39;First row of first array:&#39;</span><span class="p">,</span> <span class="n">arrays</span><span class="p">[</span><span class="s">&#39;array1&#39;</span><span class="p">][</span><span class="mi">0</span><span class="p">]</span>
             <span class="c"># This is an equivalent way to get the same field</span>
             <span class="k">print</span> <span class="s">&#39;First row of first array:&#39;</span><span class="p">,</span> <span class="n">arrays</span><span class="o">.</span><span class="n">f</span><span class="o">.</span><span class="n">array1</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span>
             </pre></div>
                 First row of first array: [0 1 2 3 4]
                 First row of first array: [0 1 2 3 4]
             This `.npz` format is a very convenient way to package compactly and without loss of information, into a single file, a group of related arrays that pertain to a specific problem.  At some point, however, the complexity of your dataset may be such that the optimal approach is to use one of the standard formats in scientific data processing that have been designed to handle complex datasets, such as NetCDF or HDF5.
             Fortunately, there are tools for manipulating these formats in Python, and for storing data in other ways such as databases.  A complete discussion of the possibilities is beyond the scope of this discussion, but of particular interest for scientific users we at least mention the following:
             * The `scipy.io` module contains routines to read and write Matlab files in `.mat` format and files in the NetCDF format that is widely used in certain scientific disciplines.
             * For manipulating files in the HDF5 format, there are two excellent options in Python: The PyTables project offers a high-level, object oriented approach to manipulating HDF5 datasets, while the h5py project offers a more direct mapping to the standard HDF5 library interface.  Both are excellent tools; if you need to work with HDF5 datasets you should read some of their documentation and examples and decide which approach is a better match for your needs.
             # High quality data visualization with Matplotlib
             The [matplotlib](http://matplotlib.sf.net) library is a powerful tool capable of producing complex publication-quality figures with fine layout control in two and three dimensions; here we will only provide a minimal self-contained introduction to its usage that covers the functionality needed for the rest of the book.  We encourage the reader to read the tutorials included with the matplotlib documentation as well as to browse its extensive gallery of examples that include source code.
             Just as we typically use the shorthand `np` for Numpy, we will use `plt` for the `matplotlib.pyplot` module where the easy-to-use plotting functions reside (the library contains a rich object-oriented architecture that we don't have the space to discuss here):
             <div class="highlight"><pre><span class="kn">import</span> <span class="nn">matplotlib.pyplot</span> <span class="kn">as</span> <span class="nn">plt</span>
             </pre></div>
             The most frequently used function is simply called `plot`, here is how you can make a simple plot of $\sin(x)$ for $x \in [0, 2\pi]$ with labels and a grid (we use the semicolon in the last line to suppress the display of some information that is unnecessary right now):
             <div class="highlight"><pre><span class="n">x</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">linspace</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="mi">2</span><span class="o">*</span><span class="n">np</span><span class="o">.</span><span class="n">pi</span><span class="p">)</span>
             <span class="n">y</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">sin</span><span class="p">(</span><span class="n">x</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">plot</span><span class="p">(</span><span class="n">x</span><span class="p">,</span><span class="n">y</span><span class="p">,</span> <span class="n">label</span><span class="o">=</span><span class="s">&#39;sin(x)&#39;</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">legend</span><span class="p">()</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">grid</span><span class="p">()</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">title</span><span class="p">(</span><span class="s">&#39;Harmonic&#39;</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">xlabel</span><span class="p">(</span><span class="s">&#39;x&#39;</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">ylabel</span><span class="p">(</span><span class="s">&#39;y&#39;</span><span class="p">);</span>
             </pre></div>
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_01.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_01.svg)
             You can control the style, color and other properties of the markers, for example:
             <div class="highlight"><pre><span class="n">plt</span><span class="o">.</span><span class="n">plot</span><span class="p">(</span><span class="n">x</span><span class="p">,</span> <span class="n">y</span><span class="p">,</span> <span class="n">linewidth</span><span class="o">=</span><span class="mi">2</span><span class="p">);</span>
             </pre></div>
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_02.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_02.svg)
             <div class="highlight"><pre><span class="n">plt</span><span class="o">.</span><span class="n">plot</span><span class="p">(</span><span class="n">x</span><span class="p">,</span> <span class="n">y</span><span class="p">,</span> <span class="s">&#39;o&#39;</span><span class="p">,</span> <span class="n">markersize</span><span class="o">=</span><span class="mi">5</span><span class="p">,</span> <span class="n">color</span><span class="o">=</span><span class="s">&#39;r&#39;</span><span class="p">);</span>
             </pre></div>
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_03.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_03.svg)
             We will now see how to create a few other common plot types, such as a simple error plot:
             <div class="highlight"><pre><span class="c"># example data</span>
             <span class="n">x</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">arange</span><span class="p">(</span><span class="mf">0.1</span><span class="p">,</span> <span class="mi">4</span><span class="p">,</span> <span class="mf">0.5</span><span class="p">)</span>
             <span class="n">y</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">exp</span><span class="p">(</span><span class="o">-</span><span class="n">x</span><span class="p">)</span>
             <span class="c"># example variable error bar values</span>
             <span class="n">yerr</span> <span class="o">=</span> <span class="mf">0.1</span> <span class="o">+</span> <span class="mf">0.2</span><span class="o">*</span><span class="n">np</span><span class="o">.</span><span class="n">sqrt</span><span class="p">(</span><span class="n">x</span><span class="p">)</span>
             <span class="n">xerr</span> <span class="o">=</span> <span class="mf">0.1</span> <span class="o">+</span> <span class="n">yerr</span>
             <span class="c"># First illustrate basic pyplot interface, using defaults where possible.</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">figure</span><span class="p">()</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">errorbar</span><span class="p">(</span><span class="n">x</span><span class="p">,</span> <span class="n">y</span><span class="p">,</span> <span class="n">xerr</span><span class="o">=</span><span class="mf">0.2</span><span class="p">,</span> <span class="n">yerr</span><span class="o">=</span><span class="mf">0.4</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">title</span><span class="p">(</span><span class="s">&quot;Simplest errorbars, 0.2 in x, 0.4 in y&quot;</span><span class="p">);</span>
             </pre></div>
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_04.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_04.svg)
             A simple log plot
             <div class="highlight"><pre><span class="n">x</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">linspace</span><span class="p">(</span><span class="o">-</span><span class="mi">5</span><span class="p">,</span> <span class="mi">5</span><span class="p">)</span>
             <span class="n">y</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">exp</span><span class="p">(</span><span class="o">-</span><span class="n">x</span><span class="o">**</span><span class="mi">2</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">semilogy</span><span class="p">(</span><span class="n">x</span><span class="p">,</span> <span class="n">y</span><span class="p">);</span>
             </pre></div>
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_05.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_05.svg)
             A histogram annotated with text inside the plot, using the `text` function:
             <div class="highlight"><pre><span class="n">mu</span><span class="p">,</span> <span class="n">sigma</span> <span class="o">=</span> <span class="mi">100</span><span class="p">,</span> <span class="mi">15</span>
             <span class="n">x</span> <span class="o">=</span> <span class="n">mu</span> <span class="o">+</span> <span class="n">sigma</span> <span class="o">*</span> <span class="n">np</span><span class="o">.</span><span class="n">random</span><span class="o">.</span><span class="n">randn</span><span class="p">(</span><span class="mi">10000</span><span class="p">)</span>
             <span class="c"># the histogram of the data</span>
             <span class="n">n</span><span class="p">,</span> <span class="n">bins</span><span class="p">,</span> <span class="n">patches</span> <span class="o">=</span> <span class="n">plt</span><span class="o">.</span><span class="n">hist</span><span class="p">(</span><span class="n">x</span><span class="p">,</span> <span class="mi">50</span><span class="p">,</span> <span class="n">normed</span><span class="o">=</span><span class="mi">1</span><span class="p">,</span> <span class="n">facecolor</span><span class="o">=</span><span class="s">&#39;g&#39;</span><span class="p">,</span> <span class="n">alpha</span><span class="o">=</span><span class="mf">0.75</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">xlabel</span><span class="p">(</span><span class="s">&#39;Smarts&#39;</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">ylabel</span><span class="p">(</span><span class="s">&#39;Probability&#39;</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">title</span><span class="p">(</span><span class="s">&#39;Histogram of IQ&#39;</span><span class="p">)</span>
             <span class="c"># This will put a text fragment at the position given:</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">text</span><span class="p">(</span><span class="mi">55</span><span class="p">,</span> <span class="o">.</span><span class="mo">027</span><span class="p">,</span> <span class="s">r&#39;$\mu=100,\ \sigma=15$&#39;</span><span class="p">,</span> <span class="n">fontsize</span><span class="o">=</span><span class="mi">14</span><span class="p">)</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">axis</span><span class="p">([</span><span class="mi">40</span><span class="p">,</span> <span class="mi">160</span><span class="p">,</span> <span class="mi">0</span><span class="p">,</span> <span class="mf">0.03</span><span class="p">])</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">grid</span><span class="p">(</span><span class="bp">True</span><span class="p">)</span>
             </pre></div>
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_06.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_06.svg)
             ## Image display
             The `imshow` command can display single or multi-channel images.  A simple array of random numbers, plotted in grayscale:
             <div class="highlight"><pre><span class="kn">from</span> <span class="nn">matplotlib</span> <span class="kn">import</span> <span class="n">cm</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">imshow</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">random</span><span class="o">.</span><span class="n">rand</span><span class="p">(</span><span class="mi">5</span><span class="p">,</span> <span class="mi">10</span><span class="p">),</span> <span class="n">cmap</span><span class="o">=</span><span class="n">cm</span><span class="o">.</span><span class="n">gray</span><span class="p">,</span> <span class="n">interpolation</span><span class="o">=</span><span class="s">&#39;nearest&#39;</span><span class="p">);</span>
             </pre></div>
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_07.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_07.svg)
             A real photograph is a multichannel image, `imshow` interprets it correctly:
             <div class="highlight"><pre><span class="n">img</span> <span class="o">=</span> <span class="n">plt</span><span class="o">.</span><span class="n">imread</span><span class="p">(</span><span class="s">&#39;stinkbug.png&#39;</span><span class="p">)</span>
             <span class="k">print</span> <span class="s">&#39;Dimensions of the array img:&#39;</span><span class="p">,</span> <span class="n">img</span><span class="o">.</span><span class="n">shape</span>
             <span class="n">plt</span><span class="o">.</span><span class="n">imshow</span><span class="p">(</span><span class="n">img</span><span class="p">);</span>
             </pre></div>
                 Dimensions of the array img: (375, 500, 3)
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_08.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_08.svg)
             ## Simple 3d plotting with matplotlib
             Note that you must execute at least once in your session:
             <div class="highlight"><pre><span class="kn">from</span> <span class="nn">mpl_toolkits.mplot3d</span> <span class="kn">import</span> <span class="n">Axes3D</span>
             </pre></div>
             Once this has been done, you can create 3d axes with the `projection='3d'` keyword to `add_subplot`:
                 fig = plt.figure()
                 fig.add_subplot(<other arguments here>, projection='3d')
             A simple surface plot:
             <div class="highlight"><pre><span class="kn">from</span> <span class="nn">mpl_toolkits.mplot3d.axes3d</span> <span class="kn">import</span> <span class="n">Axes3D</span>
             <span class="kn">from</span> <span class="nn">matplotlib</span> <span class="kn">import</span> <span class="n">cm</span>
             <span class="n">fig</span> <span class="o">=</span> <span class="n">plt</span><span class="o">.</span><span class="n">figure</span><span class="p">()</span>
             <span class="n">ax</span> <span class="o">=</span> <span class="n">fig</span><span class="o">.</span><span class="n">add_subplot</span><span class="p">(</span><span class="mi">1</span><span class="p">,</span> <span class="mi">1</span><span class="p">,</span> <span class="mi">1</span><span class="p">,</span> <span class="n">projection</span><span class="o">=</span><span class="s">&#39;3d&#39;</span><span class="p">)</span>
             <span class="n">X</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">arange</span><span class="p">(</span><span class="o">-</span><span class="mi">5</span><span class="p">,</span> <span class="mi">5</span><span class="p">,</span> <span class="mf">0.25</span><span class="p">)</span>
             <span class="n">Y</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">arange</span><span class="p">(</span><span class="o">-</span><span class="mi">5</span><span class="p">,</span> <span class="mi">5</span><span class="p">,</span> <span class="mf">0.25</span><span class="p">)</span>
             <span class="n">X</span><span class="p">,</span> <span class="n">Y</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">meshgrid</span><span class="p">(</span><span class="n">X</span><span class="p">,</span> <span class="n">Y</span><span class="p">)</span>
             <span class="n">R</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">sqrt</span><span class="p">(</span><span class="n">X</span><span class="o">**</span><span class="mi">2</span> <span class="o">+</span> <span class="n">Y</span><span class="o">**</span><span class="mi">2</span><span class="p">)</span>
             <span class="n">Z</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">sin</span><span class="p">(</span><span class="n">R</span><span class="p">)</span>
             <span class="n">surf</span> <span class="o">=</span> <span class="n">ax</span><span class="o">.</span><span class="n">plot_surface</span><span class="p">(</span><span class="n">X</span><span class="p">,</span> <span class="n">Y</span><span class="p">,</span> <span class="n">Z</span><span class="p">,</span> <span class="n">rstride</span><span class="o">=</span><span class="mi">1</span><span class="p">,</span> <span class="n">cstride</span><span class="o">=</span><span class="mi">1</span><span class="p">,</span> <span class="n">cmap</span><span class="o">=</span><span class="n">cm</span><span class="o">.</span><span class="n">jet</span><span class="p">,</span>
                     <span class="n">linewidth</span><span class="o">=</span><span class="mi">0</span><span class="p">,</span> <span class="n">antialiased</span><span class="o">=</span><span class="bp">False</span><span class="p">)</span>
             <span class="n">ax</span><span class="o">.</span><span class="n">set_zlim3d</span><span class="p">(</span><span class="o">-</span><span class="mf">1.01</span><span class="p">,</span> <span class="mf">1.01</span><span class="p">);</span>
             </pre></div>
-            ![](/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_09.svg)
+            ![](tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_09.svg)
             # IPython: a powerful interactive environment
             A key component of the everyday workflow of most scientific computing environments is a good interactive environment, that is, a system in which you can execute small amounts of code and view the results immediately, combining both printing out data and opening graphical visualizations.  All modern systems for scientific computing, commercial and open source, include such functionality.
             Out of the box, Python also offers a simple interactive shell with very limited capabilities.  But just like the scientific community built Numpy to provide arrays suited for scientific work (since Python's lists aren't optimal for this task), it has also developed an interactive environment much more sophisticated than the built-in one.  The [IPython project](http://ipython.org) offers a set of tools to make productive use of the Python language, all the while working interactively and with immediate feedback on your results.  The basic tools that IPython provides are:
             1. A powerful terminal shell, with many features designed to increase the fluidity and productivity of everyday scientific workflows, including:
                 * rich introspection of all objects and variables including easy access to the source code of any function
                 * powerful and extensible tab completion of variables and filenames,
                 * tight integration with matplotlib, supporting interactive figures that don't block the terminal,
                 * direct access to the filesystem and underlying operating system,
                 * an extensible system for shell-like commands called 'magics' that reduce the work needed to perform many common tasks,
                 * tools for easily running, timing, profiling and debugging your codes,
                 * syntax highlighted error messages with much more detail than the default Python ones,
                 * logging and access to all previous history of inputs, including across sessions
             2. A Qt console that provides the look and feel of a terminal, but adds support for inline figures, graphical calltips, a persistent session that can survive crashes (even segfaults) of the kernel process, and more.
             3. A web-based notebook that can execute code and also contain rich text and figures, mathematical equations and arbitrary HTML. This notebook presents a document-like view with cells where code is executed but that can be edited in-place, reordered, mixed with explanatory text and figures, etc.
             4. A high-performance, low-latency system for parallel computing that supports the control of a cluster of IPython engines communicating over a network, with optimizations that minimize unnecessary copying of large objects (especially numpy arrays).
             We will now discuss the highlights of the tools 1-3 above so that you can make them an effective part of your workflow.  The topic of parallel computing is beyond the scope of this document, but we encourage you to read the extensive [documentation](http://ipython.org/ipython-doc/rel-0.12.1/parallel/index.html) and [tutorials](http://minrk.github.com/scipy-tutorial-2011/) on this available on the IPython website.
             ## The IPython terminal
             You can start IPython at the terminal simply by typing:
                 $ ipython
             which will provide you some basic information about how to get started and will then open a prompt labeled `In [1]:` for you to start typing.  Here we type $2^{64}$ and Python computes the result for us in exact arithmetic, returning it as `Out[1]`:
                 $ ipython
                 Python 2.7.2+ (default, Oct  4 2011, 20:03:08)
                 Type "copyright", "credits" or "license" for more information.
                 IPython 0.13.dev -- An enhanced Interactive Python.
                 ?         -> Introduction and overview of IPython's features.
                 %quickref -> Quick reference.
                 help      -> Python's own help system.
                 object?   -> Details about 'object', use 'object??' for extra details.
                 In [1]: 2**64
                 Out[1]: 18446744073709551616L
             The first thing you should know about IPython is that all your inputs and outputs are saved. There are two variables named `In` and `Out` which are filled as you work with your results.  Furthermore, all outputs are also saved to auto-created variables of the form `_NN` where `NN` is the prompt number, and inputs to `_iNN`.  This allows you to recover quickly the result of a prior computation by referring to its number even if you forgot to store it as a variable.  For example, later on in the above session you can do:
                 In [6]: print _1
                 18446744073709551616
             We strongly recommend that you take a few minutes to read at least the basic introduction provided by the `?` command, and keep in mind that the `%quickref` command at all times can be used as a quick reference "cheat sheet" of the most frequently used features of IPython.
             At the IPython prompt, any valid Python code that you type will be executed similarly to the default Python shell (though often with more informative feedback).  But IPython is a *superset* of the default Python shell; let's have a brief look at some of its additional functionality.
             **Object introspection**
             A simple `?` command provides a general introduction to IPython, but as indicated in the banner above, you can use the `?` syntax to ask for details about any object.  For example, if we type `_1?`, IPython will print the following details about this variable:
                 In [14]: _1?
                 Type:       long
                 Base Class: <type 'long'>
                 String Form:18446744073709551616
                 Namespace:  Interactive
                 Docstring:
                 long(x[, base]) -> integer
                 Convert a string or number to a long integer, if possible.  A floating
                 [etc... snipped for brevity]
             If you add a second `?` and for any object `x` type `x??`, IPython will try to provide an even more detailed analysis of the object, including its syntax-highlighted source code when it can be found.  It's possible that `x??` returns the same information as `x?`, but in many cases `x??` will indeed provide additional details.
             Finally, the `?` syntax is also useful to search *namespaces* with wildcards.  Suppose you are wondering if there is any function in Numpy that may do text-related things; with `np.*txt*?`, IPython will print all the names in the `np` namespace (our Numpy shorthand) that have 'txt' anywhere in their name:
                 In [17]: np.*txt*?
                 np.genfromtxt
                 np.loadtxt
                 np.mafromtxt
                 np.ndfromtxt
                 np.recfromtxt
                 np.savetxt
             **Tab completion**
             IPython makes the tab key work extra hard for you as a way to rapidly inspect objects and libraries.  Whenever you have typed something at the prompt, by hitting the `<tab>` key IPython will try to complete the rest of the line.  For this, IPython will analyze the text you had so far and try to search for Python data or files that may match the context you have already provided.
             For example, if you type `np.load` and hit the `<tab>` key, you'll see:
                 In [21]: np.load<TAB HERE>
                 np.load     np.loads    np.loadtxt
             so you can quickly find all the load-related functionality in numpy.  Tab completion works even for function arguments, for example consider this function definition:
                 In [20]: def f(x, frobinate=False):
                    ....:     if frobinate:
                    ....:         return x**2
                    ....:
             If you now use the `<tab>` key after having typed 'fro' you'll get all valid Python completions, but those marked with `=` at the end are known to be keywords of your function:
                 In [21]: f(2, fro<TAB HERE>
                 frobinate=    frombuffer    fromfunction  frompyfunc    fromstring
                 from          fromfile      fromiter      fromregex     frozenset
             at this point you can add the `b` letter and hit `<tab>` once more, and IPython will finish the line for you:
                 In [21]: f(2, frobinate=
             As a beginner, simply get into the habit of using `<tab>` after most objects; it should quickly become second nature as you will see how it helps keep a fluid workflow and discover useful information.  Later on you can also customize this behavior by writing your own completion code, if you so desire.
             **Matplotlib integration**
             One of the most useful features of IPython for scientists is its tight integration with matplotlib: at the terminal IPython lets you open matplotlib figures without blocking your typing (which is what happens if you try to do the same thing at the default Python shell), and in the Qt console and notebook you can even view your figures embedded in your workspace next to the code that created them.
             The matplotlib support can be either activated when you start IPython by passing the `--pylab` flag, or at any point later in your session by using the `%pylab` command.  If you start IPython with `--pylab`, you'll see something like this (note the extra message about pylab):
                 $ ipython --pylab
                 Python 2.7.2+ (default, Oct  4 2011, 20:03:08)
                 Type "copyright", "credits" or "license" for more information.
                 IPython 0.13.dev -- An enhanced Interactive Python.
                 ?         -> Introduction and overview of IPython's features.
                 %quickref -> Quick reference.
                 help      -> Python's own help system.
                 object?   -> Details about 'object', use 'object??' for extra details.
                 Welcome to pylab, a matplotlib-based Python environment [backend: Qt4Agg].
                 For more information, type 'help(pylab)'.
                 In [1]:
             Furthermore, IPython will import `numpy` with the `np` shorthand, `matplotlib.pyplot` as `plt`, and it will also load all of the numpy and pyplot top-level names so that you can directly type something like:
                 In [1]: x = linspace(0, 2*pi, 200)
                 In [2]: plot(x, sin(x))
                 Out[2]: [<matplotlib.lines.Line2D at 0x9e7c16c>]
             instead of having to prefix each call with its full signature (as we have been doing in the examples thus far):
                 In [3]: x = np.linspace(0, 2*np.pi, 200)
                 In [4]: plt.plot(x, np.sin(x))
                 Out[4]: [<matplotlib.lines.Line2D at 0x9e900ac>]
             This shorthand notation can be a huge time-saver when working interactively (it's a few characters but you are likely to type them hundreds of times in a session).  But we should note that as you develop persistent scripts and notebooks meant for reuse, it's best to get in the habit of using the longer notation (known as *fully qualified names*), as it's clearer where things come from and it makes for more robust, readable and maintainable code in the long run.
             **Access to the operating system and files**
             In IPython, you can type `ls` to see your files or `cd` to change directories, just like you would at a regular system prompt:
                 In [2]: cd tests
                 /home/fperez/ipython/nbconvert/tests
                 In [3]: ls test.*
                 test.aux  test.html  test.ipynb  test.log  test.out  test.pdf  test.rst  test.tex
             Furthermore, if you use the `!` at the beginning of a line, any commands you pass afterwards go directly to the operating system:
                 In [4]: !echo "Hello IPython"
                 Hello IPython
             IPython offers a useful twist in this feature: it will substitute in the command the value of any *Python* variable you may have if you prepend it with a `$` sign:
                 In [5]: message = 'IPython interpolates from Python to the shell'
                 In [6]: !echo $message
                 IPython interpolates from Python to the shell
             This feature can be extremely useful, as it lets you combine the power and clarity of Python for complex logic with the immediacy and familiarity of many shell commands.  Additionally, if you start the line with *two* `!` signs (`!!`), the output of the command will be automatically captured as a list of lines, e.g.:
                 In [10]: !!ls test.*
                 Out[10]:
                 ['test.aux',
                  'test.html',
                  'test.ipynb',
                  'test.log',
                  'test.out',
                  'test.pdf',
                  'test.rst',
                  'test.tex']
             As explained above, you can now use this as the variable `_10`.  If you directly want to capture the output of a system command to a Python variable, you can use the syntax `=!`:
                 In [11]: testfiles =! ls test.*
                 In [12]: print testfiles
                 ['test.aux', 'test.html', 'test.ipynb', 'test.log', 'test.out', 'test.pdf', 'test.rst', 'test.tex']
             Finally, the special `%alias` command lets you define names that are shorthands for system commands, so that you can type them without having to prefix them via `!` explicitly (for example, `ls` is an alias that has been predefined for you at startup).
             **Magic commands**
             IPython has a system for special commands, called 'magics', that let you control IPython itself and perform many common tasks with a more shell-like syntax: it uses spaces for delimiting arguments, flags can be set with dashes and all arguments are treated as strings, so no additional quoting is required.  This kind of syntax is invalid in the Python language but very convenient for interactive typing (fewer parentheses, commas and quoting everywhere); IPython distinguishes the two by detecting lines that start with the `%` character.
             You can learn more about the magic system by simply typing `%magic` at the prompt, which will give you a short description plus the documentation on *all* available magics.  If you want to see only a listing of existing magics, you can use `%lsmagic`:
                 In [4]: lsmagic
                 Available magic functions:
                 %alias  %autocall  %autoindent  %automagic  %bookmark  %c  %cd  %colors  %config  %cpaste
                 %debug  %dhist  %dirs  %doctest_mode  %ds  %ed  %edit  %env  %gui  %hist  %history
                 %install_default_config  %install_ext  %install_profiles  %load_ext  %loadpy  %logoff  %logon
                 %logstart  %logstate  %logstop  %lsmagic  %macro  %magic  %notebook  %page  %paste  %pastebin
                 %pd  %pdb  %pdef  %pdoc  %pfile  %pinfo  %pinfo2  %pop  %popd  %pprint  %precision  %profile
                 %prun  %psearch  %psource  %pushd  %pwd  %pycat  %pylab  %quickref  %recall  %rehashx
                 %reload_ext  %rep  %rerun  %reset  %reset_selective  %run  %save  %sc  %stop  %store  %sx  %tb
                 %time  %timeit  %unalias  %unload_ext  %who  %who_ls  %whos  %xdel  %xmode
                 Automagic is ON, % prefix NOT needed for magic functions.
             Note how the example above omitted the explicit `%` marker and simply uses `lsmagic`.  As long as the 'automagic' feature is on (which it is by default), you can omit the `%` marker as long as there is no ambiguity with a Python variable of the same name.
             **Running your code**
             While it's easy to type a few lines of code in IPython, for any long-lived work you should keep your codes in Python scripts (or in IPython notebooks, see below).  Consider that you have a script, in this case trivially simple for the sake of brevity, named `simple.py`:
                 In [12]: !cat simple.py
                 import numpy as np
                 x = np.random.normal(size=100)
                 print 'First elment of x:', x[0]
             The typical workflow with IPython is to use the `%run` magic to execute your script (you can omit the .py extension if you want).  When you run it, the script will execute just as if it had been run at the system prompt with `python simple.py` (though since modules don't get re-executed on new imports by Python, all system initialization is essentially free, which can have a significant run time impact in some cases):
                 In [13]: run simple
                 First elment of x: -1.55872256289
             Once it completes, all variables defined in it become available for you to use interactively:
                 In [14]: x.shape
                 Out[14]: (100,)
             This allows you to plot data, try out ideas, etc, in a `%run`/interact/edit cycle that can be very productive.  As you start understanding your problem better you can refine your script further, incrementally improving it based on the work you do at the IPython prompt.  At any point you can use the `%hist` magic to print out your history without prompts, so that you can copy useful fragments back into the script.
             By default, `%run` executes scripts in a completely empty namespace, to better mimic how they would execute at the system prompt with plain Python.  But if you use the `-i` flag, the script will also see your interactively defined variables.  This lets you edit in a script larger amounts of code that still behave as if you had typed them at the IPython prompt.
             You can also get a summary of the time taken by your script with the `-t` flag; consider a different script `randsvd.py` that takes a bit longer to run:
                 In [21]: run -t randsvd.py
                 IPython CPU timings (estimated):
                   User   :       0.38 s.
                   System :       0.04 s.
                 Wall time:       0.34 s.
             `User` is the time spent by the computer executing your code, while `System` is the time the operating system had to work on your behalf, doing things like memory allocation that are needed by your code but that you didn't explicitly program and that happen inside the kernel.  The `Wall time` is the time on a 'clock on the wall' between the start and end of your program.
             If `Wall > User+System`, your code is most likely waiting idle for certain periods.  That could be waiting for data to arrive from a remote source or perhaps because the operating system has to swap large amounts of virtual memory.  If you know that your code doesn't explicitly wait for remote data to arrive, you should investigate further to identify possible ways of improving the performance profile.
             If you only want to time how long a single statement takes, you don't need to put it into a script as you can use the `%timeit` magic, which uses Python's `timeit` module to very carefully measure timing data; `timeit` can measure even short statements that execute extremely fast:
                 In [27]: %timeit a=1
                 10000000 loops, best of 3: 23 ns per loop
             and for code that runs longer, it automatically adjusts so the overall measurement doesn't take too long:
                 In [28]: %timeit np.linalg.svd(x)
                 1 loops, best of 3: 310 ms per loop
             The `%run` magic still has more options for debugging and profiling data; you should read its documentation for many useful details (as always, just type `%run?`).
             ## The graphical Qt console
             If you type at the system prompt (see the IPython website for installation details, as this requires some additional libraries):
                 $ ipython qtconsole
             instead of opening in a terminal as before, IPython will start a graphical console that at first sight appears just like a terminal, but which is in fact much more capable than a text-only terminal.  This is a specialized terminal designed for interactive scientific work, and it supports full multi-line editing with color highlighting and graphical calltips for functions, it can keep multiple IPython sessions open simultaneously in tabs, and when scripts run it can display the figures inline directly in the work area.
             <center><img src="ipython_qtconsole2.png" width=400px></center>
             % This cell is for the pdflatex output only
             \begin{figure}[htbp]
             \centering
             \includegraphics[width=3in]{ipython_qtconsole2.png}
             \caption{The IPython Qt console: a lightweight terminal for scientific exploration, with code, results and graphics in a single environment.}
             \end{figure}
             The Qt console accepts the same `--pylab` startup flags as the terminal, but you can additionally supply the value `--pylab inline`, which enables the support for inline graphics shown in the figure.  This is ideal for keeping all the code and figures in the same session, given that the console can save the output of your entire session to HTML or PDF.
             Since the Qt console makes it far more convenient than the terminal to edit blocks of code with multiple lines, in this environment it's worth knowing about the `%loadpy` magic function.  `%loadpy` takes a path to a local file or remote URL, fetches its contents, and puts it in the work area for you to further edit and execute.  It can be an extremely fast and convenient way of loading code from local disk or remote examples from sites such as the [Matplotlib gallery](http://matplotlib.sourceforge.net/gallery.html).
             Other than its enhanced capabilities for code and graphics, all of the features of IPython we've explained before remain functional in this graphical console.
             ## The IPython Notebook
             The third way to interact with IPython, in addition to the terminal and graphical Qt console, is a powerful web interface called the "IPython Notebook".  If you run at the system console (you can omit the `pylab` flags if you don't need plotting support):
                 $ ipython notebook --pylab inline
             IPython will start a process that runs a web server in your local machine and to which a web browser can connect.  The Notebook is a workspace that lets you execute code in blocks called 'cells' and displays any results and figures, but which can also contain arbitrary text (including LaTeX-formatted mathematical expressions) and any rich media that a modern web browser is capable of displaying.
             <center><img src="ipython-notebook-specgram-2.png" width=400px></center>
             % This cell is for the pdflatex output only
             \begin{figure}[htbp]
             \centering
             \includegraphics[width=3in]{ipython-notebook-specgram-2.png}
             \caption{The IPython Notebook: text, equations, code, results, graphics and other multimedia in an open format for scientific exploration and collaboration}
             \end{figure}
             In fact, this document was written as a Notebook, and only exported to LaTeX for printing.  Inside of each cell, all the features of IPython that we have discussed before remain functional, since ultimately this web client is communicating with the same IPython code that runs in the terminal.  But this interface is a much richer and more powerful environment for maintaining long-term "live and executable" scientific documents.
             Notebook environments have existed in commercial systems like Mathematica(TM) and Maple(TM) for a long time; in the open source world the [Sage](http://sagemath.org) project blazed this particular trail starting in 2006, and now we bring all the features that have made IPython such a widely used tool to a Notebook model.
             Since the Notebook runs as a web application, it is possible to configure it for remote access, letting you run your computations on a persistent server close to your data, which you can then access remotely from any browser-equipped computer.  We encourage you to read the extensive documentation provided by the IPython project for details on how to do this and many more features of the notebook.
             Finally, as we said earlier, IPython also has a high-level and easy to use set of libraries for parallel computing, that let you control (interactively if desired) not just one IPython but an entire cluster of 'IPython engines'.   Unfortunately a detailed discussion of these tools is beyond the scope of this text, but should you need to parallelize your analysis codes, a quick read of the tutorials and examples provided at the IPython site may prove fruitful.

tests/ipynbref/IntroNumPy.orig.py

0 +10 -10

             ## An Introduction to the Scientific Python Ecosystem
             # While the Python language is an excellent tool for general-purpose programming, with a highly readable syntax, rich and powerful data types (strings, lists, sets, dictionaries, arbitrary length integers, etc) and a very comprehensive standard library, it was not designed specifically for mathematical and scientific computing.  Neither the language nor its standard library have facilities for the efficient representation of multidimensional datasets, tools for linear algebra and general matrix manipulations (an essential building block of virtually all technical computing), nor any data visualization facilities.
             #
             # In particular, Python lists are very flexible containers that can be nested arbitrarily deep and which can hold any Python object in them, but they are poorly suited to represent efficiently common mathematical constructs like vectors and matrices.  In contrast, much of our modern heritage of scientific computing has been built on top of libraries written in the Fortran language, which has native support for vectors and matrices as well as a library of mathematical functions that can efficiently operate on entire arrays at once.
             ### Scientific Python: a collaboration of projects built by scientists
             # The scientific community has developed a set of related Python libraries that provide powerful array facilities, linear algebra, numerical algorithms, data visualization and more.  In this appendix, we will briefly outline the tools most frequently used for this purpose, that make "Scientific Python" something far more powerful than the Python language alone.
             #
             # For reasons of space, we can only describe in some detail the central Numpy library, but below we provide links to the websites of each project where you can read their documentation in more detail.
             #
             # First, let's look at an overview of the basic tools that most scientists use in daily research with Python.  The core of this ecosystem is composed of:
             #
             # * Numpy: the basic library that most others depend on, it provides a powerful array type that can represent multidimensional datasets of many different kinds and that supports arithmetic operations. Numpy also provides a library of common mathematical functions, basic linear algebra, random number generation and Fast Fourier Transforms.  Numpy can be found at [numpy.scipy.org](http://numpy.scipy.org)
             #
             # * Scipy: a large collection of numerical algorithms that operate on numpy arrays and provide facilities for many common tasks in scientific computing, including dense and sparse linear algebra support, optimization, special functions, statistics, n-dimensional image processing, signal processing and more. Scipy can be found at [scipy.org](http://scipy.org).
             #
             # * Matplotlib: a data visualization library with a strong focus on producing high-quality output, it supports a variety of common scientific plot types in two and three dimensions, with precise control over the final output and format for publication-quality results.  Matplotlib can also be controlled interactively allowing graphical manipulation of your data (zooming, panning, etc) and can be used with most modern user interface toolkits.  It can be found at [matplotlib.sf.net](http://matplotlib.sf.net).
             #
             # * IPython: while not strictly scientific in nature, IPython is the interactive environment in which many scientists spend their time.  IPython provides a powerful Python shell that integrates tightly with Matplotlib and with easy access to the files and operating system, and which can execute in a terminal or in a graphical Qt console. IPython also has a web-based notebook interface that can combine code with text, mathematical expressions, figures and multimedia.  It can be found at [ipython.org](http://ipython.org).
             #
             # While each of these tools can be installed separately, in our opinion the most convenient way today of accessing them (especially on Windows and Mac computers) is to install the [Free Edition of the Enthought Python Distribution](http://www.enthought.com/products/epd_free.php) which contains all the above.  Other free alternatives on Windows (but not on Macs) are [Python(x,y)](http://code.google.com/p/pythonxy) and [Christoph Gohlke's packages page](http://www.lfd.uci.edu/~gohlke/pythonlibs).
             #
             # These four 'core' libraries are in practice complemented by a number of other tools for more specialized work.  We will briefly list here the ones that we think are the most commonly needed:
             #
             # * Sympy: a symbolic manipulation tool that turns a Python session into a computer algebra system.  It integrates with the IPython notebook, rendering results in properly typeset mathematical notation.  [sympy.org](http://sympy.org).
             #
             # * Mayavi: sophisticated 3d data visualization; [code.enthought.com/projects/mayavi](http://code.enthought.com/projects/mayavi).
             #
             # * Cython: a bridge language between Python and C, useful both to optimize performance bottlenecks in Python and to access C libraries directly; [cython.org](http://cython.org).
             #
             # * Pandas: high-performance data structures and data analysis tools, with powerful data alignment and structural manipulation capabilities; [pandas.pydata.org](http://pandas.pydata.org).
             #
             # * Statsmodels: statistical data exploration and model estimation; [statsmodels.sourceforge.net](http://statsmodels.sourceforge.net).
             #
             # * Scikit-learn: general purpose machine learning algorithms with a common interface; [scikit-learn.org](http://scikit-learn.org).
             #
             # * Scikits-image: image processing toolbox; [scikits-image.org](http://scikits-image.org).
             #
             # * NetworkX: analysis of complex networks (in the graph theoretical sense); [networkx.lanl.gov](http://networkx.lanl.gov).
             #
             # * PyTables: management of hierarchical datasets using the industry-standard HDF5 format; [www.pytables.org](http://www.pytables.org).
             #
             # Beyond these, for any specific problem you should look on the internet first, before starting to write code from scratch.  There's a good chance that someone, somewhere, has written an open source library that you can use for part or all of your problem.
             ### A note about the examples below
             # In all subsequent examples, you will see blocks of input code, followed by the results of the code if the code generated output.  This output may include text, graphics and other result objects.  These blocks of input can be pasted into your interactive IPython session or notebook for you to execute.  In the print version of this document, a thin vertical bar on the left of the blocks of input and output shows which blocks go together.
             #
             # If you are reading this text as an actual IPython notebook, you can press `Shift-Enter` or use the 'play' button on the toolbar (right-pointing triangle) to execute each block of code, known as a 'cell' in IPython:
             # In[71]:
             # This is a block of code, below you'll see its output
             print "Welcome to the world of scientific computing with Python!"
             # Out[71]:
             #     Welcome to the world of scientific computing with Python!
             #
             ## Motivation: the trapezoidal rule
             # In subsequent sections we'll provide a basic introduction to the nuts and bolts of the basic scientific python tools; but we'll first motivate it with a brief example that illustrates what you can do in a few lines with these tools.  For this, we will use the simple problem of approximating a definite integral with the trapezoid rule:
             #
             # $$
             # \int_{a}^{b} f(x)\, dx \approx \frac{1}{2} \sum_{k=1}^{N} \left( x_{k} - x_{k-1} \right) \left( f(x_{k}) + f(x_{k-1}) \right).
             # $$
             #
             # Our task will be to compute this formula for a function such as:
             #
             # $$
             # f(x) = (x-3)(x-5)(x-7)+85
             # $$
             #
             # integrated between $a=1$ and $b=9$.
             #
             # First, we define the function and sample it evenly between 0 and 10 at 200 points:
             # In[1]:
             def f(x):
                 """Return the cubic (x-3)(x-5)(x-7) + 85; works on scalars or NumPy arrays."""
                 return (x-3)*(x-5)*(x-7)+85
             import numpy as np
             x = np.linspace(0, 10, 200)
             y = f(x)
             # We select $a$ and $b$, our integration limits, and we take only a few points in that region to illustrate the error behavior of the trapezoid approximation:
             # In[2]:
             a, b = 1, 9
             # Use the namespaced np.logical_and: the bare name only exists in a
             # pylab session and raises NameError when this file runs as a script.
             # The mask is built once and shared so xint and yint stay aligned.
             in_range = np.logical_and(x>=a, x<=b)
             xint = x[in_range][::30]
             yint = y[in_range][::30]
             # Let's plot both the function and the area below it in the trapezoid approximation:
             # In[3]:
             import matplotlib.pyplot as plt
             plt.plot(x, y, lw=2)
             plt.axis([0, 10, 0, 140])
             plt.fill_between(xint, 0, yint, facecolor='gray', alpha=0.4)
             plt.text(0.5 * (a + b), 30,r"$\int_a^b f(x)dx$", horizontalalignment='center', fontsize=20);
             # Out[3]:
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_00.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_00.svg
             # Compute the integral both at high accuracy and with the trapezoid approximation
             # In[4]:
             from scipy.integrate import quad, trapz
             integral, error = quad(f, 1, 9)
             trap_integral = trapz(yint, xint)
             print "The integral is: %g +/- %.1e" % (integral, error)
             print "The trapezoid approximation with", len(xint), "points is:", trap_integral
             print "The absolute error is:", abs(integral - trap_integral)
             # Out[4]:
             #     The integral is: 680 +/- 7.5e-12
             #     The trapezoid approximation with 6 points is: 621.286411141
             #     The absolute error is: 58.7135888589
             #
             # This simple example showed us how, combining the numpy, scipy and matplotlib libraries we can provide an illustration of a standard method in elementary calculus with just a few lines of code.  We will now discuss with more detail the basic usage of these tools.
             ## NumPy arrays: the right data structure for scientific computing
             ### Basics of Numpy arrays
             # We now turn our attention to the Numpy library, which forms the base layer for the entire 'scipy ecosystem'.  Once you have installed numpy, you can import it as
             # In[5]:
             import numpy
             # though in this book we will use the common shorthand
             # In[6]:
             import numpy as np
             # As mentioned above, the main object provided by numpy is a powerful array.  We'll start by exploring how the numpy array differs from Python lists.  We start by creating a simple list and an array with the same contents of the list:
             # In[7]:
             lst = [10, 20, 30, 40]
             arr = np.array([10, 20, 30, 40])
             # Elements of a one-dimensional array are accessed with the same syntax as a list:
             # In[8]:
             lst[0]
             # Out[8]:
             #     10
             # In[9]:
             arr[0]
             # Out[9]:
             #     10
             # In[10]:
             arr[-1]
             # Out[10]:
             #     40
             # In[11]:
             arr[2:]
             # Out[11]:
             #     array([30, 40])
             # The first difference to note between lists and arrays is that arrays are *homogeneous*; i.e. all elements of an array must be of the same type.  In contrast, lists can contain elements of arbitrary type. For example, we can change the last element in our list above to be a string:
             # In[12]:
             lst[-1] = 'a string inside a list'
             lst
             # Out[12]:
             #     [10, 20, 30, 'a string inside a list']
             # but the same can not be done with an array, as we get an error message:
             # In[13]:
             arr[-1] = 'a string inside an array'
             # Out[13]:
             #     ---------------------------------------------------------------------------
             #     ValueError                                Traceback (most recent call last)
             #     /home/fperez/teach/book-math-labtool/<ipython-input-13-29c0bfa5fa8a> in <module>()
             #     ----> 1 arr[-1] = 'a string inside an array'
             #     ValueError: invalid literal for long() with base 10: 'a string inside an array'
             # The information about the type of an array is contained in its *dtype* attribute:
             # In[14]:
             arr.dtype
             # Out[14]:
             #     dtype('int32')
             # Once an array has been created, its dtype is fixed and it can only store elements of the same type.  For this example where the dtype is integer, if we store a floating point number it will be automatically converted into an integer:
             # In[15]:
             arr[-1] = 1.234
             arr
             # Out[15]:
             #     array([10, 20, 30,  1])
             # Above we created an array from an existing list; now let us see other ways in which we can create arrays, which we'll illustrate next.  A common need is to have an array initialized with a constant value, and very often this value is 0 or 1 (suitable as starting value for additive and multiplicative loops respectively); `zeros` creates arrays of all zeros, with any desired dtype:
             # In[16]:
             np.zeros(5, float)
             # Out[16]:
             #     array([ 0.,  0.,  0.,  0.,  0.])
             # In[17]:
             np.zeros(3, int)
             # Out[17]:
             #     array([0, 0, 0])
             # In[18]:
             np.zeros(3, complex)
             # Out[18]:
             #     array([ 0.+0.j,  0.+0.j,  0.+0.j])
             # and similarly for `ones`:
             # In[19]:
             print '5 ones:', np.ones(5)
             # Out[19]:
             #     5 ones: [ 1.  1.  1.  1.  1.]
             #
             # If we want an array initialized with an arbitrary value, we can create an empty array and then use the fill method to put the value we want into the array:
             # In[20]:
             # np.empty is called through its namespace: the bare `empty` only exists
             # in a pylab session and raises NameError in a plain script.  The array
             # starts uninitialized, so fill() must run before the values are read.
             a = np.empty(4)
             a.fill(5.5)
             a
             # Out[20]:
             #     array([ 5.5,  5.5,  5.5,  5.5])
             # Numpy also offers the `arange` function, which works like the builtin `range` but returns an array instead of a list:
             # In[21]:
             np.arange(5)
             # Out[21]:
             #     array([0, 1, 2, 3, 4])
             # and the `linspace` and `logspace` functions to create linearly and logarithmically-spaced grids respectively, with a fixed number of points and including both ends of the specified interval:
             # In[22]:
             print "A linear grid between 0 and 1:", np.linspace(0, 1, 5)
             print "A logarithmic grid between 10**1 and 10**4: ", np.logspace(1, 4, 4)
             # Out[22]:
             #     A linear grid between 0 and 1: [ 0.    0.25  0.5   0.75  1.  ]
             #     A logarithmic grid between 10**1 and 10**4:  [    10.    100.   1000.  10000.]
             #
             # Finally, it is often useful to create arrays with random numbers that follow a specific distribution.  The `np.random` module contains a number of functions that can be used to this effect, for example this will produce an array of 5 random samples taken from a standard normal distribution (0 mean and variance 1):
             # In[23]:
             np.random.randn(5)
             # Out[23]:
             #     array([-0.08633343, -0.67375434,  1.00589536,  0.87081651,  1.65597822])
             # whereas this will also give 5 samples, but from a normal distribution with a mean of 10 and a variance of 3:
             # In[24]:
             norm10 = np.random.normal(10, 3, 5)
             norm10
             # Out[24]:
             #     array([  8.94879575,   5.53038269,   8.24847281,  12.14944165,  11.56209294])
             ### Indexing with other arrays
             # Above we saw how to index arrays with single numbers and slices, just like Python lists.  But arrays allow for a more sophisticated kind of indexing which is very powerful: you can index an array with another array, and in particular with an array of boolean values.  This is particularly useful to extract information from an array that matches a certain condition.
             #
             # Consider for example that in the array `norm10` we want to replace all values above 9 with the value 0.  We can do so by first finding the *mask* that indicates where this condition is true or false:
             # In[25]:
             mask = norm10 > 9
             mask
             # Out[25]:
             #     array([False, False, False,  True,  True], dtype=bool)
             # Now that we have this mask, we can use it to either read those values or to reset them to 0:
             # In[26]:
             print 'Values above 9:', norm10[mask]
             # Out[26]:
             #     Values above 9: [ 12.14944165  11.56209294]
             #
             # In[27]:
             print 'Resetting all values above 9 to 0...'
             norm10[mask] = 0
             print norm10
             # Out[27]:
             #     Resetting all values above 9 to 0...
             #     [ 8.94879575  5.53038269  8.24847281  0.          0.        ]
             #
             ### Arrays with more than one dimension
             # Up until now all our examples have used one-dimensional arrays.  But Numpy can create arrays of arbitrary dimensions, and all the methods illustrated in the previous section work with more than one dimension.  For example, a list of lists can be used to initialize a two dimensional array:
             # In[28]:
             lst2 = [[1, 2], [3, 4]]
             arr2 = np.array([[1, 2], [3, 4]])
             arr2
             # Out[28]:
             #     array([[1, 2],
             #            [3, 4]])
             # With two-dimensional arrays we start seeing the power of numpy: while a nested list can be indexed using repeatedly the `[ ]` operator, multidimensional arrays support a much more natural indexing syntax with a single `[ ]` and a set of indices separated by commas:
             # In[29]:
             print lst2[0][1]
             print arr2[0,1]
             # Out[29]:
             #     2
             #     2
             #
             # Most of the array creation functions listed above can be used with more than one dimension, for example:
             # In[30]:
             np.zeros((2,3))
             # Out[30]:
             #     array([[ 0.,  0.,  0.],
             #            [ 0.,  0.,  0.]])
             # In[31]:
             np.random.normal(10, 3, (2, 4))
             # Out[31]:
             #     array([[ 11.26788826,   4.29619866,  11.09346496,   9.73861307],
             #            [ 10.54025996,   9.5146268 ,  10.80367214,  13.62204505]])
             # In fact, the shape of an array can be changed at any time, as long as the total number of elements is unchanged.  For example, if we want a 2x4 array with numbers increasing from 0, the easiest way to create it is:
             # In[32]:
             arr = np.arange(8).reshape(2,4)
             print arr
             # Out[32]:
             #     [[0 1 2 3]
             #      [4 5 6 7]]
             #
             # With multidimensional arrays, you can also use slices, and you can mix and match slices and single indices in the different dimensions (using the same array as above):
             # In[33]:
             print 'Slicing in the second row:', arr[1, 2:4]
             print 'All rows, third column   :', arr[:, 2]
             # Out[33]:
             #     Slicing in the second row: [6 7]
             #     All rows, third column   : [2 6]
             #
             # If you only provide one index, then you will get an array with one less dimension containing that row:
             # In[34]:
             print 'First row:  ', arr[0]
             print 'Second row: ', arr[1]
             # Out[34]:
             #     First row:   [0 1 2 3]
             #     Second row:  [4 5 6 7]
             #
             # Now that we have seen how to create arrays with more than one dimension, it's a good idea to look at some of the most useful properties and methods that arrays have.  The following provide basic information about the size, shape and data in the array:
             # In[35]:
             print 'Data type                :', arr.dtype
             print 'Total number of elements :', arr.size
             print 'Number of dimensions     :', arr.ndim
             print 'Shape (dimensionality)   :', arr.shape
             print 'Memory used (in bytes)   :', arr.nbytes
             # Out[35]:
             #     Data type                : int32
             #     Total number of elements : 8
             #     Number of dimensions     : 2
             #     Shape (dimensionality)   : (2, 4)
             #     Memory used (in bytes)   : 32
             #
             # Arrays also have many useful methods, some especially useful ones are:
             # In[36]:
             print 'Minimum and maximum             :', arr.min(), arr.max()
             print 'Sum and product of all elements :', arr.sum(), arr.prod()
             print 'Mean and standard deviation     :', arr.mean(), arr.std()
             # Out[36]:
             #     Minimum and maximum             : 0 7
             #     Sum and product of all elements : 28 0
             #     Mean and standard deviation     : 3.5 2.29128784748
             #
             # For these methods, the above operations are all computed on all the elements of the array.  But for a multidimensional array, it's possible to do the computation along a single dimension, by passing the `axis` parameter; for example:
             # In[37]:
             print 'For the following array:\n', arr
             print 'The sum of elements along the rows is    :', arr.sum(axis=1)
             print 'The sum of elements along the columns is :', arr.sum(axis=0)
             # Out[37]:
             #     For the following array:
             #     [[0 1 2 3]
             #      [4 5 6 7]]
             #     The sum of elements along the rows is    : [ 6 22]
             #     The sum of elements along the columns is : [ 4  6  8 10]
             #
             # As you can see in this example, the value of the `axis` parameter is the dimension which will be *consumed* once the operation has been carried out.  This is why to sum along the rows we use `axis=1`.
             #
             # This can be easily illustrated with an example that has more dimensions; we create an array with 4 dimensions and shape `(3,4,5,6)` and sum along the axis number 2 (i.e. the *third* axis, since in Python all counts are 0-based).  That consumes the dimension whose length was 5, leaving us with a new array that has shape `(3,4,6)`:
             # In[38]:
             np.zeros((3,4,5,6)).sum(2).shape
             # Out[38]:
             #     (3, 4, 6)
             # Another widely used property of arrays is the `.T` attribute, which allows you to access the transpose of the array:
             # In[39]:
             print 'Array:\n', arr
             print 'Transpose:\n', arr.T
             # Out[39]:
             #     Array:
             #     [[0 1 2 3]
             #      [4 5 6 7]]
             #     Transpose:
             #     [[0 4]
             #      [1 5]
             #      [2 6]
             #      [3 7]]
             #
             # We don't have time here to look at all the methods and properties of arrays, here's a complete list.  Simply try exploring some of these in IPython to learn more, or read their description in the full Numpy documentation:
             #
             #     arr.T             arr.copy          arr.getfield      arr.put           arr.squeeze
             #     arr.all           arr.ctypes        arr.imag          arr.ravel         arr.std
             #     arr.any           arr.cumprod       arr.item          arr.real          arr.strides
             #     arr.argmax        arr.cumsum        arr.itemset       arr.repeat        arr.sum
             #     arr.argmin        arr.data          arr.itemsize      arr.reshape       arr.swapaxes
             #     arr.argsort       arr.diagonal      arr.max           arr.resize        arr.take
             #     arr.astype        arr.dot           arr.mean          arr.round         arr.tofile
             #     arr.base          arr.dtype         arr.min           arr.searchsorted  arr.tolist
             #     arr.byteswap      arr.dump          arr.nbytes        arr.setasflat     arr.tostring
             #     arr.choose        arr.dumps         arr.ndim          arr.setfield      arr.trace
             #     arr.clip          arr.fill          arr.newbyteorder  arr.setflags      arr.transpose
             #     arr.compress      arr.flags         arr.nonzero       arr.shape         arr.var
             #     arr.conj          arr.flat          arr.prod          arr.size          arr.view
             #     arr.conjugate     arr.flatten       arr.ptp           arr.sort
             ### Operating with arrays
             # Arrays support all regular arithmetic operators, and the numpy library also contains a complete collection of basic mathematical functions that operate on arrays.  It is important to remember that in general, all operations with arrays are applied *element-wise*, i.e., are applied to all the elements of the array at the same time.  Consider for example:
             # In[40]:
             arr1 = np.arange(4)
             arr2 = np.arange(10, 14)
             print arr1, '+', arr2, '=', arr1+arr2
             # Out[40]:
             #     [0 1 2 3] + [10 11 12 13] = [10 12 14 16]
             #
             # Importantly, you must remember that even the multiplication operator is by default applied element-wise, it is *not* the matrix multiplication from linear algebra (as is the case in Matlab, for example):
             # In[41]:
             print arr1, '*', arr2, '=', arr1*arr2
             # Out[41]:
             #     [0 1 2 3] * [10 11 12 13] = [ 0 11 24 39]
             #
             # While this means that in principle arrays must always match in their dimensionality in order for an operation to be valid, numpy will *broadcast* dimensions when possible.  For example, suppose that you want to add the number 1.5 to `arr1`; the following would be a valid way to do it:
             # In[42]:
             arr1 + 1.5*np.ones(4)
             # Out[42]:
             #     array([ 1.5,  2.5,  3.5,  4.5])
             # But thanks to numpy's broadcasting rules, the following is equally valid:
             # In[43]:
             arr1 + 1.5
             # Out[43]:
             #     array([ 1.5,  2.5,  3.5,  4.5])
             # In this case, numpy looked at both operands and saw that the first (`arr1`) was a one-dimensional array of length 4 and the second was a scalar, considered a zero-dimensional object. The broadcasting rules allow numpy to:
             #
             # * *create* new dimensions of length 1 (since this doesn't change the size of the array)
             # * 'stretch' a dimension of length 1 that needs to be matched to a dimension of a different size.
             #
             # So in the above example, the scalar 1.5 is effectively:
             #
             # * first 'promoted' to a 1-dimensional array of length 1
             # * then, this array is 'stretched' to length 4 to match the dimension of `arr1`.
             #
             # After these two operations are complete, the addition can proceed as now both operands are one-dimensional arrays of length 4.
             #
             # This broadcasting behavior is in practice enormously powerful, especially because when numpy broadcasts to create new dimensions or to 'stretch' existing ones, it doesn't actually replicate the data.  In the example above the operation is carried out *as if* the 1.5 was a 1-d array with 1.5 in all of its entries, but no actual array was ever created.  This can save lots of memory in cases when the arrays in question are large and can have significant performance implications.
             #
             # The general rule is: when operating on two arrays, NumPy compares their shapes element-wise. It starts with the trailing dimensions, and works its way forward, creating dimensions of length 1 as needed. Two dimensions are considered compatible when
             #
             # * they are equal to begin with, or
             # * one of them is 1; in this case numpy will do the 'stretching' to make them equal.
             #
             # If these conditions are not met, a `ValueError: operands could not be broadcast together` exception is thrown, indicating that the arrays have incompatible shapes. The size of the resulting array is the maximum size along each dimension of the input arrays.
             # This shows how the broadcasting rules work in several dimensions:
             # In[44]:
             b = np.array([2, 3, 4, 5])
             print arr, '\n\n+', b , '\n----------------\n', arr + b
             # Out[44]:
             #     [[0 1 2 3]
             #      [4 5 6 7]]
             #
             #     + [2 3 4 5]
             #     ----------------
             #     [[ 2  4  6  8]
             #      [ 6  8 10 12]]
             #
             # Now, how could you use broadcasting to say add `[4, 6]` along the rows to `arr` above?  Simply performing the direct addition will produce the error we previously mentioned:
             # In[45]:
             c = np.array([4, 6])
             arr + c
             # Out[45]:
             #     ---------------------------------------------------------------------------
             #     ValueError                                Traceback (most recent call last)
             #     /home/fperez/teach/book-math-labtool/<ipython-input-45-62aa20ac1980> in <module>()
             #           1 c = np.array([4, 6])
             #     ----> 2 arr + c
             #     ValueError: operands could not be broadcast together with shapes (2,4) (2)
             # According to the rules above, the array `c` would need to have a *trailing* dimension of 1 for the broadcasting to work.  It turns out that numpy allows you to 'inject' new dimensions anywhere into an array on the fly, by indexing it with the special object `np.newaxis`:
             # In[46]:
             (c[:, np.newaxis]).shape
             # Out[46]:
             #     (2, 1)
             # This is exactly what we need, and indeed it works:
             # In[47]:
             arr + c[:, np.newaxis]
             # Out[47]:
             #     array([[ 4,  5,  6,  7],
             #            [10, 11, 12, 13]])
             # For the full broadcasting rules, please see the official Numpy docs, which describe them in detail and with more complex examples.
             # As we mentioned before, Numpy ships with a full complement of mathematical functions that work on entire arrays, including logarithms, exponentials, trigonometric and hyperbolic trigonometric functions, etc.  Furthermore, scipy ships a rich special function library in the `scipy.special` module that includes Bessel, Airy, Fresnel, Laguerre and other classical special functions.  For example, sampling the sine function at 100 points between $0$ and $2\pi$ is as simple as:
             # In[48]:
             x = np.linspace(0, 2*np.pi, 100)
             y = np.sin(x)
             ### Linear algebra in numpy
             # Numpy ships with a basic linear algebra library, and all arrays have a `dot` method whose behavior is that of the scalar dot product when its arguments are vectors (one-dimensional arrays) and the traditional matrix multiplication when one or both of its arguments are two-dimensional arrays:
             # In[49]:
             v1 = np.array([2, 3, 4])
             v2 = np.array([1, 0, 1])
             print v1, '.', v2, '=', v1.dot(v2)
             # Out[49]:
             #     [2 3 4] . [1 0 1] = 6
             #
             # Here is a regular matrix-vector multiplication, note that the array `v1` should be viewed as a *column* vector in traditional linear algebra notation; numpy makes no distinction between row and column vectors and simply verifies that the dimensions match the required rules of matrix multiplication, in this case we have a $2 \times 3$ matrix multiplied by a 3-vector, which produces a 2-vector:
             # In[50]:
             A = np.arange(6).reshape(2, 3)
             print A, 'x', v1, '=', A.dot(v1)
             # Out[50]:
             #     [[0 1 2]
             #      [3 4 5]] x [2 3 4] = [11 38]
             #
             # For matrix-matrix multiplication, the same dimension-matching rules must be satisfied, e.g. consider the difference between $A \times A^T$:
             # In[51]:
             print A.dot(A.T)
             # Out[51]:
             #     [[ 5 14]
             #      [14 50]]
             #
             # and $A^T \times A$:
             # In[52]:
             print A.T.dot(A)
             # Out[52]:
             #     [[ 9 12 15]
             #      [12 17 22]
             #      [15 22 29]]
             #
             # Furthermore, the `numpy.linalg` module includes additional functionality such as determinants, matrix norms, Cholesky, eigenvalue and singular value decompositions, etc.  For even more linear algebra tools, `scipy.linalg` contains the majority of the tools in the classic LAPACK libraries as well as functions to operate on sparse matrices.  We refer the reader to the Numpy and Scipy documentations for additional details on these.
             ### Reading and writing arrays to disk
             # Numpy lets you read and write arrays into files in a number of ways.  In order to use these tools well, it is critical to understand the difference between a *text* and a *binary* file containing numerical data.  In a text file, the number $\pi$ could be written as "3.141592653589793", for example: a string of digits that a human can read, with in this case 15 decimal digits.  In contrast, that same number written to a binary file would be encoded as 8 characters (bytes) that are not readable by a human but which contain the exact same data that the variable `pi` had in the computer's memory.
             #
             # The tradeoffs between the two modes are thus:
             #
             # * Text mode: occupies more space, precision can be lost (if not all digits are written to disk), but is readable and editable by hand with a text editor.  Can *only* be used for one- and two-dimensional arrays.
             #
             # * Binary mode: compact and exact representation of the data in memory, can't be read or edited by hand.  Arrays of any size and dimensionality can be saved and read without loss of information.
             #
             # First, let's see how to read and write arrays in text mode.  The `np.savetxt` function saves an array to a text file, with options to control the precision, separators and even adding a header:
             # In[53]:
             arr = np.arange(10).reshape(2, 5)
             np.savetxt('test.out', arr, fmt='%.2e', header="My dataset")
             !cat test.out
             # Out[53]:
             #     # My dataset
             #     0.00e+00 1.00e+00 2.00e+00 3.00e+00 4.00e+00
             #     5.00e+00 6.00e+00 7.00e+00 8.00e+00 9.00e+00
             #
             # And this same type of file can then be read with the matching `np.loadtxt` function:
             # In[54]:
             arr2 = np.loadtxt('test.out')
             print arr2
             # Out[54]:
             #     [[ 0.  1.  2.  3.  4.]
             #      [ 5.  6.  7.  8.  9.]]
             #
             # For binary data, Numpy provides the `np.save` and `np.savez` routines.  The first saves a single array to a file with `.npy` extension, while the latter can be used to save a *group* of arrays into a single file with `.npz` extension.  The files created with these routines can then be read with the `np.load` function.
             #
             # Let us first see how to use the simpler `np.save` function to save a single array:
             # In[55]:
             np.save('test.npy', arr2)
             # Now we read this back
             arr2n = np.load('test.npy')
             # Let's see if any element is non-zero in the difference.
             # A value of True would be a problem.
             print 'Any differences?', np.any(arr2-arr2n)
             # Out[55]:
             #     Any differences? False
             #
             # Now let us see how the `np.savez` function works.  You give it a filename and either a sequence of arrays or a set of keywords.  In the first mode, the function will automatically name the saved arrays in the archive as `arr_0`, `arr_1`, etc:
             # In[56]:
             np.savez('test.npz', arr, arr2)
             arrays = np.load('test.npz')
             arrays.files
             # Out[56]:
             #     ['arr_1', 'arr_0']
             # Alternatively, we can explicitly choose how to name the arrays we save:
             # In[57]:
             np.savez('test.npz', array1=arr, array2=arr2)
             arrays = np.load('test.npz')
             arrays.files
             # Out[57]:
             #     ['array2', 'array1']
             # The object returned by `np.load` from an `.npz` file works like a dictionary, though you can also access its constituent files by attribute using its special `.f` field; this is best illustrated with an example with the `arrays` object from above:
             # In[58]:
             print 'First row of first array:', arrays['array1'][0]
             # This is an equivalent way to get the same field
             print 'First row of first array:', arrays.f.array1[0]
             # Out[58]:
             #     First row of first array: [0 1 2 3 4]
             #     First row of first array: [0 1 2 3 4]
             #
             # This `.npz` format is a very convenient way to package compactly and without loss of information, into a single file, a group of related arrays that pertain to a specific problem.  At some point, however, the complexity of your dataset may be such that the optimal approach is to use one of the standard formats in scientific data processing that have been designed to handle complex datasets, such as NetCDF or HDF5.
             #
             # Fortunately, there are tools for manipulating these formats in Python, and for storing data in other ways such as databases.  A complete discussion of the possibilities is beyond the scope of this document, but of particular interest for scientific users we at least mention the following:
             #
             # * The `scipy.io` module contains routines to read and write Matlab files in `.mat` format and files in the NetCDF format that is widely used in certain scientific disciplines.
             #
             # * For manipulating files in the HDF5 format, there are two excellent options in Python: The PyTables project offers a high-level, object oriented approach to manipulating HDF5 datasets, while the h5py project offers a more direct mapping to the standard HDF5 library interface.  Both are excellent tools; if you need to work with HDF5 datasets you should read some of their documentation and examples and decide which approach is a better match for your needs.
             ## High quality data visualization with Matplotlib
             # The [matplotlib](http://matplotlib.sf.net) library is a powerful tool capable of producing complex publication-quality figures with fine layout control in two and three dimensions; here we will only provide a minimal self-contained introduction to its usage that covers the functionality needed for the rest of the book.  We encourage the reader to read the tutorials included with the matplotlib documentation as well as to browse its extensive gallery of examples that include source code.
             #
             # Just as we typically use the shorthand `np` for Numpy, we will use `plt` for the `matplotlib.pyplot` module where the easy-to-use plotting functions reside (the library contains a rich object-oriented architecture that we don't have the space to discuss here):
             # In[59]:
             import matplotlib.pyplot as plt
             # The most frequently used function is simply called `plot`, here is how you can make a simple plot of $\sin(x)$ for $x \in [0, 2\pi]$ with labels and a grid (we use the semicolon in the last line to suppress the display of some information that is unnecessary right now):
             # In[60]:
             x = np.linspace(0, 2*np.pi)
             y = np.sin(x)
             plt.plot(x,y, label='sin(x)')
             plt.legend()
             plt.grid()
             plt.title('Harmonic')
             plt.xlabel('x')
             plt.ylabel('y');
             # Out[60]:
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_01.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_01.svg
             # You can control the style, color and other properties of the markers, for example:
             # In[61]:
             plt.plot(x, y, linewidth=2);
             # Out[61]:
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_02.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_02.svg
             # In[62]:
             plt.plot(x, y, 'o', markersize=5, color='r');
             # Out[62]:
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_03.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_03.svg
             # We will now see how to create a few other common plot types, such as a simple error plot:
             # In[63]:
             # example data
             x = np.arange(0.1, 4, 0.5)
             y = np.exp(-x)
             # example variable error bar values
             yerr = 0.1 + 0.2*np.sqrt(x)
             xerr = 0.1 + yerr
             # First illustrate basic pyplot interface, using defaults where possible.
             plt.figure()
             plt.errorbar(x, y, xerr=0.2, yerr=0.4)
             plt.title("Simplest errorbars, 0.2 in x, 0.4 in y");
             # Out[63]:
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_04.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_04.svg
             # A simple log plot
             # In[64]:
             x = np.linspace(-5, 5)
             y = np.exp(-x**2)
             plt.semilogy(x, y);
             # Out[64]:
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_05.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_05.svg
             # A histogram annotated with text inside the plot, using the `text` function:
             # In[65]:
             mu, sigma = 100, 15
             x = mu + sigma * np.random.randn(10000)
             # the histogram of the data
             n, bins, patches = plt.hist(x, 50, normed=1, facecolor='g', alpha=0.75)
             plt.xlabel('Smarts')
             plt.ylabel('Probability')
             plt.title('Histogram of IQ')
             # This will put a text fragment at the position given:
             plt.text(55, .027, r'$\mu=100,\ \sigma=15$', fontsize=14)
             plt.axis([40, 160, 0, 0.03])
             plt.grid(True)
             # Out[65]:
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_06.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_06.svg
             ### Image display
             # The `imshow` command can display single or multi-channel images.  A simple array of random numbers, plotted in grayscale:
             # In[66]:
             from matplotlib import cm
             plt.imshow(np.random.rand(5, 10), cmap=cm.gray, interpolation='nearest');
             # Out[66]:
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_07.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_07.svg
             # A real photograph is a multichannel image, `imshow` interprets it correctly:
             # In[67]:
             img = plt.imread('stinkbug.png')
             print 'Dimensions of the array img:', img.shape
             plt.imshow(img);
             # Out[67]:
             #     Dimensions of the array img: (375, 500, 3)
             #
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_08.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_08.svg
             ### Simple 3d plotting with matplotlib
             # Note that you must execute at least once in your session:
             # In[68]:
             from mpl_toolkits.mplot3d import Axes3D
             # Once this has been done, you can create 3d axes with the `projection='3d'` keyword to `add_subplot`:
             #
             #     fig = plt.figure()
             #     fig.add_subplot(<other arguments here>, projection='3d')
             # A simple surface plot:
             # In[72]:
             from mpl_toolkits.mplot3d.axes3d import Axes3D
             from matplotlib import cm
             fig = plt.figure()
             ax = fig.add_subplot(1, 1, 1, projection='3d')
             X = np.arange(-5, 5, 0.25)
             Y = np.arange(-5, 5, 0.25)
             X, Y = np.meshgrid(X, Y)
             R = np.sqrt(X**2 + Y**2)
             Z = np.sin(R)
             surf = ax.plot_surface(X, Y, Z, rstride=1, cstride=1, cmap=cm.jet,
                     linewidth=0, antialiased=False)
             ax.set_zlim3d(-1.01, 1.01);
             # Out[72]:
-            # image file: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_09.svg
+            # image file: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_09.svg
             ## IPython: a powerful interactive environment
             # A key component of the everyday workflow of most scientific computing environments is a good interactive environment, that is, a system in which you can execute small amounts of code and view the results immediately, combining both printing out data and opening graphical visualizations.  All modern systems for scientific computing, commercial and open source, include such functionality.
             #
             # Out of the box, Python also offers a simple interactive shell with very limited capabilities.  But just like the scientific community built Numpy to provide arrays suited for scientific work (since Python's lists aren't optimal for this task), it has also developed an interactive environment much more sophisticated than the built-in one.  The [IPython project](http://ipython.org) offers a set of tools to make productive use of the Python language, all the while working interactively and with immediate feedback on your results.  The basic tools that IPython provides are:
             #
             # 1. A powerful terminal shell, with many features designed to increase the fluidity and productivity of everyday scientific workflows, including:
             #
             #     * rich introspection of all objects and variables including easy access to the source code of any function
             #     * powerful and extensible tab completion of variables and filenames,
             #     * tight integration with matplotlib, supporting interactive figures that don't block the terminal,
             #     * direct access to the filesystem and underlying operating system,
             #     * an extensible system for shell-like commands called 'magics' that reduce the work needed to perform many common tasks,
             #     * tools for easily running, timing, profiling and debugging your codes,
             #     * syntax highlighted error messages with much more detail than the default Python ones,
             #     * logging and access to all previous history of inputs, including across sessions
             #
             # 2. A Qt console that provides the look and feel of a terminal, but adds support for inline figures, graphical calltips, a persistent session that can survive crashes (even segfaults) of the kernel process, and more.
             #
             # 3. A web-based notebook that can execute code and also contain rich text and figures, mathematical equations and arbitrary HTML. This notebook presents a document-like view with cells where code is executed but that can be edited in-place, reordered, mixed with explanatory text and figures, etc.
             #
             # 4. A high-performance, low-latency system for parallel computing that supports the control of a cluster of IPython engines communicating over a network, with optimizations that minimize unnecessary copying of large objects (especially numpy arrays).
             #
             # We will now discuss the highlights of the tools 1-3 above so that you can make them an effective part of your workflow.  The topic of parallel computing is beyond the scope of this document, but we encourage you to read the extensive [documentation](http://ipython.org/ipython-doc/rel-0.12.1/parallel/index.html) and [tutorials](http://minrk.github.com/scipy-tutorial-2011/) on this available on the IPython website.
             ### The IPython terminal
             # You can start IPython at the terminal simply by typing:
             #
             #     $ ipython
             #
             # which will provide you some basic information about how to get started and will then open a prompt labeled `In [1]:` for you to start typing.  Here we type $2^{64}$ and Python computes the result for us in exact arithmetic, returning it as `Out[1]`:
             #
             #     $ ipython
             #     Python 2.7.2+ (default, Oct  4 2011, 20:03:08)
             #     Type "copyright", "credits" or "license" for more information.
             #
             #     IPython 0.13.dev -- An enhanced Interactive Python.
             #     ?         -> Introduction and overview of IPython's features.
             #     %quickref -> Quick reference.
             #     help      -> Python's own help system.
             #     object?   -> Details about 'object', use 'object??' for extra details.
             #
             #     In [1]: 2**64
             #     Out[1]: 18446744073709551616L
             #
             # The first thing you should know about IPython is that all your inputs and outputs are saved. There are two variables named `In` and `Out` which are filled as you work with your results.  Furthermore, all outputs are also saved to auto-created variables of the form `_NN` where `NN` is the prompt number, and inputs to `_iNN`.  This allows you to recover quickly the result of a prior computation by referring to its number even if you forgot to store it as a variable.  For example, later on in the above session you can do:
             #
             #     In [6]: print _1
             #     18446744073709551616
             # We strongly recommend that you take a few minutes to read at least the basic introduction provided by the `?` command, and keep in mind that the `%quickref` command at all times can be used as a quick reference "cheat sheet" of the most frequently used features of IPython.
             #
             # At the IPython prompt, any valid Python code that you type will be executed similarly to the default Python shell (though often with more informative feedback).  But IPython is a *superset* of the default Python shell, so let's have a brief look at some of its additional functionality.
             # **Object introspection**
             #
             # A simple `?` command provides a general introduction to IPython, but as indicated in the banner above, you can use the `?` syntax to ask for details about any object.  For example, if we type `_1?`, IPython will print the following details about this variable:
             #
             #     In [14]: _1?
             #     Type:       long
             #     Base Class: <type 'long'>
             #     String Form:18446744073709551616
             #     Namespace:  Interactive
             #     Docstring:
             #     long(x[, base]) -> integer
             #
             #     Convert a string or number to a long integer, if possible.  A floating
             #
             #     [etc... snipped for brevity]
             #
             # If you add a second `?` and for any object `x` type `x??`, IPython will try to provide an even more detailed analysis of the object, including its syntax-highlighted source code when it can be found.  It's possible that `x??` returns the same information as `x?`, but in many cases `x??` will indeed provide additional details.
             #
             # Finally, the `?` syntax is also useful to search *namespaces* with wildcards.  Suppose you are wondering if there is any function in Numpy that may do text-related things; with `np.*txt*?`, IPython will print all the names in the `np` namespace (our Numpy shorthand) that have 'txt' anywhere in their name:
             #
             #     In [17]: np.*txt*?
             #     np.genfromtxt
             #     np.loadtxt
             #     np.mafromtxt
             #     np.ndfromtxt
             #     np.recfromtxt
             #     np.savetxt
             # **Tab completion**
             #
             # IPython makes the tab key work extra hard for you as a way to rapidly inspect objects and libraries.  Whenever you have typed something at the prompt, by hitting the `<tab>` key IPython will try to complete the rest of the line.  For this, IPython will analyze the text you had so far and try to search for Python data or files that may match the context you have already provided.
             #
             # For example, if you type `np.load` and hit the <tab> key, you'll see:
             #
             #     In [21]: np.load<TAB HERE>
             #     np.load     np.loads    np.loadtxt
             #
             # so you can quickly find all the load-related functionality in numpy.  Tab completion works even for function arguments, for example consider this function definition:
             #
             #     In [20]: def f(x, frobinate=False):
             #        ....:     if frobinate:
             #        ....:         return x**2
             #        ....:
             #
             # If you now use the `<tab>` key after having typed 'fro' you'll get all valid Python completions, but those marked with `=` at the end are known to be keywords of your function:
             #
             #     In [21]: f(2, fro<TAB HERE>
             #     frobinate=    frombuffer    fromfunction  frompyfunc    fromstring
             #     from          fromfile      fromiter      fromregex     frozenset
             #
             # at this point you can add the `b` letter and hit `<tab>` once more, and IPython will finish the line for you:
             #
             #     In [21]: f(2, frobinate=
             #
             # As a beginner, simply get into the habit of using `<tab>` after most objects; it should quickly become second nature as you will see how it helps keep a fluid workflow and discover useful information.  Later on you can also customize this behavior by writing your own completion code, if you so desire.
             # **Matplotlib integration**
             #
             # One of the most useful features of IPython for scientists is its tight integration with matplotlib: at the terminal IPython lets you open matplotlib figures without blocking your typing (which is what happens if you try to do the same thing at the default Python shell), and in the Qt console and notebook you can even view your figures embedded in your workspace next to the code that created them.
             #
             # The matplotlib support can be either activated when you start IPython by passing the `--pylab` flag, or at any point later in your session by using the `%pylab` command.  If you start IPython with `--pylab`, you'll see something like this (note the extra message about pylab):
             #
             #     $ ipython --pylab
             #     Python 2.7.2+ (default, Oct  4 2011, 20:03:08)
             #     Type "copyright", "credits" or "license" for more information.
             #
             #     IPython 0.13.dev -- An enhanced Interactive Python.
             #     ?         -> Introduction and overview of IPython's features.
             #     %quickref -> Quick reference.
             #     help      -> Python's own help system.
             #     object?   -> Details about 'object', use 'object??' for extra details.
             #
             #     Welcome to pylab, a matplotlib-based Python environment [backend: Qt4Agg].
             #     For more information, type 'help(pylab)'.
             #
             #     In [1]:
             #
             # Furthermore, IPython will import `numpy` with the `np` shorthand, `matplotlib.pyplot` as `plt`, and it will also load all of the numpy and pyplot top-level names so that you can directly type something like:
             #
             #     In [1]: x = linspace(0, 2*pi, 200)
             #
             #     In [2]: plot(x, sin(x))
             #     Out[2]: [<matplotlib.lines.Line2D at 0x9e7c16c>]
             #
             # instead of having to prefix each call with its full signature (as we have been doing in the examples thus far):
             #
             #     In [3]: x = np.linspace(0, 2*np.pi, 200)
             #
             #     In [4]: plt.plot(x, np.sin(x))
             #     Out[4]: [<matplotlib.lines.Line2D at 0x9e900ac>]
             #
             # This shorthand notation can be a huge time-saver when working interactively (it's a few characters but you are likely to type them hundreds of times in a session).  But we should note that as you develop persistent scripts and notebooks meant for reuse, it's best to get in the habit of using the longer notation (known as *fully qualified names*), as it's clearer where things come from and it makes for more robust, readable and maintainable code in the long run.
             # **Access to the operating system and files**
             #
             # In IPython, you can type `ls` to see your files or `cd` to change directories, just like you would at a regular system prompt:
             #
             #     In [2]: cd tests
             #     /home/fperez/ipython/nbconvert/tests
             #
             #     In [3]: ls test.*
             #     test.aux  test.html  test.ipynb  test.log  test.out  test.pdf  test.rst  test.tex
             #
             # Furthermore, if you use the `!` at the beginning of a line, any commands you pass afterwards go directly to the operating system:
             #
             #     In [4]: !echo "Hello IPython"
             #     Hello IPython
             #
             # IPython offers a useful twist in this feature: it will substitute in the command the value of any *Python* variable you may have if you prepend it with a `$` sign:
             #
             #     In [5]: message = 'IPython interpolates from Python to the shell'
             #
             #     In [6]: !echo $message
             #     IPython interpolates from Python to the shell
             #
             # This feature can be extremely useful, as it lets you combine the power and clarity of Python for complex logic with the immediacy and familiarity of many shell commands.  Additionally, if you start the line with *two* `!!` signs, the output of the command will be automatically captured as a list of lines, e.g.:
             #
             #     In [10]: !!ls test.*
             #     Out[10]:
             #     ['test.aux',
             #      'test.html',
             #      'test.ipynb',
             #      'test.log',
             #      'test.out',
             #      'test.pdf',
             #      'test.rst',
             #      'test.tex']
             #
             # As explained above, you can now use this as the variable `_10`.  If you directly want to capture the output of a system command to a Python variable, you can use the syntax `=!`:
             #
             #     In [11]: testfiles =! ls test.*
             #
             #     In [12]: print testfiles
             #     ['test.aux', 'test.html', 'test.ipynb', 'test.log', 'test.out', 'test.pdf', 'test.rst', 'test.tex']
             #
             # Finally, the special `%alias` command lets you define names that are shorthands for system commands, so that you can type them without having to prefix them via `!` explicitly (for example, `ls` is an alias that has been predefined for you at startup).
             # **Magic commands**
             #
             # IPython has a system for special commands, called 'magics', that let you control IPython itself and perform many common tasks with a more shell-like syntax: it uses spaces for delimiting arguments, flags can be set with dashes and all arguments are treated as strings, so no additional quoting is required.  This kind of syntax is invalid in the Python language but very convenient for interactive typing (fewer parentheses, commas and quoting everywhere); IPython distinguishes the two by detecting lines that start with the `%` character.
             #
             # You can learn more about the magic system by simply typing `%magic` at the prompt, which will give you a short description plus the documentation on *all* available magics.  If you want to see only a listing of existing magics, you can use `%lsmagic`:
             #
             #     In [4]: lsmagic
             #     Available magic functions:
             #     %alias  %autocall  %autoindent  %automagic  %bookmark  %c  %cd  %colors  %config  %cpaste
             #     %debug  %dhist  %dirs  %doctest_mode  %ds  %ed  %edit  %env  %gui  %hist  %history
             #     %install_default_config  %install_ext  %install_profiles  %load_ext  %loadpy  %logoff  %logon
             #     %logstart  %logstate  %logstop  %lsmagic  %macro  %magic  %notebook  %page  %paste  %pastebin
             #     %pd  %pdb  %pdef  %pdoc  %pfile  %pinfo  %pinfo2  %pop  %popd  %pprint  %precision  %profile
             #     %prun  %psearch  %psource  %pushd  %pwd  %pycat  %pylab  %quickref  %recall  %rehashx
             #     %reload_ext  %rep  %rerun  %reset  %reset_selective  %run  %save  %sc  %stop  %store  %sx  %tb
             #     %time  %timeit  %unalias  %unload_ext  %who  %who_ls  %whos  %xdel  %xmode
             #
             #     Automagic is ON, % prefix NOT needed for magic functions.
             #
             # Note how the example above omitted the explicit `%` marker and simply uses `lsmagic`.  As long as the 'automagic' feature is on (which it is by default), you can omit the `%` marker as long as there is no ambiguity with a Python variable of the same name.
             # **Running your code**
             #
             # While it's easy to type a few lines of code in IPython, for any long-lived work you should keep your codes in Python scripts (or in IPython notebooks, see below).  Consider that you have a script, in this case trivially simple for the sake of brevity, named `simple.py`:
             #
             #     In [12]: !cat simple.py
             #     import numpy as np
             #
             #     x = np.random.normal(size=100)
             #
             #     print 'First elment of x:', x[0]
             #
             # The typical workflow with IPython is to use the `%run` magic to execute your script (you can omit the .py extension if you want).  When you run it, the script will execute just as if it had been run at the system prompt with `python simple.py` (though since modules don't get re-executed on new imports by Python, all system initialization is essentially free, which can have a significant run time impact in some cases):
             #
             #     In [13]: run simple
             #     First elment of x: -1.55872256289
             #
             # Once it completes, all variables defined in it become available for you to use interactively:
             #
             #     In [14]: x.shape
             #     Out[14]: (100,)
             #
             # This allows you to plot data, try out ideas, etc, in a `%run`/interact/edit cycle that can be very productive.  As you start understanding your problem better you can refine your script further, incrementally improving it based on the work you do at the IPython prompt.  At any point you can use the `%hist` magic to print out your history without prompts, so that you can copy useful fragments back into the script.
             #
             # By default, `%run` executes scripts in a completely empty namespace, to better mimic how they would execute at the system prompt with plain Python.  But if you use the `-i` flag, the script will also see your interactively defined variables.  This lets you edit in a script larger amounts of code that still behave as if you had typed them at the IPython prompt.
             #
             # You can also get a summary of the time taken by your script with the `-t` flag; consider a different script `randsvd.py` that takes a bit longer to run:
             #
             #     In [21]: run -t randsvd.py
             #
             #     IPython CPU timings (estimated):
             #       User   :       0.38 s.
             #       System :       0.04 s.
             #     Wall time:       0.34 s.
             #
             # `User` is the time spent by the computer executing your code, while `System` is the time the operating system had to work on your behalf, doing things like memory allocation that are needed by your code but that you didn't explicitly program and that happen inside the kernel.  The `Wall time` is the time on a 'clock on the wall' between the start and end of your program.
             #
             # If `Wall > User+System`, your code is most likely waiting idle for certain periods.  That could be waiting for data to arrive from a remote source or perhaps because the operating system has to swap large amounts of virtual memory.  If you know that your code doesn't explicitly wait for remote data to arrive, you should investigate further to identify possible ways of improving the performance profile.
             #
             # If you only want to time how long a single statement takes, you don't need to put it into a script as you can use the `%timeit` magic, which uses Python's `timeit` module to very carefully measure timing data; `timeit` can measure even short statements that execute extremely fast:
             #
             #     In [27]: %timeit a=1
             #     10000000 loops, best of 3: 23 ns per loop
             #
             # and for code that runs longer, it automatically adjusts so the overall measurement doesn't take too long:
             #
             #     In [28]: %timeit np.linalg.svd(x)
             #     1 loops, best of 3: 310 ms per loop
             #
             # The `%run` magic still has more options for debugging and profiling data; you should read its documentation for many useful details (as always, just type `%run?`).
             ### The graphical Qt console
             # If you type at the system prompt (see the IPython website for installation details, as this requires some additional libraries):
             #
             #     $ ipython qtconsole
             #
             # instead of opening in a terminal as before, IPython will start a graphical console that at first sight appears just like a terminal, but which is in fact much more capable than a text-only terminal.  This is a specialized terminal designed for interactive scientific work, and it supports full multi-line editing with color highlighting and graphical calltips for functions, it can keep multiple IPython sessions open simultaneously in tabs, and when scripts run it can display the figures inline directly in the work area.
             #
             # <center><img src="ipython_qtconsole2.png" width=400px></center>
             # % This cell is for the pdflatex output only
             # \begin{figure}[htbp]
             # \centering
             # \includegraphics[width=3in]{ipython_qtconsole2.png}
             # \caption{The IPython Qt console: a lightweight terminal for scientific exploration, with code, results and graphics in a single environment.}
             # \end{figure}
             # The Qt console accepts the same `--pylab` startup flags as the terminal, but you can additionally supply the value `--pylab inline`, which enables the support for inline graphics shown in the figure.  This is ideal for keeping all the code and figures in the same session, given that the console can save the output of your entire session to HTML or PDF.
             #
             # Since the Qt console makes it far more convenient than the terminal to edit blocks of code with multiple lines, in this environment it's worth knowing about the `%loadpy` magic function.  `%loadpy` takes a path to a local file or remote URL, fetches its contents, and puts it in the work area for you to further edit and execute.  It can be an extremely fast and convenient way of loading code from local disk or remote examples from sites such as the [Matplotlib gallery](http://matplotlib.sourceforge.net/gallery.html).
             #
             # Other than its enhanced capabilities for code and graphics, all of the features of IPython we've explained before remain functional in this graphical console.
             ### The IPython Notebook
             # The third way to interact with IPython, in addition to the terminal and graphical Qt console, is a powerful web interface called the "IPython Notebook".  If you run at the system console (you can omit the `pylab` flags if you don't need plotting support):
             #
             #     $ ipython notebook --pylab inline
             #
             # IPython will start a process that runs a web server in your local machine and to which a web browser can connect.  The Notebook is a workspace that lets you execute code in blocks called 'cells' and displays any results and figures, but which can also contain arbitrary text (including LaTeX-formatted mathematical expressions) and any rich media that a modern web browser is capable of displaying.
             #
             # <center><img src="ipython-notebook-specgram-2.png" width=400px></center>
             # % This cell is for the pdflatex output only
             # \begin{figure}[htbp]
             # \centering
             # \includegraphics[width=3in]{ipython-notebook-specgram-2.png}
             # \caption{The IPython Notebook: text, equations, code, results, graphics and other multimedia in an open format for scientific exploration and collaboration}
             # \end{figure}
             # In fact, this document was written as a Notebook, and only exported to LaTeX for printing.  Inside of each cell, all the features of IPython that we have discussed before remain functional, since ultimately this web client is communicating with the same IPython code that runs in the terminal.  But this interface is a much more rich and powerful environment for maintaining long-term "live and executable" scientific documents.
             #
             # Notebook environments have existed in commercial systems like Mathematica(TM) and Maple(TM) for a long time; in the open source world the [Sage](http://sagemath.org) project blazed this particular trail starting in 2006, and now we bring all the features that have made IPython such a widely used tool to a Notebook model.
             #
             # Since the Notebook runs as a web application, it is possible to configure it for remote access, letting you run your computations on a persistent server close to your data, which you can then access remotely from any browser-equipped computer.  We encourage you to read the extensive documentation provided by the IPython project for details on how to do this and many more features of the notebook.
             #
             # Finally, as we said earlier, IPython also has a high-level and easy to use set of libraries for parallel computing, that let you control (interactively if desired) not just one IPython but an entire cluster of 'IPython engines'.   Unfortunately a detailed discussion of these tools is beyond the scope of this text, but should you need to parallelize your analysis codes, a quick read of the tutorials and examples provided at the IPython site may prove fruitful.

tests/ipynbref/IntroNumPy.orig.rst

0 +10 -10

             An Introduction to the Scientific Python Ecosystem
             ==================================================
             While the Python language is an excellent tool for general-purpose
             programming, with a highly readable syntax, rich and powerful data types
             (strings, lists, sets, dictionaries, arbitrary length integers, etc) and
             a very comprehensive standard library, it was not designed specifically
             for mathematical and scientific computing. Neither the language nor its
             standard library have facilities for the efficient representation of
             multidimensional datasets, tools for linear algebra and general matrix
             manipulations (an essential building block of virtually all technical
             computing), nor any data visualization facilities.
             In particular, Python lists are very flexible containers that can be
             nested arbitrarily deep and which can hold any Python object in them,
             but they are poorly suited to represent efficiently common mathematical
             constructs like vectors and matrices. In contrast, much of our modern
             heritage of scientific computing has been built on top of libraries
             written in the Fortran language, which has native support for vectors
             and matrices as well as a library of mathematical functions that can
             efficiently operate on entire arrays at once.
             Scientific Python: a collaboration of projects built by scientists
             ------------------------------------------------------------------
             The scientific community has developed a set of related Python libraries
             that provide powerful array facilities, linear algebra, numerical
             algorithms, data visualization and more. In this appendix, we will
             briefly outline the tools most frequently used for this purpose, that
             make "Scientific Python" something far more powerful than the Python
             language alone.
             For reasons of space, we can only describe in some detail the central
             Numpy library, but below we provide links to the websites of each
             project where you can read their documentation in more detail.
             First, let's look at an overview of the basic tools that most scientists
             use in daily research with Python. The core of this ecosystem is
             composed of:
             -  Numpy: the basic library that most others depend on, it provides a
                powerful array type that can represent multidimensional datasets of
                many different kinds and that supports arithmetic operations. Numpy
                also provides a library of common mathematical functions, basic
                linear algebra, random number generation and Fast Fourier Transforms.
                Numpy can be found at `numpy.scipy.org <http://numpy.scipy.org>`_
             -  Scipy: a large collection of numerical algorithms that operate on
                numpy arrays and provide facilities for many common tasks in
                scientific computing, including dense and sparse linear algebra
                support, optimization, special functions, statistics, n-dimensional
                image processing, signal processing and more. Scipy can be found at
                `scipy.org <http://scipy.org>`_.
             -  Matplotlib: a data visualization library with a strong focus on
                producing high-quality output, it supports a variety of common
                scientific plot types in two and three dimensions, with precise
                control over the final output and format for publication-quality
                results. Matplotlib can also be controlled interactively allowing
                graphical manipulation of your data (zooming, panning, etc) and can
                be used with most modern user interface toolkits. It can be found at
                `matplotlib.sf.net <http://matplotlib.sf.net>`_.
             -  IPython: while not strictly scientific in nature, IPython is the
                interactive environment in which many scientists spend their time.
                IPython provides a powerful Python shell that integrates tightly with
                Matplotlib and with easy access to the files and operating system,
                and which can execute in a terminal or in a graphical Qt console.
                IPython also has a web-based notebook interface that can combine code
                with text, mathematical expressions, figures and multimedia. It can
                be found at `ipython.org <http://ipython.org>`_.
             While each of these tools can be installed separately, in our opinion
             the most convenient way today of accessing them (especially on Windows
             and Mac computers) is to install the `Free Edition of the Enthought
             Python Distribution <http://www.enthought.com/products/epd_free.php>`_
             which contains all the above. Other free alternatives on Windows (but not
             on Macs) are `Python(x,y) <http://code.google.com/p/pythonxy>`_ and
             `Christoph Gohlke's packages
             page <http://www.lfd.uci.edu/~gohlke/pythonlibs>`_.
             These four 'core' libraries are in practice complemented by a number of
             other tools for more specialized work. We will briefly list here the
             ones that we think are the most commonly needed:
             -  Sympy: a symbolic manipulation tool that turns a Python session into
                a computer algebra system. It integrates with the IPython notebook,
                rendering results in properly typeset mathematical notation.
                `sympy.org <http://sympy.org>`_.
             -  Mayavi: sophisticated 3d data visualization;
                `code.enthought.com/projects/mayavi <http://code.enthought.com/projects/mayavi>`_.
             -  Cython: a bridge language between Python and C, useful both to
                optimize performance bottlenecks in Python and to access C libraries
                directly; `cython.org <http://cython.org>`_.
             -  Pandas: high-performance data structures and data analysis tools,
                with powerful data alignment and structural manipulation
                capabilities; `pandas.pydata.org <http://pandas.pydata.org>`_.
             -  Statsmodels: statistical data exploration and model estimation;
                `statsmodels.sourceforge.net <http://statsmodels.sourceforge.net>`_.
             -  Scikit-learn: general purpose machine learning algorithms with a
                common interface; `scikit-learn.org <http://scikit-learn.org>`_.
             -  Scikits-image: image processing toolbox;
                `scikits-image.org <http://scikits-image.org>`_.
             -  NetworkX: analysis of complex networks (in the graph theoretical
                sense); `networkx.lanl.gov <http://networkx.lanl.gov>`_.
             -  PyTables: management of hierarchical datasets using the
                industry-standard HDF5 format;
                `www.pytables.org <http://www.pytables.org>`_.
             Beyond these, for any specific problem you should look on the internet
             first, before starting to write code from scratch. There's a good chance
             that someone, somewhere, has written an open source library that you can
             use for part or all of your problem.
             A note about the examples below
             -------------------------------
             In all subsequent examples, you will see blocks of input code, followed
             by the results of the code if the code generated output. This output may
             include text, graphics and other result objects. These blocks of input
             can be pasted into your interactive IPython session or notebook for you
             to execute. In the print version of this document, a thin vertical bar
             on the left of the blocks of input and output shows which blocks go
             together.
             If you are reading this text as an actual IPython notebook, you can
             press ``Shift-Enter`` or use the 'play' button on the toolbar
             (right-pointing triangle) to execute each block of code, known as a
             'cell' in IPython:
             In[71]:
             .. code:: python
                 # This is a block of code, below you'll see its output
                 print "Welcome to the world of scientific computing with Python!"
             .. parsed-literal::
                 Welcome to the world of scientific computing with Python!
             Motivation: the trapezoidal rule
             ================================
             In subsequent sections we'll provide a basic introduction to the nuts
             and bolts of the basic scientific python tools; but we'll first motivate
             it with a brief example that illustrates what you can do in a few lines
             with these tools. For this, we will use the simple problem of
             approximating a definite integral with the trapezoid rule:
             .. math::
                \int_{a}^{b} f(x)\, dx \approx \frac{1}{2} \sum_{k=1}^{N} \left( x_{k} - x_{k-1} \right) \left( f(x_{k}) + f(x_{k-1}) \right).
             Our task will be to compute this formula for a function such as:
             .. math::
                f(x) = (x-3)(x-5)(x-7)+85
             integrated between :math:`a=1` and :math:`b=9`.
             First, we define the function and sample it evenly between 0 and 10 at
             200 points:
             In[1]:
             .. code:: python
                 def f(x):
                     return (x-3)*(x-5)*(x-7)+85
                 import numpy as np
                 x = np.linspace(0, 10, 200)
                 y = f(x)
             We select :math:`a` and :math:`b`, our integration limits, and we take
             only a few points in that region to illustrate the error behavior of the
             trapezoid approximation:
             In[2]:
             .. code:: python
                 a, b = 1, 9
                 xint = x[logical_and(x>=a, x<=b)][::30]
                 yint = y[logical_and(x>=a, x<=b)][::30]
             Let's plot both the function and the area below it in the trapezoid
             approximation:
             In[3]:
             .. code:: python
                 import matplotlib.pyplot as plt
                 plt.plot(x, y, lw=2)
                 plt.axis([0, 10, 0, 140])
                 plt.fill_between(xint, 0, yint, facecolor='gray', alpha=0.4)
                 plt.text(0.5 * (a + b), 30,r"$\int_a^b f(x)dx$", horizontalalignment='center', fontsize=20);
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_00.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_00.svg
             Compute the integral both at high accuracy and with the trapezoid
             approximation
             In[4]:
             .. code:: python
                 from scipy.integrate import quad, trapz
                 integral, error = quad(f, 1, 9)
                 trap_integral = trapz(yint, xint)
                 print "The integral is: %g +/- %.1e" % (integral, error)
                 print "The trapezoid approximation with", len(xint), "points is:", trap_integral
                 print "The absolute error is:", abs(integral - trap_integral)
             .. parsed-literal::
                 The integral is: 680 +/- 7.5e-12
                 The trapezoid approximation with 6 points is: 621.286411141
                 The absolute error is: 58.7135888589
             This simple example showed us how, combining the numpy, scipy and
             matplotlib libraries we can provide an illustration of a standard method
             in elementary calculus with just a few lines of code. We will now
             discuss with more detail the basic usage of these tools.
             NumPy arrays: the right data structure for scientific computing
             ===============================================================
             Basics of Numpy arrays
             ----------------------
             We now turn our attention to the Numpy library, which forms the base
             layer for the entire 'scipy ecosystem'. Once you have installed numpy,
             you can import it as
             In[5]:
             .. code:: python
                 import numpy
             though in this book we will use the common shorthand
             In[6]:
             .. code:: python
                 import numpy as np
             As mentioned above, the main object provided by numpy is a powerful
             array. We'll start by exploring how the numpy array differs from Python
             lists. We start by creating a simple list and an array with the same
             contents of the list:
             In[7]:
             .. code:: python
                 lst = [10, 20, 30, 40]
                 arr = np.array([10, 20, 30, 40])
             Elements of a one-dimensional array are accessed with the same syntax as
             a list:
             In[8]:
             .. code:: python
                 lst[0]
             Out[8]:
             .. parsed-literal::
                 10
             In[9]:
             .. code:: python
                 arr[0]
             Out[9]:
             .. parsed-literal::
                 10
             In[10]:
             .. code:: python
                 arr[-1]
             Out[10]:
             .. parsed-literal::
                 40
             In[11]:
             .. code:: python
                 arr[2:]
             Out[11]:
             .. parsed-literal::
                 array([30, 40])
             The first difference to note between lists and arrays is that arrays are
             *homogeneous*; i.e. all elements of an array must be of the same type.
             In contrast, lists can contain elements of arbitrary type. For example,
             we can change the last element in our list above to be a string:
             In[12]:
             .. code:: python
                 lst[-1] = 'a string inside a list'
                 lst
             Out[12]:
             .. parsed-literal::
                 [10, 20, 30, 'a string inside a list']
             but the same can not be done with an array, as we get an error message:
             In[13]:
             .. code:: python
                 arr[-1] = 'a string inside an array'
             ::
                 ---------------------------------------------------------------------------
                 ValueError                                Traceback (most recent call last)
                 /home/fperez/teach/book-math-labtool/<ipython-input-13-29c0bfa5fa8a> in <module>()
                 ----> 1 arr[-1] = 'a string inside an array'
                 ValueError: invalid literal for long() with base 10: 'a string inside an array'
             The information about the type of an array is contained in its *dtype*
             attribute:
             In[14]:
             .. code:: python
                 arr.dtype
             Out[14]:
             .. parsed-literal::
                 dtype('int32')
             Once an array has been created, its dtype is fixed and it can only store
             elements of the same type. For this example where the dtype is integer,
             if we store a floating point number it will be automatically converted
             into an integer:
             In[15]:
             .. code:: python
                 arr[-1] = 1.234
                 arr
             Out[15]:
             .. parsed-literal::
                 array([10, 20, 30,  1])
             Above we created an array from an existing list; let us now see
             other ways in which we can create arrays, which we'll illustrate next. A
             common need is to have an array initialized with a constant value, and
             very often this value is 0 or 1 (suitable as starting value for additive
             and multiplicative loops respectively); ``zeros`` creates arrays of all
             zeros, with any desired dtype:
             In[16]:
             .. code:: python
                 np.zeros(5, float)
             Out[16]:
             .. parsed-literal::
                 array([ 0.,  0.,  0.,  0.,  0.])
             In[17]:
             .. code:: python
                 np.zeros(3, int)
             Out[17]:
             .. parsed-literal::
                 array([0, 0, 0])
             In[18]:
             .. code:: python
                 np.zeros(3, complex)
             Out[18]:
             .. parsed-literal::
                 array([ 0.+0.j,  0.+0.j,  0.+0.j])
             and similarly for ``ones``:
             In[19]:
             .. code:: python
                 print '5 ones:', np.ones(5)
             .. parsed-literal::
                 5 ones: [ 1.  1.  1.  1.  1.]
             If we want an array initialized with an arbitrary value, we can create
             an empty array and then use the fill method to put the value we want
             into the array:
             In[20]:
             .. code:: python
                 a = empty(4)
                 a.fill(5.5)
                 a
             Out[20]:
             .. parsed-literal::
                 array([ 5.5,  5.5,  5.5,  5.5])
             Numpy also offers the ``arange`` function, which works like the builtin
             ``range`` but returns an array instead of a list:
             In[21]:
             .. code:: python
                 np.arange(5)
             Out[21]:
             .. parsed-literal::
                 array([0, 1, 2, 3, 4])
             and the ``linspace`` and ``logspace`` functions to create linearly and
             logarithmically-spaced grids respectively, with a fixed number of points
             and including both ends of the specified interval:
             In[22]:
             .. code:: python
                 print "A linear grid between 0 and 1:", np.linspace(0, 1, 5)
                 print "A logarithmic grid between 10**1 and 10**4: ", np.logspace(1, 4, 4)
             .. parsed-literal::
                 A linear grid between 0 and 1: [ 0.    0.25  0.5   0.75  1.  ]
                 A logarithmic grid between 10**1 and 10**4:  [    10.    100.   1000.  10000.]
             Finally, it is often useful to create arrays with random numbers that
             follow a specific distribution. The ``np.random`` module contains a
             number of functions that can be used to this effect, for example this
             will produce an array of 5 random samples taken from a standard normal
             distribution (0 mean and variance 1):
             In[23]:
             .. code:: python
                 np.random.randn(5)
             Out[23]:
             .. parsed-literal::
                 array([-0.08633343, -0.67375434,  1.00589536,  0.87081651,  1.65597822])
             whereas this will also give 5 samples, but from a normal distribution
             with a mean of 10 and a variance of 3:
             In[24]:
             .. code:: python
                 norm10 = np.random.normal(10, 3, 5)
                 norm10
             Out[24]:
             .. parsed-literal::
                 array([  8.94879575,   5.53038269,   8.24847281,  12.14944165,  11.56209294])
             Indexing with other arrays
             --------------------------
             Above we saw how to index arrays with single numbers and slices, just
             like Python lists. But arrays allow for a more sophisticated kind of
             indexing which is very powerful: you can index an array with another
             array, and in particular with an array of boolean values. This is
             particularly useful to extract information from an array that matches a
             certain condition.
             Consider for example that in the array ``norm10`` we want to replace all
             values above 9 with the value 0. We can do so by first finding the
             *mask* that indicates where this condition is true or false:
             In[25]:
             .. code:: python
                 mask = norm10 > 9
                 mask
             Out[25]:
             .. parsed-literal::
                 array([False, False, False,  True,  True], dtype=bool)
             Now that we have this mask, we can use it to either read those values or
             to reset them to 0:
             In[26]:
             .. code:: python
                 print 'Values above 9:', norm10[mask]
             .. parsed-literal::
                 Values above 9: [ 12.14944165  11.56209294]
             In[27]:
             .. code:: python
                 print 'Resetting all values above 9 to 0...'
                 norm10[mask] = 0
                 print norm10
             .. parsed-literal::
                 Resetting all values above 9 to 0...
                 [ 8.94879575  5.53038269  8.24847281  0.          0.        ]
             Arrays with more than one dimension
             -----------------------------------
             Up until now all our examples have used one-dimensional arrays. But
             Numpy can create arrays of arbitrary dimensions, and all the methods
             illustrated in the previous section work with more than one dimension.
             For example, a list of lists can be used to initialize a two dimensional
             array:
             In[28]:
             .. code:: python
                 lst2 = [[1, 2], [3, 4]]
                 arr2 = np.array([[1, 2], [3, 4]])
                 arr2
             Out[28]:
             .. parsed-literal::
                 array([[1, 2],
                        [3, 4]])
             With two-dimensional arrays we start seeing the power of numpy: while a
             nested list can be indexed using repeatedly the ``[ ]`` operator,
             multidimensional arrays support a much more natural indexing syntax with
             a single ``[ ]`` and a set of indices separated by commas:
             In[29]:
             .. code:: python
                 print lst2[0][1]
                 print arr2[0,1]
             .. parsed-literal::
                 2
                 2
             Most of the array creation functions listed above can be used with more
             than one dimension, for example:
             In[30]:
             .. code:: python
                 np.zeros((2,3))
             Out[30]:
             .. parsed-literal::
                 array([[ 0.,  0.,  0.],
                        [ 0.,  0.,  0.]])
             In[31]:
             .. code:: python
                 np.random.normal(10, 3, (2, 4))
             Out[31]:
             .. parsed-literal::
                 array([[ 11.26788826,   4.29619866,  11.09346496,   9.73861307],
                        [ 10.54025996,   9.5146268 ,  10.80367214,  13.62204505]])
             In fact, the shape of an array can be changed at any time, as long as
             the total number of elements is unchanged. For example, if we want a 2x4
             array with numbers increasing from 0, the easiest way to create it is:
             In[32]:
             .. code:: python
                 arr = np.arange(8).reshape(2,4)
                 print arr
             .. parsed-literal::
                 [[0 1 2 3]
                  [4 5 6 7]]
             With multidimensional arrays, you can also use slices, and you can mix
             and match slices and single indices in the different dimensions (using
             the same array as above):
             In[33]:
             .. code:: python
                 print 'Slicing in the second row:', arr[1, 2:4]
                 print 'All rows, third column   :', arr[:, 2]
             .. parsed-literal::
                 Slicing in the second row: [6 7]
                 All rows, third column   : [2 6]
             If you only provide one index, then you will get an array with one less
             dimension containing that row:
             In[34]:
             .. code:: python
                 print 'First row:  ', arr[0]
                 print 'Second row: ', arr[1]
             .. parsed-literal::
                 First row:   [0 1 2 3]
                 Second row:  [4 5 6 7]
             Now that we have seen how to create arrays with more than one dimension,
             it's a good idea to look at some of the most useful properties and
             methods that arrays have. The following provide basic information about
             the size, shape and data in the array:
             In[35]:
             .. code:: python
                 print 'Data type                :', arr.dtype
                 print 'Total number of elements :', arr.size
                 print 'Number of dimensions     :', arr.ndim
                 print 'Shape (dimensionality)   :', arr.shape
                 print 'Memory used (in bytes)   :', arr.nbytes
             .. parsed-literal::
                 Data type                : int32
                 Total number of elements : 8
                 Number of dimensions     : 2
                 Shape (dimensionality)   : (2, 4)
                 Memory used (in bytes)   : 32
             Arrays also have many useful methods, some especially useful ones are:
             In[36]:
             .. code:: python
                 print 'Minimum and maximum             :', arr.min(), arr.max()
                 print 'Sum and product of all elements :', arr.sum(), arr.prod()
                 print 'Mean and standard deviation     :', arr.mean(), arr.std()
             .. parsed-literal::
                 Minimum and maximum             : 0 7
                 Sum and product of all elements : 28 0
                 Mean and standard deviation     : 3.5 2.29128784748
             For these methods, the above operations are all computed on all the
             elements of the array. But for a multidimensional array, it's possible
             to do the computation along a single dimension, by passing the ``axis``
             parameter; for example:
             In[37]:
             .. code:: python
                 print 'For the following array:\n', arr
                 print 'The sum of elements along the rows is    :', arr.sum(axis=1)
                 print 'The sum of elements along the columns is :', arr.sum(axis=0)
             .. parsed-literal::
                 For the following array:
                 [[0 1 2 3]
                  [4 5 6 7]]
                 The sum of elements along the rows is    : [ 6 22]
                 The sum of elements along the columns is : [ 4  6  8 10]
             As you can see in this example, the value of the ``axis`` parameter is
             the dimension which will be *consumed* once the operation has been
             carried out. This is why to sum along the rows we use ``axis=1``.
             This can be easily illustrated with an example that has more dimensions;
             we create an array with 4 dimensions and shape ``(3,4,5,6)`` and sum
             along the axis number 2 (i.e. the *third* axis, since in Python all
             counts are 0-based). That consumes the dimension whose length was 5,
             leaving us with a new array that has shape ``(3,4,6)``:
             In[38]:
             .. code:: python
                 np.zeros((3,4,5,6)).sum(2).shape
             Out[38]:
             .. parsed-literal::
                 (3, 4, 6)
             Another widely used property of arrays is the ``.T`` attribute, which
             allows you to access the transpose of the array:
             In[39]:
             .. code:: python
                 print 'Array:\n', arr
                 print 'Transpose:\n', arr.T
             .. parsed-literal::
                 Array:
                 [[0 1 2 3]
                  [4 5 6 7]]
                 Transpose:
                 [[0 4]
                  [1 5]
                  [2 6]
                  [3 7]]
             We don't have time here to look at all the methods and properties of
             arrays, but here's a complete list. Simply try exploring some of these
             in IPython to learn more, or read their description in the full Numpy
             documentation:
             ::
                 arr.T             arr.copy          arr.getfield      arr.put           arr.squeeze
                 arr.all           arr.ctypes        arr.imag          arr.ravel         arr.std
                 arr.any           arr.cumprod       arr.item          arr.real          arr.strides
                 arr.argmax        arr.cumsum        arr.itemset       arr.repeat        arr.sum
                 arr.argmin        arr.data          arr.itemsize      arr.reshape       arr.swapaxes
                 arr.argsort       arr.diagonal      arr.max           arr.resize        arr.take
                 arr.astype        arr.dot           arr.mean          arr.round         arr.tofile
                 arr.base          arr.dtype         arr.min           arr.searchsorted  arr.tolist
                 arr.byteswap      arr.dump          arr.nbytes        arr.setasflat     arr.tostring
                 arr.choose        arr.dumps         arr.ndim          arr.setfield      arr.trace
                 arr.clip          arr.fill          arr.newbyteorder  arr.setflags      arr.transpose
                 arr.compress      arr.flags         arr.nonzero       arr.shape         arr.var
                 arr.conj          arr.flat          arr.prod          arr.size          arr.view
                 arr.conjugate     arr.flatten       arr.ptp           arr.sort
             Operating with arrays
             ---------------------
             Arrays support all regular arithmetic operators, and the numpy library
             also contains a complete collection of basic mathematical functions that
             operate on arrays. It is important to remember that in general, all
             operations with arrays are applied *element-wise*, i.e., are applied to
             all the elements of the array at the same time. Consider for example:
             In[40]:
             .. code:: python
                 arr1 = np.arange(4)
                 arr2 = np.arange(10, 14)
                 print arr1, '+', arr2, '=', arr1+arr2
             .. parsed-literal::
                 [0 1 2 3] + [10 11 12 13] = [10 12 14 16]
             Importantly, you must remember that even the multiplication operator is
             by default applied element-wise, it is *not* the matrix multiplication
             from linear algebra (as is the case in Matlab, for example):
             In[41]:
             .. code:: python
                 print arr1, '*', arr2, '=', arr1*arr2
             .. parsed-literal::
                 [0 1 2 3] * [10 11 12 13] = [ 0 11 24 39]
             While this means that in principle arrays must always match in their
             dimensionality in order for an operation to be valid, numpy will
             *broadcast* dimensions when possible. For example, suppose that you want
             to add the number 1.5 to ``arr1``; the following would be a valid way to
             do it:
             In[42]:
             .. code:: python
                 arr1 + 1.5*np.ones(4)
             Out[42]:
             .. parsed-literal::
                 array([ 1.5,  2.5,  3.5,  4.5])
             But thanks to numpy's broadcasting rules, the following is equally
             valid:
             In[43]:
             .. code:: python
                 arr1 + 1.5
             Out[43]:
             .. parsed-literal::
                 array([ 1.5,  2.5,  3.5,  4.5])
             In this case, numpy looked at both operands and saw that the first
             (``arr1``) was a one-dimensional array of length 4 and the second was a
             scalar, considered a zero-dimensional object. The broadcasting rules
             allow numpy to:
             -  *create* new dimensions of length 1 (since this doesn't change the
                size of the array)
             -  'stretch' a dimension of length 1 that needs to be matched to a
                dimension of a different size.
             So in the above example, the scalar 1.5 is effectively:
             -  first 'promoted' to a 1-dimensional array of length 1
             -  then, this array is 'stretched' to length 4 to match the dimension of
                ``arr1``.
             After these two operations are complete, the addition can proceed as now
             both operands are one-dimensional arrays of length 4.
             This broadcasting behavior is in practice enormously powerful,
             especially because when numpy broadcasts to create new dimensions or to
             'stretch' existing ones, it doesn't actually replicate the data. In the
             example above the operation is carried *as if* the 1.5 was a 1-d array
             with 1.5 in all of its entries, but no actual array was ever created.
             This can save lots of memory in cases when the arrays in question are
             large and can have significant performance implications.
             The general rule is: when operating on two arrays, NumPy compares their
             shapes element-wise. It starts with the trailing dimensions, and works
             its way forward, creating dimensions of length 1 as needed. Two
             dimensions are considered compatible when
             -  they are equal to begin with, or
             -  one of them is 1; in this case numpy will do the 'stretching' to make
                them equal.
             If these conditions are not met, a
             ``ValueError: operands could not be broadcast together`` exception is
             thrown, indicating that the arrays have incompatible shapes. The size of
             the resulting array is the maximum size along each dimension of the input
             arrays.
             This shows how the broadcasting rules work in several dimensions:
             In[44]:
             .. code:: python
                 b = np.array([2, 3, 4, 5])
                 print arr, '\n\n+', b , '\n----------------\n', arr + b
             .. parsed-literal::
                 [[0 1 2 3]
                  [4 5 6 7]]
                 + [2 3 4 5]
                 ----------------
                 [[ 2  4  6  8]
                  [ 6  8 10 12]]
             Now, how could you use broadcasting to say add ``[4, 6]`` along the rows
             to ``arr`` above? Simply performing the direct addition will produce the
             error we previously mentioned:
             In[45]:
             .. code:: python
                 c = np.array([4, 6])
                 arr + c
             ::
                 ---------------------------------------------------------------------------
                 ValueError                                Traceback (most recent call last)
                 /home/fperez/teach/book-math-labtool/<ipython-input-45-62aa20ac1980> in <module>()
                       1 c = np.array([4, 6])
                 ----> 2 arr + c
                 ValueError: operands could not be broadcast together with shapes (2,4) (2)
             According to the rules above, the array ``c`` would need to have a
             *trailing* dimension of 1 for the broadcasting to work. It turns out
             that numpy allows you to 'inject' new dimensions anywhere into an array
             on the fly, by indexing it with the special object ``np.newaxis``:
             In[46]:
             .. code:: python
                 (c[:, np.newaxis]).shape
             Out[46]:
             .. parsed-literal::
                 (2, 1)
             This is exactly what we need, and indeed it works:
             In[47]:
             .. code:: python
                 arr + c[:, np.newaxis]
             Out[47]:
             .. parsed-literal::
                 array([[ 4,  5,  6,  7],
                        [10, 11, 12, 13]])
             For the full broadcasting rules, please see the official Numpy docs,
             which describe them in detail and with more complex examples.
             As we mentioned before, Numpy ships with a full complement of
             mathematical functions that work on entire arrays, including logarithms,
             exponentials, trigonometric and hyperbolic trigonometric functions, etc.
             Furthermore, scipy ships a rich special function library in the
             ``scipy.special`` module that includes Bessel, Airy, Fresnel, Laguerre
             and other classical special functions. For example, sampling the sine
             function at 100 points between :math:`0` and :math:`2\pi` is as simple
             as:
             In[48]:
             .. code:: python
                 x = np.linspace(0, 2*np.pi, 100)
                 y = np.sin(x)
             Linear algebra in numpy
             -----------------------
             Numpy ships with a basic linear algebra library, and all arrays have a
             ``dot`` method whose behavior is that of the scalar dot product when its
             arguments are vectors (one-dimensional arrays) and the traditional
             matrix multiplication when one or both of its arguments are
             two-dimensional arrays:
             In[49]:
             .. code:: python
                 v1 = np.array([2, 3, 4])
                 v2 = np.array([1, 0, 1])
                 print v1, '.', v2, '=', v1.dot(v2)
             .. parsed-literal::
                 [2 3 4] . [1 0 1] = 6
             Here is a regular matrix-vector multiplication, note that the array
             ``v1`` should be viewed as a *column* vector in traditional linear
             algebra notation; numpy makes no distinction between row and column
             vectors and simply verifies that the dimensions match the required rules
             of matrix multiplication, in this case we have a :math:`2 \times 3`
             matrix multiplied by a 3-vector, which produces a 2-vector:
             In[50]:
             .. code:: python
                 A = np.arange(6).reshape(2, 3)
                 print A, 'x', v1, '=', A.dot(v1)
             .. parsed-literal::
                 [[0 1 2]
                  [3 4 5]] x [2 3 4] = [11 38]
             For matrix-matrix multiplication, the same dimension-matching rules must
             be satisfied, e.g. consider the difference between :math:`A \times A^T`:
             In[51]:
             .. code:: python
                 print A.dot(A.T)
             .. parsed-literal::
                 [[ 5 14]
                  [14 50]]
             and :math:`A^T \times A`:
             In[52]:
             .. code:: python
                 print A.T.dot(A)
             .. parsed-literal::
                 [[ 9 12 15]
                  [12 17 22]
                  [15 22 29]]
             Furthermore, the ``numpy.linalg`` module includes additional
             functionality such as determinants, matrix norms, Cholesky, eigenvalue
             and singular value decompositions, etc. For even more linear algebra
             tools, ``scipy.linalg`` contains the majority of the tools in the
             classic LAPACK libraries as well as functions to operate on sparse
             matrices. We refer the reader to the Numpy and Scipy documentations for
             additional details on these.
             Reading and writing arrays to disk
             ----------------------------------
             Numpy lets you read and write arrays into files in a number of ways. In
             order to use these tools well, it is critical to understand the
             difference between a *text* and a *binary* file containing numerical
             data. In a text file, the number :math:`\pi` could be written as
             "3.141592653589793", for example: a string of digits that a human can
             read, with in this case 15 decimal digits. In contrast, that same number
             written to a binary file would be encoded as 8 characters (bytes) that
             are not readable by a human but which contain the exact same data that
             the variable ``pi`` had in the computer's memory.
             The tradeoffs between the two modes are thus:
             -  Text mode: occupies more space, precision can be lost (if not all
                digits are written to disk), but is readable and editable by hand
                with a text editor. Can *only* be used for one- and two-dimensional
                arrays.
             -  Binary mode: compact and exact representation of the data in memory,
                can't be read or edited by hand. Arrays of any size and
                dimensionality can be saved and read without loss of information.
             First, let's see how to read and write arrays in text mode. The
             ``np.savetxt`` function saves an array to a text file, with options to
             control the precision, separators and even adding a header:
             In[53]:
             .. code:: python
                 arr = np.arange(10).reshape(2, 5)
                 np.savetxt('test.out', arr, fmt='%.2e', header="My dataset")
                 !cat test.out
             .. parsed-literal::
                 # My dataset
                 0.00e+00 1.00e+00 2.00e+00 3.00e+00 4.00e+00
                 5.00e+00 6.00e+00 7.00e+00 8.00e+00 9.00e+00
             And this same type of file can then be read with the matching
             ``np.loadtxt`` function:
             In[54]:
             .. code:: python
                 arr2 = np.loadtxt('test.out')
                 print arr2
             .. parsed-literal::
                 [[ 0.  1.  2.  3.  4.]
                  [ 5.  6.  7.  8.  9.]]
             For binary data, Numpy provides the ``np.save`` and ``np.savez``
             routines. The first saves a single array to a file with ``.npy``
             extension, while the latter can be used to save a *group* of arrays into
             a single file with ``.npz`` extension. The files created with these
             routines can then be read with the ``np.load`` function.
             Let us first see how to use the simpler ``np.save`` function to save a
             single array:
             In[55]:
             .. code:: python
                 np.save('test.npy', arr2)
                 # Now we read this back
                 arr2n = np.load('test.npy')
                 # Let's see if any element is non-zero in the difference.
                 # A value of True would be a problem.
                 print 'Any differences?', np.any(arr2-arr2n)
             .. parsed-literal::
                 Any differences? False
             Now let us see how the ``np.savez`` function works. You give it a
             filename and either a sequence of arrays or a set of keywords. In the
             first mode, the function will automatically name the saved arrays in the
             archive as ``arr_0``, ``arr_1``, etc:
             In[56]:
             .. code:: python
                 np.savez('test.npz', arr, arr2)
                 arrays = np.load('test.npz')
                 arrays.files
             Out[56]:
             .. parsed-literal::
                 ['arr_1', 'arr_0']
             Alternatively, we can explicitly choose how to name the arrays we save:
             In[57]:
             .. code:: python
                 np.savez('test.npz', array1=arr, array2=arr2)
                 arrays = np.load('test.npz')
                 arrays.files
             Out[57]:
             .. parsed-literal::
                 ['array2', 'array1']
             The object returned by ``np.load`` from an ``.npz`` file works like a
             dictionary, though you can also access its constituent files by
             attribute using its special ``.f`` field; this is best illustrated with
             an example with the ``arrays`` object from above:
             In[58]:
             .. code:: python
                 print 'First row of first array:', arrays['array1'][0]
                 # This is an equivalent way to get the same field
                 print 'First row of first array:', arrays.f.array1[0]
             .. parsed-literal::
                 First row of first array: [0 1 2 3 4]
                 First row of first array: [0 1 2 3 4]
             This ``.npz`` format is a very convenient way to package compactly and
             without loss of information, into a single file, a group of related
             arrays that pertain to a specific problem. At some point, however, the
             complexity of your dataset may be such that the optimal approach is to
             use one of the standard formats in scientific data processing that have
             been designed to handle complex datasets, such as NetCDF or HDF5.
             Fortunately, there are tools for manipulating these formats in Python,
             and for storing data in other ways such as databases. A complete
             discussion of the possibilities is beyond the scope of this discussion,
             but of particular interest for scientific users we at least mention the
             following:
             -  The ``scipy.io`` module contains routines to read and write Matlab
                files in ``.mat`` format and files in the NetCDF format that is
                widely used in certain scientific disciplines.
             -  For manipulating files in the HDF5 format, there are two excellent
                options in Python: The PyTables project offers a high-level, object
                oriented approach to manipulating HDF5 datasets, while the h5py
                project offers a more direct mapping to the standard HDF5 library
                interface. Both are excellent tools; if you need to work with HDF5
                datasets you should read some of their documentation and examples and
                decide which approach is a better match for your needs.
             High quality data visualization with Matplotlib
             ===============================================
             The `matplotlib <http://matplotlib.sf.net>`_ library is a powerful tool
             capable of producing complex publication-quality figures with fine
             layout control in two and three dimensions; here we will only provide a
             minimal self-contained introduction to its usage that covers the
             functionality needed for the rest of the book. We encourage the reader
             to read the tutorials included with the matplotlib documentation as well
             as to browse its extensive gallery of examples that include source code.
             Just as we typically use the shorthand ``np`` for Numpy, we will use
             ``plt`` for the ``matplotlib.pyplot`` module where the easy-to-use
             plotting functions reside (the library contains a rich object-oriented
             architecture that we don't have the space to discuss here):
             In[59]:
             .. code:: python
                 import matplotlib.pyplot as plt
             The most frequently used function is simply called ``plot``, here is how
             you can make a simple plot of :math:`\sin(x)` for
             :math:`x \in [0, 2\pi]` with labels and a grid (we use the semicolon in
             the last line to suppress the display of some information that is
             unnecessary right now):
             In[60]:
             .. code:: python
                 x = np.linspace(0, 2*np.pi)
                 y = np.sin(x)
                 plt.plot(x,y, label='sin(x)')
                 plt.legend()
                 plt.grid()
                 plt.title('Harmonic')
                 plt.xlabel('x')
                 plt.ylabel('y');
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_01.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_01.svg
             You can control the style, color and other properties of the markers,
             for example:
             In[61]:
             .. code:: python
                 plt.plot(x, y, linewidth=2);
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_02.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_02.svg
             In[62]:
             .. code:: python
                 plt.plot(x, y, 'o', markersize=5, color='r');
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_03.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_03.svg
             We will now see how to create a few other common plot types, such as a
             simple error plot:
             In[63]:
             .. code:: python
                 # example data
                 x = np.arange(0.1, 4, 0.5)
                 y = np.exp(-x)
                 # example variable error bar values
                 yerr = 0.1 + 0.2*np.sqrt(x)
                 xerr = 0.1 + yerr
                 # First illustrate basic pyplot interface, using defaults where possible.
                 plt.figure()
                 plt.errorbar(x, y, xerr=0.2, yerr=0.4)
                 plt.title("Simplest errorbars, 0.2 in x, 0.4 in y");
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_04.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_04.svg
             A simple log plot
             In[64]:
             .. code:: python
                 x = np.linspace(-5, 5)
                 y = np.exp(-x**2)
                 plt.semilogy(x, y);
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_05.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_05.svg
             A histogram annotated with text inside the plot, using the ``text``
             function:
             In[65]:
             .. code:: python
                 mu, sigma = 100, 15
                 x = mu + sigma * np.random.randn(10000)
                 # the histogram of the data
                 n, bins, patches = plt.hist(x, 50, normed=1, facecolor='g', alpha=0.75)
                 plt.xlabel('Smarts')
                 plt.ylabel('Probability')
                 plt.title('Histogram of IQ')
                 # This will put a text fragment at the position given:
                 plt.text(55, .027, r'$\mu=100,\ \sigma=15$', fontsize=14)
                 plt.axis([40, 160, 0, 0.03])
                 plt.grid(True)
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_06.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_06.svg
             Image display
             -------------
             The ``imshow`` command can display single or multi-channel images. A
             simple array of random numbers, plotted in grayscale:
             In[66]:
             .. code:: python
                 from matplotlib import cm
                 plt.imshow(np.random.rand(5, 10), cmap=cm.gray, interpolation='nearest');
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_07.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_07.svg
             A real photograph is a multichannel image, ``imshow`` interprets it
             correctly:
             In[67]:
             .. code:: python
                 img = plt.imread('stinkbug.png')
                 print 'Dimensions of the array img:', img.shape
                 plt.imshow(img);
             .. parsed-literal::
                 Dimensions of the array img: (375, 500, 3)
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_08.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_08.svg
             Simple 3d plotting with matplotlib
             ----------------------------------
             Note that you must execute at least once in your session:
             In[68]:
             .. code:: python
                 from mpl_toolkits.mplot3d import Axes3D
             Once this has been done, you can create 3d axes with the
             ``projection='3d'`` keyword to ``add_subplot``:
             ::
                 fig = plt.figure()
                 fig.add_subplot(<other arguments here>, projection='3d')
             A simple surface plot:
             In[72]:
             .. code:: python
                 from mpl_toolkits.mplot3d.axes3d import Axes3D
                 from matplotlib import cm
                 fig = plt.figure()
                 ax = fig.add_subplot(1, 1, 1, projection='3d')
                 X = np.arange(-5, 5, 0.25)
                 Y = np.arange(-5, 5, 0.25)
                 X, Y = np.meshgrid(X, Y)
                 R = np.sqrt(X**2 + Y**2)
                 Z = np.sin(R)
                 surf = ax.plot_surface(X, Y, Z, rstride=1, cstride=1, cmap=cm.jet,
                         linewidth=0, antialiased=False)
                 ax.set_zlim3d(-1.01, 1.01);
-            .. image:: /Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_09.svg
+            .. image:: tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_09.svg
             IPython: a powerful interactive environment
             ===========================================
             A key component of the everyday workflow of most scientific computing
             environments is a good interactive environment, that is, a system in
             which you can execute small amounts of code and view the results
             immediately, combining both printing out data and opening graphical
             visualizations. All modern systems for scientific computing, commercial
             and open source, include such functionality.
             Out of the box, Python also offers a simple interactive shell with very
             limited capabilities. But just like the scientific community built Numpy
             to provide arrays suited for scientific work (since Python's lists
             aren't optimal for this task), it has also developed an interactive
             environment much more sophisticated than the built-in one. The `IPython
             project <http://ipython.org>`_ offers a set of tools to make productive
             use of the Python language, all the while working interactively and with
             immediate feedback on your results. The basic tools that IPython provides
             are:
             1. A powerful terminal shell, with many features designed to increase
                the fluidity and productivity of everyday scientific workflows,
                including:
                -  rich introspection of all objects and variables including easy
                   access to the source code of any function
                -  powerful and extensible tab completion of variables and filenames,
                -  tight integration with matplotlib, supporting interactive figures
                   that don't block the terminal,
                -  direct access to the filesystem and underlying operating system,
                -  an extensible system for shell-like commands called 'magics' that
                   reduce the work needed to perform many common tasks,
                -  tools for easily running, timing, profiling and debugging your
                   codes,
                -  syntax highlighted error messages with much more detail than the
                   default Python ones,
                -  logging and access to all previous history of inputs, including
                   across sessions
             2. A Qt console that provides the look and feel of a terminal, but adds
                support for inline figures, graphical calltips, a persistent session
                that can survive crashes (even segfaults) of the kernel process, and
                more.
             3. A web-based notebook that can execute code and also contain rich text
                and figures, mathematical equations and arbitrary HTML. This notebook
                presents a document-like view with cells where code is executed but
                that can be edited in-place, reordered, mixed with explanatory text
                and figures, etc.
             4. A high-performance, low-latency system for parallel computing that
                supports the control of a cluster of IPython engines communicating
                over a network, with optimizations that minimize unnecessary copying
                of large objects (especially numpy arrays).
             We will now discuss the highlights of the tools 1-3 above so that you
             can make them an effective part of your workflow. The topic of parallel
             computing is beyond the scope of this document, but we encourage you to
             read the extensive
             `documentation <http://ipython.org/ipython-doc/rel-0.12.1/parallel/index.html>`_
             and `tutorials <http://minrk.github.com/scipy-tutorial-2011/>`_ on this
             available on the IPython website.
             The IPython terminal
             --------------------
             You can start IPython at the terminal simply by typing:
             ::
                 $ ipython
             which will provide you some basic information about how to get started
             and will then open a prompt labeled ``In [1]:`` for you to start typing.
             Here we type :math:`2^{64}` and Python computes the result for us in
             exact arithmetic, returning it as ``Out[1]``:
             ::
                 $ ipython
                 Python 2.7.2+ (default, Oct  4 2011, 20:03:08)
                 Type "copyright", "credits" or "license" for more information.
                 IPython 0.13.dev -- An enhanced Interactive Python.
                 ?         -> Introduction and overview of IPython's features.
                 %quickref -> Quick reference.
                 help      -> Python's own help system.
                 object?   -> Details about 'object', use 'object??' for extra details.
                 In [1]: 2**64
                 Out[1]: 18446744073709551616L
             The first thing you should know about IPython is that all your inputs
             and outputs are saved. There are two variables named ``In`` and ``Out``
             which are filled as you work with your results. Furthermore, all outputs
             are also saved to auto-created variables of the form ``_NN`` where
             ``NN`` is the prompt number, and inputs to ``_iNN``. This allows you to
             recover quickly the result of a prior computation by referring to its
             number even if you forgot to store it as a variable. For example, later
             on in the above session you can do:
             ::
                 In [6]: print _1
                 18446744073709551616
             We strongly recommend that you take a few minutes to read at least the
             basic introduction provided by the ``?`` command, and keep in mind that
             the ``%quickref`` command at all times can be used as a quick reference
             "cheat sheet" of the most frequently used features of IPython.
             At the IPython prompt, any valid Python code that you type will be
             executed similarly to the default Python shell (though often with more
             informative feedback). But IPython is a *superset* of the default
             Python shell, so let's have a brief look at some of its additional
             functionality.
             **Object introspection**
             A simple ``?`` command provides a general introduction to IPython, but
             as indicated in the banner above, you can use the ``?`` syntax to ask
             for details about any object. For example, if we type ``_1?``, IPython
             will print the following details about this variable:
             ::
                 In [14]: _1?
                 Type:       long
                 Base Class: <type 'long'>
                 String Form:18446744073709551616
                 Namespace:  Interactive
                 Docstring:
                 long(x[, base]) -> integer
                 Convert a string or number to a long integer, if possible.  A floating
                 [etc... snipped for brevity]
             If you add a second ``?`` and for any object ``x`` type ``x??``,
             IPython will try to provide an even more detailed analysis of the
             object, including its syntax-highlighted source code when it can be
             found. It's possible that ``x??`` returns the same information as
             ``x?``, but in many cases ``x??`` will indeed provide additional
             details.
             Finally, the ``?`` syntax is also useful to search *namespaces* with
             wildcards. Suppose you are wondering if there is any function in Numpy
             that may do text-related things; with ``np.*txt*?``, IPython will print
             all the names in the ``np`` namespace (our Numpy shorthand) that have
             'txt' anywhere in their name:
             ::
                 In [17]: np.*txt*?
                 np.genfromtxt
                 np.loadtxt
                 np.mafromtxt
                 np.ndfromtxt
                 np.recfromtxt
                 np.savetxt
             **Tab completion**
             IPython makes the tab key work extra hard for you as a way to rapidly
             inspect objects and libraries. Whenever you have typed something at the
             prompt, by hitting the ``<tab>`` key IPython will try to complete the
             rest of the line. For this, IPython will analyze the text you had so far
             and try to search for Python data or files that may match the context
             you have already provided.
             For example, if you type ``np.load`` and hit the ``<tab>`` key, you'll see:
             ::
                 In [21]: np.load<TAB HERE>
                 np.load     np.loads    np.loadtxt
             so you can quickly find all the load-related functionality in numpy. Tab
             completion works even for function arguments, for example consider this
             function definition:
             ::
                 In [20]: def f(x, frobinate=False):
                    ....:     if frobinate:
                    ....:         return x**2
                    ....:
             If you now use the ``<tab>`` key after having typed 'fro' you'll get all
             valid Python completions, but those marked with ``=`` at the end are
             known to be keywords of your function:
             ::
                 In [21]: f(2, fro<TAB HERE>
                 frobinate=    frombuffer    fromfunction  frompyfunc    fromstring
                 from          fromfile      fromiter      fromregex     frozenset
             at this point you can add the ``b`` letter and hit ``<tab>`` once more,
             and IPython will finish the line for you:
             ::
                 In [21]: f(2, frobinate=
             As a beginner, simply get into the habit of using ``<tab>`` after most
             objects; it should quickly become second nature as you will see how
             it helps keep a fluid workflow and discover useful information. Later on
             you can also customize this behavior by writing your own completion
             code, if you so desire.
             **Matplotlib integration**
             One of the most useful features of IPython for scientists is its tight
             integration with matplotlib: at the terminal IPython lets you open
             matplotlib figures without blocking your typing (which is what happens
             if you try to do the same thing at the default Python shell), and in the
             Qt console and notebook you can even view your figures embedded in your
             workspace next to the code that created them.
             The matplotlib support can be either activated when you start IPython by
             passing the ``--pylab`` flag, or at any point later in your session by
             using the ``%pylab`` command. If you start IPython with ``--pylab``,
             you'll see something like this (note the extra message about pylab):
             ::
                 $ ipython --pylab
                 Python 2.7.2+ (default, Oct  4 2011, 20:03:08)
                 Type "copyright", "credits" or "license" for more information.
                 IPython 0.13.dev -- An enhanced Interactive Python.
                 ?         -> Introduction and overview of IPython's features.
                 %quickref -> Quick reference.
                 help      -> Python's own help system.
                 object?   -> Details about 'object', use 'object??' for extra details.
                 Welcome to pylab, a matplotlib-based Python environment [backend: Qt4Agg].
                 For more information, type 'help(pylab)'.
                 In [1]:
             Furthermore, IPython will import ``numpy`` with the ``np`` shorthand,
             ``matplotlib.pyplot`` as ``plt``, and it will also load all of the numpy
             and pyplot top-level names so that you can directly type something like:
             ::
                 In [1]: x = linspace(0, 2*pi, 200)
                 In [2]: plot(x, sin(x))
                 Out[2]: [<matplotlib.lines.Line2D at 0x9e7c16c>]
             instead of having to prefix each call with its full signature (as we
             have been doing in the examples thus far):
             ::
                 In [3]: x = np.linspace(0, 2*np.pi, 200)
                 In [4]: plt.plot(x, np.sin(x))
                 Out[4]: [<matplotlib.lines.Line2D at 0x9e900ac>]
             This shorthand notation can be a huge time-saver when working
             interactively (it's a few characters but you are likely to type them
             hundreds of times in a session). But we should note that as you develop
             persistent scripts and notebooks meant for reuse, it's best to get in
             the habit of using the longer notation (known as *fully qualified names*),
             as it's clearer where things come from and it makes for more robust,
             readable and maintainable code in the long run.
             **Access to the operating system and files**
             In IPython, you can type ``ls`` to see your files or ``cd`` to change
             directories, just like you would at a regular system prompt:
             ::
                 In [2]: cd tests
                 /home/fperez/ipython/nbconvert/tests
                 In [3]: ls test.*
                 test.aux  test.html  test.ipynb  test.log  test.out  test.pdf  test.rst  test.tex
             Furthermore, if you use the ``!`` at the beginning of a line, any
             commands you pass afterwards go directly to the operating system:
             ::
                 In [4]: !echo "Hello IPython"
                 Hello IPython
             IPython offers a useful twist in this feature: it will substitute in the
             command the value of any *Python* variable you may have if you prepend
             it with a ``$`` sign:
             ::
                 In [5]: message = 'IPython interpolates from Python to the shell'
                 In [6]: !echo $message
                 IPython interpolates from Python to the shell
             This feature can be extremely useful, as it lets you combine the power
             and clarity of Python for complex logic with the immediacy and
             familiarity of many shell commands. Additionally, if you start the line
             with *two* ``!!`` signs, the output of the command will be automatically
             captured as a list of lines, e.g.:
             ::
                 In [10]: !!ls test.*
                 Out[10]:
                 ['test.aux',
                  'test.html',
                  'test.ipynb',
                  'test.log',
                  'test.out',
                  'test.pdf',
                  'test.rst',
                  'test.tex']
             As explained above, you can now use this as the variable ``_10``. If you
             directly want to capture the output of a system command to a Python
             variable, you can use the syntax ``=!``:
             ::
                 In [11]: testfiles =! ls test.*
                 In [12]: print testfiles
                 ['test.aux', 'test.html', 'test.ipynb', 'test.log', 'test.out', 'test.pdf', 'test.rst', 'test.tex']
             Finally, the special ``%alias`` command lets you define names that are
             shorthands for system commands, so that you can type them without having
             to prefix them via ``!`` explicitly (for example, ``ls`` is an alias
             that has been predefined for you at startup).
             **Magic commands**
             IPython has a system for special commands, called 'magics', that let you
             control IPython itself and perform many common tasks with a more
             shell-like syntax: it uses spaces for delimiting arguments, flags can be
             set with dashes and all arguments are treated as strings, so no
             additional quoting is required. This kind of syntax is invalid in the
             Python language but very convenient for interactive typing (fewer
             parentheses, commas and quoting everywhere); IPython distinguishes the
             two by detecting lines that start with the ``%`` character.
             You can learn more about the magic system by simply typing ``%magic`` at
             the prompt, which will give you a short description plus the
             documentation on *all* available magics. If you want to see only a
             listing of existing magics, you can use ``%lsmagic``:
             ::
                 In [4]: lsmagic
                 Available magic functions:
                 %alias  %autocall  %autoindent  %automagic  %bookmark  %c  %cd  %colors  %config  %cpaste
                 %debug  %dhist  %dirs  %doctest_mode  %ds  %ed  %edit  %env  %gui  %hist  %history
                 %install_default_config  %install_ext  %install_profiles  %load_ext  %loadpy  %logoff  %logon
                 %logstart  %logstate  %logstop  %lsmagic  %macro  %magic  %notebook  %page  %paste  %pastebin
                 %pd  %pdb  %pdef  %pdoc  %pfile  %pinfo  %pinfo2  %pop  %popd  %pprint  %precision  %profile
                 %prun  %psearch  %psource  %pushd  %pwd  %pycat  %pylab  %quickref  %recall  %rehashx
                 %reload_ext  %rep  %rerun  %reset  %reset_selective  %run  %save  %sc  %stop  %store  %sx  %tb
                 %time  %timeit  %unalias  %unload_ext  %who  %who_ls  %whos  %xdel  %xmode
                 Automagic is ON, % prefix NOT needed for magic functions.
             Note how the example above omitted the explicit ``%`` marker and simply
             uses ``lsmagic``. As long as the 'automagic' feature is on (which it is
             by default), you can omit the ``%`` marker as long as there is no
             ambiguity with a Python variable of the same name.
             **Running your code**
             While it's easy to type a few lines of code in IPython, for any
             long-lived work you should keep your codes in Python scripts (or in
             IPython notebooks, see below). Consider that you have a script, in this
             case trivially simple for the sake of brevity, named ``simple.py``:
             ::
                 In [12]: !cat simple.py
                 import numpy as np
                 x = np.random.normal(size=100)
                 print 'First elment of x:', x[0]
             The typical workflow with IPython is to use the ``%run`` magic to
             execute your script (you can omit the .py extension if you want). When
             you run it, the script will execute just as if it had been run at the
             system prompt with ``python simple.py`` (though since modules don't get
             re-executed on new imports by Python, all system initialization is
             essentially free, which can have a significant run time impact in some
             cases):
             ::
                 In [13]: run simple
                 First elment of x: -1.55872256289
             Once it completes, all variables defined in it become available for you
             to use interactively:
             ::
                 In [14]: x.shape
                 Out[14]: (100,)
             This allows you to plot data, try out ideas, etc, in a
             ``%run``/interact/edit cycle that can be very productive. As you start
             understanding your problem better you can refine your script further,
             incrementally improving it based on the work you do at the IPython
             prompt. At any point you can use the ``%hist`` magic to print out your
             history without prompts, so that you can copy useful fragments back into
             the script.
             By default, ``%run`` executes scripts in a completely empty namespace,
             to better mimic how they would execute at the system prompt with plain
             Python. But if you use the ``-i`` flag, the script will also see your
             interactively defined variables. This lets you edit in a script larger
             amounts of code that still behave as if you had typed them at the
             IPython prompt.
             You can also get a summary of the time taken by your script with the
             ``-t`` flag; consider a different script ``randsvd.py`` that takes a bit
             longer to run:
             ::
                 In [21]: run -t randsvd.py
                 IPython CPU timings (estimated):
                   User   :       0.38 s.
                   System :       0.04 s.
                 Wall time:       0.34 s.
             ``User`` is the time spent by the computer executing your code, while
             ``System`` is the time the operating system had to work on your behalf,
             doing things like memory allocation that are needed by your code but
             that you didn't explicitly program and that happen inside the kernel.
             The ``Wall time`` is the time on a 'clock on the wall' between the start
             and end of your program.
             If ``Wall > User+System``, your code is most likely waiting idle for
             certain periods. That could be waiting for data to arrive from a remote
             source or perhaps because the operating system has to swap large amounts
             of virtual memory. If you know that your code doesn't explicitly wait
             for remote data to arrive, you should investigate further to identify
             possible ways of improving the performance profile.
             If you only want to time how long a single statement takes, you don't
             need to put it into a script as you can use the ``%timeit`` magic, which
             uses Python's ``timeit`` module to very carefully measure timing data;
             ``timeit`` can measure even short statements that execute extremely
             fast:
             ::
                 In [27]: %timeit a=1
                 10000000 loops, best of 3: 23 ns per loop
             and for code that runs longer, it automatically adjusts so the overall
             measurement doesn't take too long:
             ::
                 In [28]: %timeit np.linalg.svd(x)
                 1 loops, best of 3: 310 ms per loop
             The ``%run`` magic still has more options for debugging and profiling
             data; you should read its documentation for many useful details (as
             always, just type ``%run?``).
             The graphical Qt console
             ------------------------
             If you type at the system prompt (see the IPython website for
             installation details, as this requires some additional libraries):
             ::
                 $ ipython qtconsole
             instead of opening in a terminal as before, IPython will start a
             graphical console that at first sight appears just like a terminal, but
             which is in fact much more capable than a text-only terminal. This is a
             specialized terminal designed for interactive scientific work, and it
             supports full multi-line editing with color highlighting and graphical
             calltips for functions, it can keep multiple IPython sessions open
             simultaneously in tabs, and when scripts run it can display the figures
             inline directly in the work area.
             .. raw:: html
                <center>
             .. raw:: html
                </center>
             % This cell is for the pdflatex output only
             \begin{figure}[htbp]
             \centering
             \includegraphics[width=3in]{ipython_qtconsole2.png}
             \caption{The IPython Qt console: a lightweight terminal for scientific exploration, with code, results and graphics in a single environment.}
             \end{figure}
             The Qt console accepts the same ``--pylab`` startup flags as the
             terminal, but you can additionally supply the value ``--pylab inline``,
             which enables the support for inline graphics shown in the figure. This
             is ideal for keeping all the code and figures in the same session, given
             that the console can save the output of your entire session to HTML or
             PDF.
             Since the Qt console makes it far more convenient than the terminal to
             edit blocks of code with multiple lines, in this environment it's worth
             knowing about the ``%loadpy`` magic function. ``%loadpy`` takes a path
             to a local file or remote URL, fetches its contents, and puts it in the
             work area for you to further edit and execute. It can be an extremely
             fast and convenient way of loading code from local disk or remote
             examples from sites such as the `Matplotlib
             gallery <http://matplotlib.sourceforge.net/gallery.html>`_.
             Other than its enhanced capabilities for code and graphics, all of the
             features of IPython we've explained before remain functional in this
             graphical console.
             The IPython Notebook
             --------------------
             The third way to interact with IPython, in addition to the terminal and
             graphical Qt console, is a powerful web interface called the "IPython
             Notebook". If you run at the system console (you can omit the ``pylab``
             flags if you don't need plotting support):
             ::
                 $ ipython notebook --pylab inline
             IPython will start a process that runs a web server in your local
             machine and to which a web browser can connect. The Notebook is a
             workspace that lets you execute code in blocks called 'cells' and
             displays any results and figures, but which can also contain arbitrary
             text (including LaTeX-formatted mathematical expressions) and any rich
             media that a modern web browser is capable of displaying.
             .. raw:: html
                <center>
             .. raw:: html
                </center>
             % This cell is for the pdflatex output only
             \begin{figure}[htbp]
             \centering
             \includegraphics[width=3in]{ipython-notebook-specgram-2.png}
             \caption{The IPython Notebook: text, equations, code, results, graphics and other multimedia in an open format for scientific exploration and collaboration}
             \end{figure}
             In fact, this document was written as a Notebook, and only exported to
             LaTeX for printing. Inside of each cell, all the features of IPython
             that we have discussed before remain functional, since ultimately this
             web client is communicating with the same IPython code that runs in the
             terminal. But this interface is a much richer and more powerful
             environment for maintaining long-term "live and executable" scientific
             documents.
             Notebook environments have existed in commercial systems like
             Mathematica(TM) and Maple(TM) for a long time; in the open source world
             the `Sage <http://sagemath.org>`_ project blazed this particular trail
             starting in 2006, and now we bring all the features that have made
             IPython such a widely used tool to a Notebook model.
             Since the Notebook runs as a web application, it is possible to
             configure it for remote access, letting you run your computations on a
             persistent server close to your data, which you can then access remotely
             from any browser-equipped computer. We encourage you to read the
             extensive documentation provided by the IPython project for details on
             how to do this and many more features of the notebook.
             Finally, as we said earlier, IPython also has a high-level and easy to
             use set of libraries for parallel computing, that let you control
             (interactively if desired) not just one IPython but an entire cluster of
             'IPython engines'. Unfortunately a detailed discussion of these tools is
             beyond the scope of this text, but should you need to parallelize your
             analysis codes, a quick read of the tutorials and examples provided at
             the IPython site may prove fruitful.

tests/ipynbref/IntroNumPy.orig.tex

0 +10 -10

             %% This file was auto-generated by IPython, do NOT edit
             %% Conversion from the original notebook file:
             %% tests/ipynbref/IntroNumPy.orig.ipynb
             %%
             \documentclass[11pt,english]{article}
             %% This is the automatic preamble used by IPython.  Note that it does *not*
             %% include a documentclass declaration, that is added at runtime to the overall
             %% document.
             \usepackage{amsmath}
             \usepackage{amssymb}
             \usepackage{graphicx}
             \usepackage{ucs}
             \usepackage[utf8x]{inputenc}
             % needed for markdown enumerations to work
             \usepackage{enumerate}
             % Slightly bigger margins than the latex defaults
             \usepackage{geometry}
             \geometry{verbose,tmargin=3cm,bmargin=3cm,lmargin=2.5cm,rmargin=2.5cm}
             % Define a few colors for use in code, links and cell shading
             \usepackage{color}
             \definecolor{orange}{cmyk}{0,0.4,0.8,0.2}
             \definecolor{darkorange}{rgb}{.71,0.21,0.01}
             \definecolor{darkgreen}{rgb}{.12,.54,.11}
             \definecolor{myteal}{rgb}{.26, .44, .56}
             \definecolor{gray}{gray}{0.45}
             \definecolor{lightgray}{gray}{.95}
             \definecolor{mediumgray}{gray}{.8}
             \definecolor{inputbackground}{rgb}{.95, .95, .85}
             \definecolor{outputbackground}{rgb}{.95, .95, .95}
             \definecolor{traceback}{rgb}{1, .95, .95}
             % Framed environments for code cells (inputs, outputs, errors, ...).  The
             % various uses of \unskip (or not) at the end were fine-tuned by hand, so don't
             % randomly change them unless you're sure of the effect it will have.
             \usepackage{framed}
             % remove extraneous vertical space in boxes
             \setlength\fboxsep{0pt}
             % codecell is the whole input+output set of blocks that a Code cell can
             % generate.
             % TODO: unfortunately, it seems that using a framed codecell environment breaks
             % the ability of the frames inside of it to be broken across pages.  This
             % causes at least the problem of having lots of empty space at the bottom of
             % pages as new frames are moved to the next page, and if a single frame is too
             % long to fit on a page, will completely stop latex from compiling the
             % document.  So unless we figure out a solution to this, we'll have to instead
             % leave the codecell env. as empty.  I'm keeping the original codecell
             % definition here (a thin vertical bar) for reference, in case we find a
             % solution to the page break issue.
             %% \newenvironment{codecell}{%
             %%     \def\FrameCommand{\color{mediumgray} \vrule width 1pt \hspace{5pt}}%
             %%    \MakeFramed{\vspace{-0.5em}}}
             %%  {\unskip\endMakeFramed}
             % For now, make this a no-op...
             \newenvironment{codecell}{}
              \newenvironment{codeinput}{%
                \def\FrameCommand{\colorbox{inputbackground}}%
                \MakeFramed{\advance\hsize-\width \FrameRestore}}
              {\unskip\endMakeFramed}
             \newenvironment{codeoutput}{%
                \def\FrameCommand{\colorbox{outputbackground}}%
                \vspace{-1.4em}
                \MakeFramed{\advance\hsize-\width \FrameRestore}}
              {\unskip\medskip\endMakeFramed}
             \newenvironment{traceback}{%
                \def\FrameCommand{\colorbox{traceback}}%
                \MakeFramed{\advance\hsize-\width \FrameRestore}}
              {\endMakeFramed}
             % Use and configure listings package for nicely formatted code
             \usepackage{listingsutf8}
             \lstset{
               language=python,
               inputencoding=utf8x,
               extendedchars=\true,
               aboveskip=\smallskipamount,
               belowskip=\smallskipamount,
               xleftmargin=2mm,
               breaklines=true,
               basicstyle=\small \ttfamily,
               showstringspaces=false,
               keywordstyle=\color{blue}\bfseries,
               commentstyle=\color{myteal},
               stringstyle=\color{darkgreen},
               identifierstyle=\color{darkorange},
               columns=fullflexible,  % tighter character kerning, like verb
             }
             % The hyperref package gives us a pdf with properly built
             % internal navigation ('pdf bookmarks' for the table of contents,
             % internal cross-reference links, web links for URLs, etc.)
             \usepackage{hyperref}
             \hypersetup{
               breaklinks=true,  % so long urls are correctly broken across lines
               colorlinks=true,
               urlcolor=blue,
               linkcolor=darkorange,
               citecolor=darkgreen,
               }
             % hardcode size of all verbatim environments to be a bit smaller
             \makeatletter
             \g@addto@macro\@verbatim\small\topsep=0.5em\partopsep=0pt
             \makeatother
             % Prevent overflowing lines due to urls and other hard-to-break entities.
             \sloppy
             \begin{document}
             \section{An Introduction to the Scientific Python Ecosystem}
             While the Python language is an excellent tool for general-purpose
             programming, with a highly readable syntax, rich and powerful data types
             (strings, lists, sets, dictionaries, arbitrary length integers, etc) and
             a very comprehensive standard library, it was not designed specifically
             for mathematical and scientific computing. Neither the language nor its
             standard library have facilities for the efficient representation of
             multidimensional datasets, tools for linear algebra and general matrix
             manipulations (an essential building block of virtually all technical
             computing), nor any data visualization facilities.
             In particular, Python lists are very flexible containers that can be
             nested arbitrarily deep and which can hold any Python object in them,
             but they are poorly suited to represent efficiently common mathematical
             constructs like vectors and matrices. In contrast, much of our modern
             heritage of scientific computing has been built on top of libraries
             written in the Fortran language, which has native support for vectors
             and matrices as well as a library of mathematical functions that can
             efficiently operate on entire arrays at once.
             \subsection{Scientific Python: a collaboration of projects built by scientists}
             The scientific community has developed a set of related Python libraries
             that provide powerful array facilities, linear algebra, numerical
             algorithms, data visualization and more. In this appendix, we will
             briefly outline the tools most frequently used for this purpose, that
             make ``Scientific Python'' something far more powerful than the Python
             language alone.
             For reasons of space, we can only describe in some detail the central
             Numpy library, but below we provide links to the websites of each
             project where you can read their documentation in more detail.
             First, let's look at an overview of the basic tools that most scientists
             use in daily research with Python. The core of this ecosystem is
             composed of:
             \begin{itemize}
             \item
               Numpy: the basic library that most others depend on, it provides a
               powerful array type that can represent multidimensional datasets of
               many different kinds and that supports arithmetic operations. Numpy
               also provides a library of common mathematical functions, basic linear
               algebra, random number generation and Fast Fourier Transforms. Numpy
               can be found at \href{http://numpy.scipy.org}{numpy.scipy.org}.
             \item
               Scipy: a large collection of numerical algorithms that operate on
               numpy arrays and provide facilities for many common tasks in
               scientific computing, including dense and sparse linear algebra
               support, optimization, special functions, statistics, n-dimensional
               image processing, signal processing and more. Scipy can be found at
               \href{http://scipy.org}{scipy.org}.
             \item
               Matplotlib: a data visualization library with a strong focus on
               producing high-quality output, it supports a variety of common
               scientific plot types in two and three dimensions, with precise
               control over the final output and format for publication-quality
               results. Matplotlib can also be controlled interactively allowing
               graphical manipulation of your data (zooming, panning, etc) and can be
               used with most modern user interface toolkits. It can be found at
               \href{http://matplotlib.sf.net}{matplotlib.sf.net}.
             \item
               IPython: while not strictly scientific in nature, IPython is the
               interactive environment in which many scientists spend their time.
               IPython provides a powerful Python shell that integrates tightly with
               Matplotlib and with easy access to the files and operating system, and
               which can execute in a terminal or in a graphical Qt console. IPython
               also has a web-based notebook interface that can combine code with
               text, mathematical expressions, figures and multimedia. It can be
               found at \href{http://ipython.org}{ipython.org}.
             \end{itemize}
             While each of these tools can be installed separately, in our opinion
             the most convenient way today of accessing them (especially on Windows
             and Mac computers) is to install the
             \href{http://www.enthought.com/products/epd\_free.php}{Free Edition of
             the Enthought Python Distribution} which contains all the above. Other
             free alternatives on Windows (but not on Macs) are
             \href{http://code.google.com/p/pythonxy}{Python(x,y)} and
             \href{http://www.lfd.uci.edu/~gohlke/pythonlibs}{Christoph Gohlke's
             packages page}.
             These four `core' libraries are in practice complemented by a number of
             other tools for more specialized work. We will briefly list here the
             ones that we think are the most commonly needed:
             \begin{itemize}
             \item
               Sympy: a symbolic manipulation tool that turns a Python session into a
               computer algebra system. It integrates with the IPython notebook,
               rendering results in properly typeset mathematical notation.
               \href{http://sympy.org}{sympy.org}.
             \item
               Mayavi: sophisticated 3d data visualization;
               \href{http://code.enthought.com/projects/mayavi}{code.enthought.com/projects/mayavi}.
             \item
               Cython: a bridge language between Python and C, useful both to
               optimize performance bottlenecks in Python and to access C libraries
               directly; \href{http://cython.org}{cython.org}.
             \item
               Pandas: high-performance data structures and data analysis tools, with
               powerful data alignment and structural manipulation capabilities;
               \href{http://pandas.pydata.org}{pandas.pydata.org}.
             \item
               Statsmodels: statistical data exploration and model estimation;
               \href{http://statsmodels.sourceforge.net}{statsmodels.sourceforge.net}.
             \item
               Scikit-learn: general purpose machine learning algorithms with a
               common interface; \href{http://scikit-learn.org}{scikit-learn.org}.
             \item
               Scikits-image: image processing toolbox;
               \href{http://scikits-image.org}{scikits-image.org}.
             \item
               NetworkX: analysis of complex networks (in the graph theoretical
               sense); \href{http://networkx.lanl.gov}{networkx.lanl.gov}.
             \item
               PyTables: management of hierarchical datasets using the
               industry-standard HDF5 format;
               \href{http://www.pytables.org}{www.pytables.org}.
             \end{itemize}
             Beyond these, for any specific problem you should look on the internet
             first, before starting to write code from scratch. There's a good chance
             that someone, somewhere, has written an open source library that you can
             use for part or all of your problem.
             \subsection{A note about the examples below}
             In all subsequent examples, you will see blocks of input code, followed
             by the results of the code if the code generated output. This output may
             include text, graphics and other result objects. These blocks of input
             can be pasted into your interactive IPython session or notebook for you
             to execute. In the print version of this document, a thin vertical bar
             on the left of the blocks of input and output shows which blocks go
             together.
             If you are reading this text as an actual IPython notebook, you can
             press \texttt{Shift-Enter} or use the `play' button on the toolbar
             (right-pointing triangle) to execute each block of code, known as a
             `cell' in IPython:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             # This is a block of code, below you'll see its output
             print "Welcome to the world of scientific computing with Python!"
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             Welcome to the world of scientific computing with Python!
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \section{Motivation: the trapezoidal rule}
             In subsequent sections we'll provide a basic introduction to the nuts
             and bolts of the basic scientific python tools; but we'll first motivate
             it with a brief example that illustrates what you can do in a few lines
             with these tools. For this, we will use the simple problem of
             approximating a definite integral with the trapezoid rule:
             \[
             \int_{a}^{b} f(x)\, dx \approx \frac{1}{2} \sum_{k=1}^{N} \left( x_{k} - x_{k-1} \right) \left( f(x_{k}) + f(x_{k-1}) \right).
             \]
             Our task will be to compute this formula for a function such as:
             \[
             f(x) = (x-3)(x-5)(x-7)+85
             \]
             integrated between $a=1$ and $b=9$.
             First, we define the function and sample it evenly between 0 and 10 at
             200 points:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             def f(x):
                 return (x-3)*(x-5)*(x-7)+85
             import numpy as np
             x = np.linspace(0, 10, 200)
             y = f(x)
             \end{lstlisting}
             \end{codeinput}
             \end{codecell}
             We select $a$ and $b$, our integration limits, and we take only a few
             points in that region to illustrate the error behavior of the trapezoid
             approximation:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             a, b = 1, 9
             xint = x[logical_and(x>=a, x<=b)][::30]
             yint = y[logical_and(x>=a, x<=b)][::30]
             \end{lstlisting}
             \end{codeinput}
             \end{codecell}
             Let's plot both the function and the area below it in the trapezoid
             approximation:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             import matplotlib.pyplot as plt
             plt.plot(x, y, lw=2)
             plt.axis([0, 10, 0, 140])
             plt.fill_between(xint, 0, yint, facecolor='gray', alpha=0.4)
             plt.text(0.5 * (a + b), 30,r"$\int_a^b f(x)dx$", horizontalalignment='center', fontsize=20);
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_00.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_00.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             Compute the integral both at high accuracy and with the trapezoid
             approximation
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             from scipy.integrate import quad, trapz
             integral, error = quad(f, 1, 9)
             trap_integral = trapz(yint, xint)
             print "The integral is: %g +/- %.1e" % (integral, error)
             print "The trapezoid approximation with", len(xint), "points is:", trap_integral
             print "The absolute error is:", abs(integral - trap_integral)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             The integral is: 680 +/- 7.5e-12
             The trapezoid approximation with 6 points is: 621.286411141
             The absolute error is: 58.7135888589
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             This simple example showed us how, combining the numpy, scipy and
             matplotlib libraries we can provide an illustration of a standard method
             in elementary calculus with just a few lines of code. We will now
             discuss with more detail the basic usage of these tools.
             \section{NumPy arrays: the right data structure for scientific computing}
             \subsection{Basics of Numpy arrays}
             We now turn our attention to the Numpy library, which forms the base
             layer for the entire `scipy ecosystem'. Once you have installed numpy,
             you can import it as
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             import numpy
             \end{lstlisting}
             \end{codeinput}
             \end{codecell}
             though in this book we will use the common shorthand
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             import numpy as np
             \end{lstlisting}
             \end{codeinput}
             \end{codecell}
             As mentioned above, the main object provided by numpy is a powerful
             array. We'll start by exploring how the numpy array differs from Python
             lists. We start by creating a simple list and an array with the same
             contents of the list:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             lst = [10, 20, 30, 40]
             arr = np.array([10, 20, 30, 40])
             \end{lstlisting}
             \end{codeinput}
             \end{codecell}
             Elements of a one-dimensional array are accessed with the same syntax as
             a list:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             lst[0]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             10
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr[0]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             10
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr[-1]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             40
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr[2:]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([30, 40])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             The first difference to note between lists and arrays is that arrays are
             \emph{homogeneous}; i.e.~all elements of an array must be of the same
             type. In contrast, lists can contain elements of arbitrary type. For
             example, we can change the last element in our list above to be a
             string:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             lst[-1] = 'a string inside a list'
             lst
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [10, 20, 30, 'a string inside a list']
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             but the same can not be done with an array, as we get an error message:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr[-1] = 'a string inside an array'
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{traceback}
             \begin{verbatim}
             ---------------------------------------------------------------------------
             ValueError                                Traceback (most recent call last)
             /home/fperez/teach/book-math-labtool/<ipython-input-13-29c0bfa5fa8a> in <module>()
             ----> 1 arr[-1] = 'a string inside an array'
             ValueError: invalid literal for long() with base 10: 'a string inside an array'
             \end{verbatim}
             \end{traceback}
             \end{codeoutput}
             \end{codecell}
             The information about the type of an array is contained in its
             \emph{dtype} attribute:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr.dtype
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             dtype('int32')
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Once an array has been created, its dtype is fixed and it can only store
             elements of the same type. For this example where the dtype is integer,
             if we store a floating point number it will be automatically converted
             into an integer:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr[-1] = 1.234
             arr
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([10, 20, 30,  1])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Above we created an array from an existing list; let us now see
             other ways in which we can create arrays, which we'll illustrate next. A
             common need is to have an array initialized with a constant value, and
             very often this value is 0 or 1 (suitable as starting value for additive
             and multiplicative loops respectively); \texttt{zeros} creates arrays of
             all zeros, with any desired dtype:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.zeros(5, float)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([ 0.,  0.,  0.,  0.,  0.])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.zeros(3, int)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([0, 0, 0])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.zeros(3, complex)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([ 0.+0.j,  0.+0.j,  0.+0.j])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             and similarly for \texttt{ones}:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print '5 ones:', np.ones(5)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             5 ones: [ 1.  1.  1.  1.  1.]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             If we want an array initialized with an arbitrary value, we can create
             an empty array and then use the fill method to put the value we want
             into the array:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             a = empty(4)
             a.fill(5.5)
             a
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([ 5.5,  5.5,  5.5,  5.5])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Numpy also offers the \texttt{arange} function, which works like the
             builtin \texttt{range} but returns an array instead of a list:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.arange(5)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([0, 1, 2, 3, 4])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             and the \texttt{linspace} and \texttt{logspace} functions to create
             linearly and logarithmically-spaced grids respectively, with a fixed
             number of points and including both ends of the specified interval:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print "A linear grid between 0 and 1:", np.linspace(0, 1, 5)
             print "A logarithmic grid between 10**1 and 10**4: ", np.logspace(1, 4, 4)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             A linear grid between 0 and 1: [ 0.    0.25  0.5   0.75  1.  ]
             A logarithmic grid between 10**1 and 10**4:  [    10.    100.   1000.  10000.]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Finally, it is often useful to create arrays with random numbers that
             follow a specific distribution. The \texttt{np.random} module contains a
             number of functions that can be used to this effect, for example this
             will produce an array of 5 random samples taken from a standard normal
             distribution (0 mean and variance 1):
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.random.randn(5)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([-0.08633343, -0.67375434,  1.00589536,  0.87081651,  1.65597822])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             whereas this will also give 5 samples, but from a normal distribution
             with a mean of 10 and a standard deviation of 3:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             norm10 = np.random.normal(10, 3, 5)
             norm10
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([  8.94879575,   5.53038269,   8.24847281,  12.14944165,  11.56209294])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \subsection{Indexing with other arrays}
             Above we saw how to index arrays with single numbers and slices, just
             like Python lists. But arrays allow for a more sophisticated kind of
             indexing which is very powerful: you can index an array with another
             array, and in particular with an array of boolean values. This is
             particularly useful to extract information from an array that matches a
             certain condition.
             Consider for example that in the array \texttt{norm10} we want to
             replace all values above 9 with the value 0. We can do so by first
             finding the \emph{mask} that indicates where this condition is true or
             false:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             mask = norm10 > 9
             mask
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([False, False, False,  True,  True], dtype=bool)
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Now that we have this mask, we can use it to either read those values or
             to reset them to 0:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print 'Values above 9:', norm10[mask]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             Values above 9: [ 12.14944165  11.56209294]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print 'Resetting all values above 9 to 0...'
             norm10[mask] = 0
             print norm10
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             Resetting all values above 9 to 0...
             [ 8.94879575  5.53038269  8.24847281  0.          0.        ]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \subsection{Arrays with more than one dimension}
             Up until now all our examples have used one-dimensional arrays. But
             Numpy can create arrays of arbitrary dimensions, and all the methods
             illustrated in the previous section work with more than one dimension.
             For example, a list of lists can be used to initialize a two dimensional
             array:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             lst2 = [[1, 2], [3, 4]]
             arr2 = np.array([[1, 2], [3, 4]])
             arr2
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([[1, 2],
                    [3, 4]])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             With two-dimensional arrays we start seeing the power of numpy: while a
             nested list can be indexed using repeatedly the \texttt{{[} {]}}
             operator, multidimensional arrays support a much more natural indexing
             syntax with a single \texttt{{[} {]}} and a set of indices separated by
             commas:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print lst2[0][1]
             print arr2[0,1]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             2
             2
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Most of the array creation functions listed above can be used with more
             than one dimension, for example:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.zeros((2,3))
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([[ 0.,  0.,  0.],
                    [ 0.,  0.,  0.]])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.random.normal(10, 3, (2, 4))
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([[ 11.26788826,   4.29619866,  11.09346496,   9.73861307],
                    [ 10.54025996,   9.5146268 ,  10.80367214,  13.62204505]])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             In fact, the shape of an array can be changed at any time, as long as
             the total number of elements is unchanged. For example, if we want a 2x4
             array with numbers increasing from 0, the easiest way to create it is:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr = np.arange(8).reshape(2,4)
             print arr
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [[0 1 2 3]
              [4 5 6 7]]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             With multidimensional arrays, you can also use slices, and you can mix
             and match slices and single indices in the different dimensions (using
             the same array as above):
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print 'Slicing in the second row:', arr[1, 2:4]
             print 'All rows, third column   :', arr[:, 2]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             Slicing in the second row: [6 7]
             All rows, third column   : [2 6]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             If you only provide one index, then you will get an array with one less
             dimension containing that row:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print 'First row:  ', arr[0]
             print 'Second row: ', arr[1]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             First row:   [0 1 2 3]
             Second row:  [4 5 6 7]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Now that we have seen how to create arrays with more than one dimension,
             it's a good idea to look at some of the most useful properties and
             methods that arrays have. The following provide basic information about
             the size, shape and data in the array:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print 'Data type                :', arr.dtype
             print 'Total number of elements :', arr.size
             print 'Number of dimensions     :', arr.ndim
             print 'Shape (dimensionality)   :', arr.shape
             print 'Memory used (in bytes)   :', arr.nbytes
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             Data type                : int32
             Total number of elements : 8
             Number of dimensions     : 2
             Shape (dimensionality)   : (2, 4)
             Memory used (in bytes)   : 32
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Arrays also have many useful methods, some especially useful ones are:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print 'Minimum and maximum             :', arr.min(), arr.max()
             print 'Sum and product of all elements :', arr.sum(), arr.prod()
             print 'Mean and standard deviation     :', arr.mean(), arr.std()
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             Minimum and maximum             : 0 7
             Sum and product of all elements : 28 0
             Mean and standard deviation     : 3.5 2.29128784748
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             For these methods, the above operations are all computed on all the
             elements of the array. But for a multidimensional array, it's possible
             to do the computation along a single dimension, by passing the
             \texttt{axis} parameter; for example:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print 'For the following array:\n', arr
             print 'The sum of elements along the rows is    :', arr.sum(axis=1)
             print 'The sum of elements along the columns is :', arr.sum(axis=0)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             For the following array:
             [[0 1 2 3]
              [4 5 6 7]]
             The sum of elements along the rows is    : [ 6 22]
             The sum of elements along the columns is : [ 4  6  8 10]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             As you can see in this example, the value of the \texttt{axis} parameter
             is the dimension which will be \emph{consumed} once the operation has
             been carried out. This is why to sum along the rows we use
             \texttt{axis=1}: the second dimension (of length 4) is consumed,
             leaving one sum per row.
             This can be easily illustrated with an example that has more dimensions;
             we create an array with 4 dimensions and shape \texttt{(3,4,5,6)} and
             sum along the axis number 2 (i.e.~the \emph{third} axis, since in Python
             all counts are 0-based). That consumes the dimension whose length was 5,
             leaving us with a new array that has shape \texttt{(3,4,6)}:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.zeros((3,4,5,6)).sum(2).shape
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             (3, 4, 6)
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Another widely used property of arrays is the \texttt{.T} attribute,
             which allows you to access the transpose of the array:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print 'Array:\n', arr
             print 'Transpose:\n', arr.T
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             Array:
             [[0 1 2 3]
              [4 5 6 7]]
             Transpose:
             [[0 4]
              [1 5]
              [2 6]
              [3 7]]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             We don't have time here to look at all the methods and properties of
             arrays, but here's a complete list. Simply try exploring some of these
             in IPython to learn more, or read their description in the full Numpy
             documentation:
             \begin{verbatim}
             arr.T             arr.copy          arr.getfield      arr.put           arr.squeeze
             arr.all           arr.ctypes        arr.imag          arr.ravel         arr.std
             arr.any           arr.cumprod       arr.item          arr.real          arr.strides
             arr.argmax        arr.cumsum        arr.itemset       arr.repeat        arr.sum
             arr.argmin        arr.data          arr.itemsize      arr.reshape       arr.swapaxes
             arr.argsort       arr.diagonal      arr.max           arr.resize        arr.take
             arr.astype        arr.dot           arr.mean          arr.round         arr.tofile
             arr.base          arr.dtype         arr.min           arr.searchsorted  arr.tolist
             arr.byteswap      arr.dump          arr.nbytes        arr.setasflat     arr.tostring
             arr.choose        arr.dumps         arr.ndim          arr.setfield      arr.trace
             arr.clip          arr.fill          arr.newbyteorder  arr.setflags      arr.transpose
             arr.compress      arr.flags         arr.nonzero       arr.shape         arr.var
             arr.conj          arr.flat          arr.prod          arr.size          arr.view
             arr.conjugate     arr.flatten       arr.ptp           arr.sort
             \end{verbatim}
             \subsection{Operating with arrays}
             Arrays support all regular arithmetic operators, and the numpy library
             also contains a complete collection of basic mathematical functions that
             operate on arrays. It is important to remember that in general, all
             operations with arrays are applied \emph{element-wise}, i.e., are
             applied to all the elements of the array at the same time. Consider for
             example:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr1 = np.arange(4)
             arr2 = np.arange(10, 14)
             print arr1, '+', arr2, '=', arr1+arr2
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [0 1 2 3] + [10 11 12 13] = [10 12 14 16]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Importantly, you must remember that even the multiplication operator is
             by default applied element-wise, it is \emph{not} the matrix
             multiplication from linear algebra (as is the case in Matlab, for
             example):
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print arr1, '*', arr2, '=', arr1*arr2
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [0 1 2 3] * [10 11 12 13] = [ 0 11 24 39]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             While this means that in principle arrays must always match in their
             dimensionality in order for an operation to be valid, numpy will
             \emph{broadcast} dimensions when possible. For example, suppose that you
             want to add the number 1.5 to \texttt{arr1}; the following would be a
             valid way to do it:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr1 + 1.5*np.ones(4)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([ 1.5,  2.5,  3.5,  4.5])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             But thanks to numpy's broadcasting rules, the following is equally
             valid:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr1 + 1.5
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([ 1.5,  2.5,  3.5,  4.5])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             In this case, numpy looked at both operands and saw that the first
             (\texttt{arr1}) was a one-dimensional array of length 4 and the second
             was a scalar, considered a zero-dimensional object. The broadcasting
             rules allow numpy to:
             \begin{itemize}
             \item
               \emph{create} new dimensions of length 1 (since this doesn't change
               the size of the array)
             \item
               `stretch' a dimension of length 1 that needs to be matched to a
               dimension of a different size.
             \end{itemize}
             So in the above example, the scalar 1.5 is effectively:
             \begin{itemize}
             \item
               first `promoted' to a 1-dimensional array of length 1
             \item
               then, this array is `stretched' to length 4 to match the dimension of
               \texttt{arr1}.
             \end{itemize}
             After these two operations are complete, the addition can proceed as now
             both operands are one-dimensional arrays of length 4.
             This broadcasting behavior is in practice enormously powerful,
             especially because when numpy broadcasts to create new dimensions or to
             `stretch' existing ones, it doesn't actually replicate the data. In the
             example above the operation is carried out \emph{as if} the 1.5 was a 1-d
             array with 1.5 in all of its entries, but no actual array was ever
             created. This can save lots of memory in cases when the arrays in
             question are large and can have significant performance implications.
             The general rule is: when operating on two arrays, NumPy compares their
             shapes element-wise. It starts with the trailing dimensions, and works
             its way forward, creating dimensions of length 1 as needed. Two
             dimensions are considered compatible when
             \begin{itemize}
             \item
               they are equal to begin with, or
             \item
               one of them is 1; in this case numpy will do the `stretching' to make
               them equal.
             \end{itemize}
             If these conditions are not met, a
             \texttt{ValueError: operands could not be broadcast together} exception is thrown,
             indicating that the arrays have incompatible shapes. The size of the
             resulting array is the maximum size along each dimension of the input
             arrays.
             This shows how the broadcasting rules work in several dimensions:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             b = np.array([2, 3, 4, 5])
             print arr, '\n\n+', b , '\n----------------\n', arr + b
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [[0 1 2 3]
              [4 5 6 7]]
             + [2 3 4 5]
             ----------------
             [[ 2  4  6  8]
              [ 6  8 10 12]]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Now, how could you use broadcasting to, say, add \texttt{{[}4, 6{]}} along
             the rows to \texttt{arr} above? Simply performing the direct addition
             will produce the error we previously mentioned:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             c = np.array([4, 6])
             arr + c
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{traceback}
             \begin{verbatim}
             ---------------------------------------------------------------------------
             ValueError                                Traceback (most recent call last)
             /home/fperez/teach/book-math-labtool/<ipython-input-45-62aa20ac1980> in <module>()
                   1 c = np.array([4, 6])
             ----> 2 arr + c
             ValueError: operands could not be broadcast together with shapes (2,4) (2)
             \end{verbatim}
             \end{traceback}
             \end{codeoutput}
             \end{codecell}
             According to the rules above, the array \texttt{c} would need to have a
             \emph{trailing} dimension of 1 for the broadcasting to work. It turns
             out that numpy allows you to `inject' new dimensions anywhere into an
             array on the fly, by indexing it with the special object
             \texttt{np.newaxis}:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             (c[:, np.newaxis]).shape
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             (2, 1)
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             This is exactly what we need, and indeed it works:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr + c[:, np.newaxis]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             array([[ 4,  5,  6,  7],
                    [10, 11, 12, 13]])
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             For the full broadcasting rules, please see the official Numpy docs,
             which describe them in detail and with more complex examples.
             As we mentioned before, Numpy ships with a full complement of
             mathematical functions that work on entire arrays, including logarithms,
             exponentials, trigonometric and hyperbolic trigonometric functions, etc.
             Furthermore, scipy ships a rich special function library in the
             \texttt{scipy.special} module that includes Bessel, Airy, Fresnel,
             Laguerre and other classical special functions. For example, sampling
             the sine function at 100 points between $0$ and $2\pi$ is as simple as:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             x = np.linspace(0, 2*np.pi, 100)
             y = np.sin(x)
             \end{lstlisting}
             \end{codeinput}
             \end{codecell}
             \subsection{Linear algebra in numpy}
             Numpy ships with a basic linear algebra library, and all arrays have a
             \texttt{dot} method whose behavior is that of the scalar dot product
             when its arguments are vectors (one-dimensional arrays) and the
             traditional matrix multiplication when one or both of its arguments are
             two-dimensional arrays:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             v1 = np.array([2, 3, 4])
             v2 = np.array([1, 0, 1])
             print v1, '.', v2, '=', v1.dot(v2)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [2 3 4] . [1 0 1] = 6
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Here is a regular matrix-vector multiplication; note that the array
             \texttt{v1} should be viewed as a \emph{column} vector in traditional
             linear algebra notation; numpy makes no distinction between row and
             column vectors and simply verifies that the dimensions match the
             required rules of matrix multiplication, in this case we have a
             $2 \times 3$ matrix multiplied by a 3-vector, which produces a 2-vector:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             A = np.arange(6).reshape(2, 3)
             print A, 'x', v1, '=', A.dot(v1)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [[0 1 2]
              [3 4 5]] x [2 3 4] = [11 38]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             For matrix-matrix multiplication, the same dimension-matching rules must
             be satisfied, e.g.~consider the difference between $A \times A^T$:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print A.dot(A.T)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [[ 5 14]
              [14 50]]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             and $A^T \times A$:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print A.T.dot(A)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [[ 9 12 15]
              [12 17 22]
              [15 22 29]]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Furthermore, the \texttt{numpy.linalg} module includes additional
             functionality such as determinants, matrix norms, Cholesky, eigenvalue
             and singular value decompositions, etc. For even more linear algebra
             tools, \texttt{scipy.linalg} contains the majority of the tools in the
             classic LAPACK libraries as well as functions to operate on sparse
             matrices. We refer the reader to the Numpy and Scipy documentations for
             additional details on these.
             \subsection{Reading and writing arrays to disk}
             Numpy lets you read and write arrays into files in a number of ways. In
             order to use these tools well, it is critical to understand the
             difference between a \emph{text} and a \emph{binary} file containing
             numerical data. In a text file, the number $\pi$ could be written as
             ``3.141592653589793'', for example: a string of digits that a human can
             read, with in this case 15 decimal digits. In contrast, that same number
             written to a binary file would be encoded as 8 characters (bytes) that
             are not readable by a human but which contain the exact same data that
             the variable \texttt{pi} had in the computer's memory.
             The tradeoffs between the two modes are thus:
             \begin{itemize}
             \item
               Text mode: occupies more space, precision can be lost (if not all
               digits are written to disk), but is readable and editable by hand with
               a text editor. Can \emph{only} be used for one- and two-dimensional
               arrays.
             \item
               Binary mode: compact and exact representation of the data in memory,
               can't be read or edited by hand. Arrays of any size and dimensionality
               can be saved and read without loss of information.
             \end{itemize}
             First, let's see how to read and write arrays in text mode. The
             \texttt{np.savetxt} function saves an array to a text file, with options
             to control the precision, separators and even adding a header:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr = np.arange(10).reshape(2, 5)
             np.savetxt('test.out', arr, fmt='%.2e', header="My dataset")
             !cat test.out
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             # My dataset
             0.00e+00 1.00e+00 2.00e+00 3.00e+00 4.00e+00
             5.00e+00 6.00e+00 7.00e+00 8.00e+00 9.00e+00
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             And this same type of file can then be read with the matching
             \texttt{np.loadtxt} function:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             arr2 = np.loadtxt('test.out')
             print arr2
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             [[ 0.  1.  2.  3.  4.]
              [ 5.  6.  7.  8.  9.]]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             For binary data, Numpy provides the \texttt{np.save} and
             \texttt{np.savez} routines. The first saves a single array to a file
             with \texttt{.npy} extension, while the latter can be used to save a
             \emph{group} of arrays into a single file with \texttt{.npz} extension.
             The files created with these routines can then be read with the
             \texttt{np.load} function.
             Let us first see how to use the simpler \texttt{np.save} function to
             save a single array:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.save('test.npy', arr2)
             # Now we read this back
             arr2n = np.load('test.npy')
             # Let's see if any element is non-zero in the difference.
             # A value of True would be a problem.
             print 'Any differences?', np.any(arr2-arr2n)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             Any differences? False
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Now let us see how the \texttt{np.savez} function works. You give it a
             filename and either a sequence of arrays or a set of keywords. In the
             first mode, the function will automatically name the saved arrays in the
             archive as \texttt{arr\_0}, \texttt{arr\_1}, etc:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.savez('test.npz', arr, arr2)
             arrays = np.load('test.npz')
             arrays.files
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             ['arr_1', 'arr_0']
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             Alternatively, we can explicitly choose how to name the arrays we save:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             np.savez('test.npz', array1=arr, array2=arr2)
             arrays = np.load('test.npz')
             arrays.files
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             ['array2', 'array1']
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             The object returned by \texttt{np.load} from an \texttt{.npz} file works
             like a dictionary, though you can also access its constituent files by
             attribute using its special \texttt{.f} field; this is best illustrated
             with an example with the \texttt{arrays} object from above:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             print 'First row of first array:', arrays['array1'][0]
             # This is an equivalent way to get the same field
             print 'First row of first array:', arrays.f.array1[0]
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             First row of first array: [0 1 2 3 4]
             First row of first array: [0 1 2 3 4]
             \end{verbatim}
             \end{codeoutput}
             \end{codecell}
             This \texttt{.npz} format is a very convenient way to package compactly
             and without loss of information, into a single file, a group of related
             arrays that pertain to a specific problem. At some point, however, the
             complexity of your dataset may be such that the optimal approach is to
             use one of the standard formats in scientific data processing that have
             been designed to handle complex datasets, such as NetCDF or HDF5.
             Fortunately, there are tools for manipulating these formats in Python,
             and for storing data in other ways such as databases. A complete
             discussion of the possibilities is beyond the scope of this text,
             but of particular interest for scientific users we at least mention the
             following:
             \begin{itemize}
             \item
               The \texttt{scipy.io} module contains routines to read and write
               Matlab files in \texttt{.mat} format and files in the NetCDF format
               that is widely used in certain scientific disciplines.
             \item
               For manipulating files in the HDF5 format, there are two excellent
               options in Python: The PyTables project offers a high-level, object
               oriented approach to manipulating HDF5 datasets, while the h5py
               project offers a more direct mapping to the standard HDF5 library
               interface. Both are excellent tools; if you need to work with HDF5
               datasets you should read some of their documentation and examples and
               decide which approach is a better match for your needs.
             \end{itemize}
             \section{High quality data visualization with Matplotlib}
             The \href{http://matplotlib.sf.net}{matplotlib} library is a powerful
             tool capable of producing complex publication-quality figures with fine
             layout control in two and three dimensions; here we will only provide a
             minimal self-contained introduction to its usage that covers the
             functionality needed for the rest of the book. We encourage the reader
             to read the tutorials included with the matplotlib documentation as well
             as to browse its extensive gallery of examples that include source code.
             Just as we typically use the shorthand \texttt{np} for Numpy, we will
             use \texttt{plt} for the \texttt{matplotlib.pyplot} module where the
             easy-to-use plotting functions reside (the library contains a rich
             object-oriented architecture that we don't have the space to discuss
             here):
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             import matplotlib.pyplot as plt
             \end{lstlisting}
             \end{codeinput}
             \end{codecell}
             The most frequently used function is simply called \texttt{plot}; here
             is how you can make a simple plot of $\sin(x)$ for $x \in [0, 2\pi]$
             with labels and a grid (we use the semicolon in the last line to
             suppress the display of some information that is unnecessary right now):
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             x = np.linspace(0, 2*np.pi)
             y = np.sin(x)
             plt.plot(x,y, label='sin(x)')
             plt.legend()
             plt.grid()
             plt.title('Harmonic')
             plt.xlabel('x')
             plt.ylabel('y');
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_01.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_01.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             You can control the style, color and other properties of the markers,
             for example:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             plt.plot(x, y, linewidth=2);
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_02.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_02.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             plt.plot(x, y, 'o', markersize=5, color='r');
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_03.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_03.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             We will now see how to create a few other common plot types, such as a
             simple error plot:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             # example data
             x = np.arange(0.1, 4, 0.5)
             y = np.exp(-x)
             # example variable error bar values
             yerr = 0.1 + 0.2*np.sqrt(x)
             xerr = 0.1 + yerr
             # First illustrate basic pyplot interface, using defaults where possible.
             plt.figure()
             plt.errorbar(x, y, xerr=0.2, yerr=0.4)
             plt.title("Simplest errorbars, 0.2 in x, 0.4 in y");
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_04.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_04.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             A simple log plot:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             x = np.linspace(-5, 5)
             y = np.exp(-x**2)
             plt.semilogy(x, y);
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_05.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_05.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             A histogram annotated with text inside the plot, using the \texttt{text}
             function:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             mu, sigma = 100, 15
             x = mu + sigma * np.random.randn(10000)
             # the histogram of the data
             n, bins, patches = plt.hist(x, 50, normed=1, facecolor='g', alpha=0.75)
             plt.xlabel('Smarts')
             plt.ylabel('Probability')
             plt.title('Histogram of IQ')
             # This will put a text fragment at the position given:
             plt.text(55, .027, r'$\mu=100,\ \sigma=15$', fontsize=14)
             plt.axis([40, 160, 0, 0.03])
             plt.grid(True)
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_06.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_06.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             \subsection{Image display}
             The \texttt{imshow} command can display single or multi-channel images.
             A simple array of random numbers, plotted in grayscale:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             from matplotlib import cm
             plt.imshow(np.random.rand(5, 10), cmap=cm.gray, interpolation='nearest');
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_07.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_07.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             A real photograph is a multichannel image, \texttt{imshow} interprets it
             correctly:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             img = plt.imread('stinkbug.png')
             print 'Dimensions of the array img:', img.shape
             plt.imshow(img);
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{verbatim}
             Dimensions of the array img: (375, 500, 3)
             \end{verbatim}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_08.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_08.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             \subsection{Simple 3d plotting with matplotlib}
             Note that you must execute at least once in your session:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             from mpl_toolkits.mplot3d import Axes3D
             \end{lstlisting}
             \end{codeinput}
             \end{codecell}
             Once this has been done, you can create 3d axes with the
             \texttt{projection='3d'} keyword to \texttt{add\_subplot}:
             \begin{verbatim}
             fig = plt.figure()
             fig.add_subplot(<other arguments here>, projection='3d')
             \end{verbatim}
             A simple surface plot:
             \begin{codecell}
             \begin{codeinput}
             \begin{lstlisting}
             from mpl_toolkits.mplot3d.axes3d import Axes3D
             from matplotlib import cm
             fig = plt.figure()
             ax = fig.add_subplot(1, 1, 1, projection='3d')
             X = np.arange(-5, 5, 0.25)
             Y = np.arange(-5, 5, 0.25)
             X, Y = np.meshgrid(X, Y)
             R = np.sqrt(X**2 + Y**2)
             Z = np.sin(R)
             surf = ax.plot_surface(X, Y, Z, rstride=1, cstride=1, cmap=cm.jet,
                     linewidth=0, antialiased=False)
             ax.set_zlim3d(-1.01, 1.01);
             \end{lstlisting}
             \end{codeinput}
             \begin{codeoutput}
             \begin{center}
-            \includegraphics[width=6in]{/Users/bussonniermatthias/nbconvert/tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_09.pdf}
+            \includegraphics[width=6in]{tests/ipynbref/IntroNumPy.orig_files/IntroNumPy.orig_fig_09.pdf}
             \par
             \end{center}
             \end{codeoutput}
             \end{codecell}
             \section{IPython: a powerful interactive environment}
             A key component of the everyday workflow of most scientific computing
             environments is a good interactive environment, that is, a system in
             which you can execute small amounts of code and view the results
             immediately, combining both printing out data and opening graphical
             visualizations. All modern systems for scientific computing, commercial
             and open source, include such functionality.
             Out of the box, Python also offers a simple interactive shell with very
             limited capabilities. But just like the scientific community built Numpy
             to provide arrays suited for scientific work (since Python's lists
             aren't optimal for this task), it has also developed an interactive
             environment much more sophisticated than the built-in one. The
             \href{http://ipython.org}{IPython project} offers a set of tools to make
             productive use of the Python language, all the while working
             interactively and with immediate feedback on your results. The basic
             tools that IPython provides are:
             \begin{enumerate}[1.]
             \item
               A powerful terminal shell, with many features designed to increase the
               fluidity and productivity of everyday scientific workflows, including:
               \begin{itemize}
               \item
                 rich introspection of all objects and variables including easy
                 access to the source code of any function
               \item
                 powerful and extensible tab completion of variables and filenames,
               \item
                 tight integration with matplotlib, supporting interactive figures
                 that don't block the terminal,
               \item
                 direct access to the filesystem and underlying operating system,
               \item
                 an extensible system for shell-like commands called `magics' that
                 reduce the work needed to perform many common tasks,
               \item
                 tools for easily running, timing, profiling and debugging your
                 codes,
               \item
                 syntax highlighted error messages with much more detail than the
                 default Python ones,
               \item
                 logging and access to all previous history of inputs, including
                 across sessions
               \end{itemize}
             \item
               A Qt console that provides the look and feel of a terminal, but adds
               support for inline figures, graphical calltips, a persistent session
               that can survive crashes (even segfaults) of the kernel process, and
               more.
             \item
               A web-based notebook that can execute code and also contain rich text
               and figures, mathematical equations and arbitrary HTML. This notebook
               presents a document-like view with cells where code is executed but
               that can be edited in-place, reordered, mixed with explanatory text
               and figures, etc.
             \item
               A high-performance, low-latency system for parallel computing that
               supports the control of a cluster of IPython engines communicating
               over a network, with optimizations that minimize unnecessary copying
               of large objects (especially numpy arrays).
             \end{enumerate}
             We will now discuss the highlights of the tools 1-3 above so that you
             can make them an effective part of your workflow. The topic of parallel
             computing is beyond the scope of this document, but we encourage you to
             read the extensive
             \href{http://ipython.org/ipython-doc/rel-0.12.1/parallel/index.html}{documentation}
             and \href{http://minrk.github.com/scipy-tutorial-2011/}{tutorials} on
             this available on the IPython website.
             \subsection{The IPython terminal}
             You can start IPython at the terminal simply by typing:
             \begin{verbatim}
             $ ipython
             \end{verbatim}
             which will provide you some basic information about how to get started
             and will then open a prompt labeled \texttt{In {[}1{]}:} for you to
             start typing. Here we type $2^{64}$ and Python computes the result for
             us in exact arithmetic, returning it as \texttt{Out{[}1{]}}:
             \begin{verbatim}
             $ ipython
             Python 2.7.2+ (default, Oct  4 2011, 20:03:08)
             Type "copyright", "credits" or "license" for more information.
             IPython 0.13.dev -- An enhanced Interactive Python.
             ?         -> Introduction and overview of IPython's features.
             %quickref -> Quick reference.
             help      -> Python's own help system.
             object?   -> Details about 'object', use 'object??' for extra details.
             In [1]: 2**64
             Out[1]: 18446744073709551616L
             \end{verbatim}
             The first thing you should know about IPython is that all your inputs
             and outputs are saved. There are two variables named \texttt{In} and
             \texttt{Out} which are filled as you work with your results.
             Furthermore, all outputs are also saved to auto-created variables of the
             form \texttt{\_NN} where \texttt{NN} is the prompt number, and inputs to
             \texttt{\_iNN}. This allows you to recover quickly the result of a prior
             computation by referring to its number even if you forgot to store it as
             a variable. For example, later on in the above session you can do:
             \begin{verbatim}
             In [6]: print _1
             18446744073709551616
             \end{verbatim}
             We strongly recommend that you take a few minutes to read at least the
             basic introduction provided by the \texttt{?} command, and keep in mind
             that the \texttt{\%quickref} command at all times can be used as a quick
             reference ``cheat sheet'' of the most frequently used features of
             IPython.
             At the IPython prompt, any valid Python code that you type will be
             executed similarly to the default Python shell (though often with more
             informative feedback). But since IPython is a \emph{superset} of the
             default Python shell, let's have a brief look at some of its additional
             functionality.
             \textbf{Object introspection}
             A simple \texttt{?} command provides a general introduction to IPython,
             but as indicated in the banner above, you can use the \texttt{?} syntax
             to ask for details about any object. For example, if we type
             \texttt{\_1?}, IPython will print the following details about this
             variable:
             \begin{verbatim}
             In [14]: _1?
             Type:       long
             Base Class: <type 'long'>
             String Form:18446744073709551616
             Namespace:  Interactive
             Docstring:
             long(x[, base]) -> integer
             Convert a string or number to a long integer, if possible.  A floating
             [etc... snipped for brevity]
             \end{verbatim}
             If you add a second \texttt{?} and for any object \texttt{x} type
             \texttt{x??}, IPython will try to provide an even more detailed analysis
             of the object, including its syntax-highlighted source code when it can
             be found. It's possible that \texttt{x??} returns the same information
             as \texttt{x?}, but in many cases \texttt{x??} will indeed provide
             additional details.
             Finally, the \texttt{?} syntax is also useful to search
             \emph{namespaces} with wildcards. Suppose you are wondering if there is
             any function in Numpy that may do text-related things; with
             \texttt{np.*txt*?}, IPython will print all the names in the \texttt{np}
             namespace (our Numpy shorthand) that have `txt' anywhere in their name:
             \begin{verbatim}
             In [17]: np.*txt*?
             np.genfromtxt
             np.loadtxt
             np.mafromtxt
             np.ndfromtxt
             np.recfromtxt
             np.savetxt
             \end{verbatim}
             \textbf{Tab completion}
             IPython makes the tab key work extra hard for you as a way to rapidly
             inspect objects and libraries. Whenever you have typed something at the
             prompt, by hitting the \texttt{\textless{}tab\textgreater{}} key IPython
             will try to complete the rest of the line. For this, IPython will
             analyze the text you had so far and try to search for Python data or
             files that may match the context you have already provided.
             For example, if you type \texttt{np.load} and hit the key, you'll see:
             \begin{verbatim}
             In [21]: np.load<TAB HERE>
             np.load     np.loads    np.loadtxt
             \end{verbatim}
             so you can quickly find all the load-related functionality in numpy. Tab
             completion works even for function arguments, for example consider this
             function definition:
             \begin{verbatim}
             In [20]: def f(x, frobinate=False):
                ....:     if frobinate:
                ....:         return x**2
                ....:
             \end{verbatim}
             If you now use the \texttt{\textless{}tab\textgreater{}} key after
             having typed `fro' you'll get all valid Python completions, but those
             marked with \texttt{=} at the end are known to be keywords of your
             function:
             \begin{verbatim}
             In [21]: f(2, fro<TAB HERE>
             frobinate=    frombuffer    fromfunction  frompyfunc    fromstring
             from          fromfile      fromiter      fromregex     frozenset
             \end{verbatim}
             at this point you can add the \texttt{b} letter and hit
             \texttt{\textless{}tab\textgreater{}} once more, and IPython will finish
             the line for you:
             \begin{verbatim}
             In [21]: f(2, frobinate=
             \end{verbatim}
             As a beginner, simply get into the habit of using
             \texttt{\textless{}tab\textgreater{}} after most objects; it should
             quickly become second nature as you will see how it helps keep a fluid
             workflow and discover useful information. Later on you can also
             customize this behavior by writing your own completion code, if you so
             desire.
             \textbf{Matplotlib integration}
             One of the most useful features of IPython for scientists is its tight
             integration with matplotlib: at the terminal IPython lets you open
             matplotlib figures without blocking your typing (which is what happens
             if you try to do the same thing at the default Python shell), and in the
             Qt console and notebook you can even view your figures embedded in your
             workspace next to the code that created them.
             The matplotlib support can be either activated when you start IPython by
             passing the \texttt{-{}-pylab} flag, or at any point later in your
             session by using the \texttt{\%pylab} command. If you start IPython with
             \texttt{-{}-pylab}, you'll see something like this (note the extra
             message about pylab):
             \begin{verbatim}
             $ ipython --pylab
             Python 2.7.2+ (default, Oct  4 2011, 20:03:08)
             Type "copyright", "credits" or "license" for more information.
             IPython 0.13.dev -- An enhanced Interactive Python.
             ?         -> Introduction and overview of IPython's features.
             %quickref -> Quick reference.
             help      -> Python's own help system.
             object?   -> Details about 'object', use 'object??' for extra details.
             Welcome to pylab, a matplotlib-based Python environment [backend: Qt4Agg].
             For more information, type 'help(pylab)'.
             In [1]:
             \end{verbatim}
             Furthermore, IPython will import \texttt{numpy} with the \texttt{np}
             shorthand, \texttt{matplotlib.pyplot} as \texttt{plt}, and it will also
             load all of the numpy and pyplot top-level names so that you can
             directly type something like:
             \begin{verbatim}
             In [1]: x = linspace(0, 2*pi, 200)
             In [2]: plot(x, sin(x))
             Out[2]: [<matplotlib.lines.Line2D at 0x9e7c16c>]
             \end{verbatim}
             instead of having to prefix each call with its full signature (as we
             have been doing in the examples thus far):
             \begin{verbatim}
             In [3]: x = np.linspace(0, 2*np.pi, 200)
             In [4]: plt.plot(x, np.sin(x))
             Out[4]: [<matplotlib.lines.Line2D at 0x9e900ac>]
             \end{verbatim}
             This shorthand notation can be a huge time-saver when working
             interactively (it's a few characters but you are likely to type them
             hundreds of times in a session). But we should note that as you develop
             persistent scripts and notebooks meant for reuse, it's best to get in
             the habit of using the longer notation (known as \emph{fully qualified
             names}), as it's clearer where things come from and it makes for more
             robust, readable and maintainable code in the long run.
             \textbf{Access to the operating system and files}
             In IPython, you can type \texttt{ls} to see your files or \texttt{cd} to
             change directories, just like you would at a regular system prompt:
             \begin{verbatim}
             In [2]: cd tests
             /home/fperez/ipython/nbconvert/tests
             In [3]: ls test.*
             test.aux  test.html  test.ipynb  test.log  test.out  test.pdf  test.rst  test.tex
             \end{verbatim}
             Furthermore, if you use the \texttt{!} at the beginning of a line, any
             commands you pass afterwards go directly to the operating system:
             \begin{verbatim}
             In [4]: !echo "Hello IPython"
             Hello IPython
             \end{verbatim}
             IPython offers a useful twist in this feature: it will substitute in the
             command the value of any \emph{Python} variable you may have if you
             prepend it with a \texttt{\$} sign:
             \begin{verbatim}
             In [5]: message = 'IPython interpolates from Python to the shell'
             In [6]: !echo $message
             IPython interpolates from Python to the shell
             \end{verbatim}
             This feature can be extremely useful, as it lets you combine the power
             and clarity of Python for complex logic with the immediacy and
             familiarity of many shell commands. Additionally, if you start the line
             with \emph{two} exclamation marks (\texttt{!!}), the output of the command will be
             automatically captured as a list of lines, e.g.:
             \begin{verbatim}
             In [10]: !!ls test.*
             Out[10]:
             ['test.aux',
              'test.html',
              'test.ipynb',
              'test.log',
              'test.out',
              'test.pdf',
              'test.rst',
              'test.tex']
             \end{verbatim}
             As explained above, you can now use this as the variable \texttt{\_10}.
             If you directly want to capture the output of a system command to a
             Python variable, you can use the syntax \texttt{=!}:
             \begin{verbatim}
             In [11]: testfiles =! ls test.*
             In [12]: print testfiles
             ['test.aux', 'test.html', 'test.ipynb', 'test.log', 'test.out', 'test.pdf', 'test.rst', 'test.tex']
             \end{verbatim}
             Finally, the special \texttt{\%alias} command lets you define names that
             are shorthands for system commands, so that you can type them without
             having to prefix them via \texttt{!} explicitly (for example,
             \texttt{ls} is an alias that has been predefined for you at startup).
             \textbf{Magic commands}
             IPython has a system for special commands, called `magics', that let you
             control IPython itself and perform many common tasks with a more
             shell-like syntax: it uses spaces for delimiting arguments, flags can be
             set with dashes and all arguments are treated as strings, so no
             additional quoting is required. This kind of syntax is invalid in the
             Python language but very convenient for interactive typing (less
             parentheses, commas and quoting everywhere); IPython distinguishes the
             two by detecting lines that start with the \texttt{\%} character.
             You can learn more about the magic system by simply typing
             \texttt{\%magic} at the prompt, which will give you a short description
             plus the documentation on \emph{all} available magics. If you want to
             see only a listing of existing magics, you can use \texttt{\%lsmagic}:
             \begin{verbatim}
             In [4]: lsmagic
             Available magic functions:
             %alias  %autocall  %autoindent  %automagic  %bookmark  %c  %cd  %colors  %config  %cpaste
             %debug  %dhist  %dirs  %doctest_mode  %ds  %ed  %edit  %env  %gui  %hist  %history
             %install_default_config  %install_ext  %install_profiles  %load_ext  %loadpy  %logoff  %logon
             %logstart  %logstate  %logstop  %lsmagic  %macro  %magic  %notebook  %page  %paste  %pastebin
             %pd  %pdb  %pdef  %pdoc  %pfile  %pinfo  %pinfo2  %pop  %popd  %pprint  %precision  %profile
             %prun  %psearch  %psource  %pushd  %pwd  %pycat  %pylab  %quickref  %recall  %rehashx
             %reload_ext  %rep  %rerun  %reset  %reset_selective  %run  %save  %sc  %stop  %store  %sx  %tb
             %time  %timeit  %unalias  %unload_ext  %who  %who_ls  %whos  %xdel  %xmode
             Automagic is ON, % prefix NOT needed for magic functions.
             \end{verbatim}
             Note how the example above omitted the explicit \texttt{\%} marker and
             simply uses \texttt{lsmagic}. As long as the `automagic' feature is on
             (which it is by default), you can omit the \texttt{\%} marker as long as
             there is no ambiguity with a Python variable of the same name.
             \textbf{Running your code}
             While it's easy to type a few lines of code in IPython, for any
             long-lived work you should keep your codes in Python scripts (or in
             IPython notebooks, see below). Consider that you have a script, in this
             case trivially simple for the sake of brevity, named \texttt{simple.py}:
             \begin{verbatim}
             In [12]: !cat simple.py
             import numpy as np
             x = np.random.normal(size=100)
             print 'First elment of x:', x[0]
             \end{verbatim}
             The typical workflow with IPython is to use the \texttt{\%run} magic to
             execute your script (you can omit the .py extension if you want). When
             you run it, the script will execute just as if it had been run at the
             system prompt with \texttt{python simple.py} (though since modules don't
             get re-executed on new imports by Python, all system initialization is
             essentially free, which can have a significant run time impact in some
             cases):
             \begin{verbatim}
             In [13]: run simple
             First elment of x: -1.55872256289
             \end{verbatim}
             Once it completes, all variables defined in it become available for you
             to use interactively:
             \begin{verbatim}
             In [14]: x.shape
             Out[14]: (100,)
             \end{verbatim}
             This allows you to plot data, try out ideas, etc, in a
             \texttt{\%run}/interact/edit cycle that can be very productive. As you
             start understanding your problem better you can refine your script
             further, incrementally improving it based on the work you do at the
             IPython prompt. At any point you can use the \texttt{\%hist} magic to
             print out your history without prompts, so that you can copy useful
             fragments back into the script.
             By default, \texttt{\%run} executes scripts in a completely empty
             namespace, to better mimic how they would execute at the system prompt
             with plain Python. But if you use the \texttt{-i} flag, the script will
             also see your interactively defined variables. This lets you edit in a
             script larger amounts of code that still behave as if you had typed them
             at the IPython prompt.
             You can also get a summary of the time taken by your script with the
             \texttt{-t} flag; consider a different script \texttt{randsvd.py} that
             takes a bit longer to run:
             \begin{verbatim}
             In [21]: run -t randsvd.py
             IPython CPU timings (estimated):
               User   :       0.38 s.
               System :       0.04 s.
             Wall time:       0.34 s.
             \end{verbatim}
             \texttt{User} is the time spent by the computer executing your code,
             while \texttt{System} is the time the operating system had to work on
             your behalf, doing things like memory allocation that are needed by your
             code but that you didn't explicitly program and that happen inside the
             kernel. The \texttt{Wall time} is the time on a `clock on the wall'
             between the start and end of your program.
             If \texttt{Wall \textgreater{} User+System}, your code is most likely
             waiting idle for certain periods. That could be waiting for data to
             arrive from a remote source or perhaps because the operating system has
             to swap large amounts of virtual memory. If you know that your code
             doesn't explicitly wait for remote data to arrive, you should
             investigate further to identify possible ways of improving the
             performance profile.
             If you only want to time how long a single statement takes, you don't
             need to put it into a script as you can use the \texttt{\%timeit} magic,
             which uses Python's \texttt{timeit} module to very carefully measure
             timing data; \texttt{timeit} can measure even short statements that
             execute extremely fast:
             \begin{verbatim}
             In [27]: %timeit a=1
             10000000 loops, best of 3: 23 ns per loop
             \end{verbatim}
             and for code that runs longer, it automatically adjusts so the overall
             measurement doesn't take too long:
             \begin{verbatim}
             In [28]: %timeit np.linalg.svd(x)
             1 loops, best of 3: 310 ms per loop
             \end{verbatim}
             The \texttt{\%run} magic still has more options for debugging and
             profiling data; you should read its documentation for many useful
             details (as always, just type \texttt{\%run?}).
             \subsection{The graphical Qt console}
             If you type at the system prompt (see the IPython website for
             installation details, as this requires some additional libraries):
             \begin{verbatim}
             $ ipython qtconsole
             \end{verbatim}
             instead of opening in a terminal as before, IPython will start a
             graphical console that at first sight appears just like a terminal, but
             which is in fact much more capable than a text-only terminal. This is a
             specialized terminal designed for interactive scientific work, and it
             supports full multi-line editing with color highlighting and graphical
             calltips for functions, it can keep multiple IPython sessions open
             simultaneously in tabs, and when scripts run it can display the figures
             inline directly in the work area.
             % This cell is for the pdflatex output only
             \begin{figure}[htbp]
             \centering
             \includegraphics[width=3in]{ipython_qtconsole2.png}
             \caption{The IPython Qt console: a lightweight terminal for scientific exploration, with code, results and graphics in a single environment.}
             \end{figure}
             The Qt console accepts the same \texttt{-{}-pylab} startup flags as the
             terminal, but you can additionally supply the value
             \texttt{-{}-pylab inline}, which enables the support for inline graphics
             shown in the figure. This is ideal for keeping all the code and figures
             in the same session, given that the console can save the output of your
             entire session to HTML or PDF.
             Since the Qt console makes it far more convenient than the terminal to
             edit blocks of code with multiple lines, in this environment it's worth
             knowing about the \texttt{\%loadpy} magic function. \texttt{\%loadpy}
             takes a path to a local file or remote URL, fetches its contents, and
             puts it in the work area for you to further edit and execute. It can be
             an extremely fast and convenient way of loading code from local disk or
             remote examples from sites such as the
             \href{http://matplotlib.sourceforge.net/gallery.html}{Matplotlib
             gallery}.
             Other than its enhanced capabilities for code and graphics, all of the
             features of IPython we've explained before remain functional in this
             graphical console.
             \subsection{The IPython Notebook}
             The third way to interact with IPython, in addition to the terminal and
             graphical Qt console, is a powerful web interface called the ``IPython
             Notebook''. If you run at the system console (you can omit the
             \texttt{pylab} flags if you don't need plotting support):
             \begin{verbatim}
             $ ipython notebook --pylab inline
             \end{verbatim}
             IPython will start a process that runs a web server in your local
             machine and to which a web browser can connect. The Notebook is a
             workspace that lets you execute code in blocks called `cells' and
             displays any results and figures, but which can also contain arbitrary
             text (including LaTeX-formatted mathematical expressions) and any rich
             media that a modern web browser is capable of displaying.
             % This cell is for the pdflatex output only
             \begin{figure}[htbp]
             \centering
             \includegraphics[width=3in]{ipython-notebook-specgram-2.png}
             \caption{The IPython Notebook: text, equations, code, results, graphics and other multimedia in an open format for scientific exploration and collaboration}
             \end{figure}
             In fact, this document was written as a Notebook, and only exported to
             LaTeX for printing. Inside of each cell, all the features of IPython
             that we have discussed before remain functional, since ultimately this
             web client is communicating with the same IPython code that runs in the
             terminal. But this interface is a much more rich and powerful
             environment for maintaining long-term ``live and executable'' scientific
             documents.
             Notebook environments have existed in commercial systems like
             Mathematica(TM) and Maple(TM) for a long time; in the open source world
             the \href{http://sagemath.org}{Sage} project blazed this particular
             trail starting in 2006, and now we bring all the features that have made
             IPython such a widely used tool to a Notebook model.
             Since the Notebook runs as a web application, it is possible to
             configure it for remote access, letting you run your computations on a
             persistent server close to your data, which you can then access remotely
             from any browser-equipped computer. We encourage you to read the
             extensive documentation provided by the IPython project for details on
             how to do this and many more features of the notebook.
             Finally, as we said earlier, IPython also has a high-level and easy to
             use set of libraries for parallel computing, that let you control
             (interactively if desired) not just one IPython but an entire cluster of
             `IPython engines'. Unfortunately a detailed discussion of these tools is
             beyond the scope of this text, but should you need to parallelize your
             analysis codes, a quick read of the tutorials and examples provided at
             the IPython site may prove fruitful.
             \end{document}

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages