Commit be485c6: Improved speed for loading TRK
1 parent 17bd66c
5 files changed: +206 additions, -39 deletions

Changelog

Lines changed: 6 additions & 3 deletions
@@ -36,6 +36,9 @@ References like "pr/298" refer to github pull request numbers.
   are raising a DataError if the track is truncated when ``strict=True``
   (the default), rather than a TypeError when trying to create the points
   array.
+* New API for managing streamlines and their different file formats. This
+  adds a new module ``nibabel.streamlines`` that will eventually deprecate
+  the current trackvis reader found in ``nibabel.trackvis``.

 * 2.0.2 (Monday 23 November 2015)

@@ -251,7 +254,7 @@ References like "pr/298" refer to github pull request numbers.
   the ability to transform to the image with data closest to the canonical
   image orientation (first axis left-to-right, second back-to-front, third
   down-to-up) (MB, Jonathan Taylor)
-* Gifti format read and write support (preliminary) (Stephen Gerhard)
+* Gifti format read and write support (preliminary) (Stephen Gerhard)
 * Added utilities to use nipy-style data packages, by rip then edit of nipy
   data package code (MB)
 * Some improvements to release support (Jarrod Millman, MB, Fernando Perez)

@@ -469,7 +472,7 @@ visiting the URL::

 * Removed functionality for "NiftiImage.save() raises an IOError
   exception when writing the image file fails." (Yaroslav Halchenko)
-* Added ability to force a filetype when setting the filename or saving
+* Added ability to force a filetype when setting the filename or saving
   a file.
 * Reverse the order of the 'header' and 'load' argument in the NiftiImage
   constructor. 'header' is now first as it seems to be used more often.

@@ -481,7 +484,7 @@ visiting the URL::

 * 0.20070301.2 (Thu, 1 Mar 2007)

-* Fixed wrong link to the source tarball in README.html.
+* Fixed wrong link to the source tarball in README.html.

 * 0.20070301.1 (Thu, 1 Mar 2007)
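
As a quick illustration of the new ``nibabel.streamlines`` API announced in the
entry above, a minimal round-trip looks like the following sketch. It only uses
calls that appear elsewhere in this commit (``Tractogram``, ``TrkFile``,
``nibabel.streamlines.load``); the file name is arbitrary::

    import numpy as np
    import nibabel as nib
    from nibabel.streamlines import Tractogram, TrkFile

    # Two short streamlines; the identity affine maps the points
    # unchanged to RAS+ mm space.
    streamlines = [np.random.rand(10, 3).astype('float32'),
                   np.random.rand(20, 3).astype('float32')]
    tractogram = Tractogram(streamlines, affine_to_rasmm=np.eye(4))

    # Save with the format-specific class, reload with the generic loader.
    TrkFile(tractogram).save('example.trk')
    trk = nib.streamlines.load('example.trk', lazy_load=False)
    print(len(trk.streamlines))  # -> 2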
bench_streamlines.py

Lines changed: 80 additions & 0 deletions (new file)

""" Benchmarks for load and save of streamlines

Run benchmarks with::

    import nibabel as nib
    nib.bench()

If you have doctests enabled by default in nose (with a noserc file or
environment variable), and you have a numpy version <= 1.6.1, this will also
run the doctests; let's hope they pass.

Run this benchmark with::

    nosetests -s --match '(?:^|[\\b_\\.//-])[Bb]ench' /path/to/bench_streamlines.py
"""
from __future__ import division, print_function

import numpy as np

import nibabel as nib
import nibabel.trackvis as tv

from nibabel.externals.six.moves import zip
from nibabel.tmpdirs import InTemporaryDirectory
from nibabel.streamlines import Tractogram
from nibabel.streamlines import TrkFile

from numpy.testing import assert_array_equal, measure


def bench_load_trk():
    rng = np.random.RandomState(42)
    dtype = 'float32'
    NB_STREAMLINES = 5000
    NB_POINTS = 1000
    points = [rng.rand(NB_POINTS, 3).astype(dtype)
              for i in range(NB_STREAMLINES)]
    scalars = [rng.rand(NB_POINTS, 10).astype(dtype)
               for i in range(NB_STREAMLINES)]

    repeat = 10

    # Points only.
    with InTemporaryDirectory():
        trk_file = "tmp.trk"
        tractogram = Tractogram(points, affine_to_rasmm=np.eye(4))
        TrkFile(tractogram).save(trk_file)

        loaded_streamlines_old = [d[0] - 0.5
                                  for d in tv.read(trk_file,
                                                   points_space="rasmm")[0]]
        mtime_old = measure('tv.read(trk_file, points_space="rasmm")', repeat)
        print("Old: Loaded %d streamlines in %6.2f" % (NB_STREAMLINES,
                                                       mtime_old))

        loaded_streamlines_new = nib.streamlines.load(
            trk_file, lazy_load=False).streamlines
        mtime_new = measure('nib.streamlines.load(trk_file, lazy_load=False)',
                            repeat)
        print("\nNew: Loaded %d streamlines in %6.2f" % (NB_STREAMLINES,
                                                         mtime_new))
        print("Speedup of %.2f" % (mtime_old / mtime_new))

        for s1, s2 in zip(loaded_streamlines_new, loaded_streamlines_old):
            assert_array_equal(s1, s2)

    # Points and scalars.
    with InTemporaryDirectory():
        trk_file = "tmp.trk"
        tractogram = Tractogram(points,
                                data_per_point={'scalars': scalars},
                                affine_to_rasmm=np.eye(4))
        TrkFile(tractogram).save(trk_file)

        mtime_old = measure('tv.read(trk_file, points_space="rasmm")', repeat)
        print("Old: Loaded %d streamlines with scalars in %6.2f"
              % (NB_STREAMLINES, mtime_old))

        mtime_new = measure('nib.streamlines.load(trk_file, lazy_load=False)',
                            repeat)
        print("New: Loaded %d streamlines with scalars in %6.2f"
              % (NB_STREAMLINES, mtime_new))
        print("Speedup of %.2f" % (mtime_old / mtime_new))


if __name__ == '__main__':
    bench_load_trk()
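
Both timings above go through ``numpy.testing.measure``, which compiles the
code string and executes it ``times`` times in the caller's frame, returning
the elapsed CPU time in seconds; that is why ``trk_file`` is visible inside
the timed string. A minimal standalone sketch (the timed expression is
arbitrary)::

    from numpy.testing import measure

    n = 100000
    # The string is evaluated with the caller's locals, so `n` is visible.
    elapsed = measure('sum(range(n))', times=10)
    print('10 runs took %.4f s' % elapsed)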

nibabel/streamlines/array_sequence.py

Lines changed: 88 additions & 35 deletions
@@ -60,40 +60,83 @@ def __init__(self, iterable=None, buffer_size=4):
             self._is_view = True
             return

-        # Add elements of the iterable.
+        try:
+            # If possible try pre-allocating memory.
+            if len(iterable) > 0:
+                first_element = np.asarray(iterable[0])
+                n_elements = np.sum([len(iterable[i])
+                                     for i in range(len(iterable))])
+                new_shape = (n_elements,) + first_element.shape[1:]
+                self._data = np.empty(new_shape, dtype=first_element.dtype)
+        except TypeError:
+            pass
+
+        # Initialize the `ArraySequence` object from the iterable's items.
+        coroutine = self._extend_using_coroutine()
+        coroutine.send(None)  # Run until the first yield.
+
+        for e in iterable:
+            coroutine.send(e)
+
+        coroutine.close()  # Terminate coroutine.
+
+    def _extend_using_coroutine(self, buffer_size=4):
+        """ Creates a coroutine allowing to append elements.
+
+        Parameters
+        ----------
+        buffer_size : float, optional
+            Size (in Mb) for memory pre-allocation.
+
+        Returns
+        -------
+        coroutine
+            Coroutine object which expects the values to be appended to this
+            array sequence.
+
+        Notes
+        -----
+        This method is essential for
+        :func:`create_arraysequences_from_generator` as it allows for an
+        efficient way of creating multiple array sequences in an interleaved
+        fashion and still benefit from the memory buffering. Without this
+        method the alternative would be to use :meth:`append`, which does not
+        have such a buffering mechanism and thus is at least one order of
+        magnitude slower.
+        """
         offsets = []
         lengths = []
-        # Initialize the `ArraySequence` object from iterable's item.
-        offset = 0
-        for i, e in enumerate(iterable):
-            e = np.asarray(e)
-            if i == 0:
-                try:
-                    n_elements = np.sum([len(iterable[i])
-                                         for i in range(len(iterable))])
-                    new_shape = (n_elements,) + e.shape[1:]
-                except TypeError:
-                    # Can't get the number of elements in iterable. So,
-                    # we use a memory buffer while building the ArraySequence.
+
+        offset = 0 if len(self) == 0 else self._offsets[-1] + self._lengths[-1]
+        try:
+            first_element = True
+            while True:
+                e = (yield)
+                e = np.asarray(e)
+                if first_element:
+                    first_element = False
                     n_rows_buffer = int(buffer_size * 1024**2 // e.nbytes)
                     new_shape = (n_rows_buffer,) + e.shape[1:]
+                    if len(self) == 0:
+                        self._data = np.empty(new_shape, dtype=e.dtype)

-                self._data = np.empty(new_shape, dtype=e.dtype)
+                end = offset + len(e)
+                if end > len(self._data):
+                    # Resize needed, adding `len(e)` items plus some buffer.
+                    nb_points = len(self._data)
+                    nb_points += len(e) + n_rows_buffer
+                    self._data.resize((nb_points,) + self.common_shape)

-                end = offset + len(e)
-                if end > len(self._data):
-                    # Resize needed, adding `len(e)` items plus some buffer.
-                    nb_points = len(self._data)
-                    nb_points += len(e) + n_rows_buffer
-                    self._data.resize((nb_points,) + self.common_shape)
+                offsets.append(offset)
+                lengths.append(len(e))
+                self._data[offset:offset + len(e)] = e
+                offset += len(e)

-                offsets.append(offset)
-                lengths.append(len(e))
-                self._data[offset:offset + len(e)] = e
-                offset += len(e)
+        except GeneratorExit:
+            pass

-        self._offsets = np.asarray(offsets)
-        self._lengths = np.asarray(lengths)
+        self._offsets = np.concatenate([self._offsets, offsets], axis=0)
+        self._lengths = np.concatenate([self._lengths, lengths], axis=0)

         # Clear unused memory.
         self._data.resize((offset,) + self.common_shape)
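
The buffering idea in ``_extend_using_coroutine`` stands on its own: a plain
generator used as a coroutine keeps its pre-allocated buffer alive between
``send()`` calls, so many short arrays can be packed into one large array with
only occasional resizes. The following stripped-down sketch (hypothetical
``buffered_appender``, simplified growth policy, results returned through a
dict instead of mutating ``self``) shows the pattern::

    import numpy as np

    def buffered_appender(out, buffer_size_mb=4):
        """Pack 2-D arrays received via send() into one growing buffer."""
        data, offset, step = None, 0, 0
        try:
            while True:
                e = np.asarray((yield))
                if data is None:
                    # The first element fixes dtype, row width and the
                    # growth step (roughly buffer_size_mb worth of rows).
                    step = max(1, int(buffer_size_mb * 1024**2 // e.nbytes))
                    data = np.empty((step,) + e.shape[1:], dtype=e.dtype)
                if offset + len(e) > len(data):
                    # Grow by the incoming length plus one buffer's worth.
                    data = np.resize(
                        data, (len(data) + len(e) + step,) + e.shape[1:])
                data[offset:offset + len(e)] = e
                offset += len(e)
        except GeneratorExit:
            pass  # close() lands here; fall through to trim the buffer.
        out['data'] = data[:offset] if data is not None else np.empty(0)

    # Usage: prime with send(None), feed arrays, close() to finalize.
    out = {}
    appender = buffered_appender(out)
    appender.send(None)
    for chunk in (np.ones((5, 3)), np.zeros((2, 3))):
        appender.send(chunk)
    appender.close()
    assert out['data'].shape == (7, 3)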
@@ -266,13 +309,6 @@ def __getitem__(self, idx):
             seq._is_view = True
             return seq

-        # for name, slice_ in data_per_point_slice.items():
-        #     seq = ArraySequence()
-        #     seq._data = scalars._data[:, slice_]
-        #     seq._offsets = scalars._offsets
-        #     seq._lengths = scalars._lengths
-        #     tractogram.data_per_point[name] = seq
-
         raise TypeError("Index must be either an int, a slice, a list of int"
                         " or a ndarray of bool! Not " + str(type(idx)))

@@ -320,10 +356,27 @@ def load(cls, filename):

 def create_arraysequences_from_generator(gen, n):
     """ Creates :class:`ArraySequence` objects from a generator yielding tuples
+
+    Parameters
+    ----------
+    gen : generator
+        Generator yielding a size `n` tuple containing the values to put in
+        the array sequences.
+    n : int
+        Number of :class:`ArraySequence` objects to create.
     """
     seqs = [ArraySequence() for _ in range(n)]
+    coroutines = [seq._extend_using_coroutine() for seq in seqs]
+
+    for coroutine in coroutines:
+        coroutine.send(None)
+
     for data in gen:
-        for i, seq in enumerate(seqs):
-            seq.append(data[i])
+        for i, coroutine in enumerate(coroutines):
+            if data[i].nbytes > 0:
+                coroutine.send(data[i])
+
+    for coroutine in coroutines:
+        coroutine.close()

     return seqs
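
To make the fan-out concrete, here is a hedged usage sketch of
``create_arraysequences_from_generator`` as it exists at this commit: a
generator yields ``(points, scalars)`` tuples and one ``ArraySequence`` is
built per tuple position, each fed through its own buffering coroutine (the
sample data is made up)::

    import numpy as np
    from nibabel.streamlines.array_sequence import (
        create_arraysequences_from_generator)

    rng = np.random.RandomState(0)

    def gen():
        # Each tuple carries one streamline's points and per-point scalars.
        for _ in range(100):
            n = rng.randint(2, 50)
            yield (rng.rand(n, 3).astype('float32'),
                   rng.rand(n, 5).astype('float32'))

    points_seq, scalars_seq = create_arraysequences_from_generator(gen(), n=2)
    print(len(points_seq), points_seq.common_shape)  # 100 (3,)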

nibabel/streamlines/tests/test_array_sequence.py

Lines changed: 31 additions & 0 deletions
@@ -200,6 +200,37 @@ def test_arraysequence_extend(self):
         seq = SEQ_DATA['seq'].copy()  # Copy because of in-place modification.
         assert_raises(ValueError, seq.extend, data)

+    def test_arraysequence_extend_using_coroutine(self):
+        new_data = generate_data(nb_arrays=10,
+                                 common_shape=SEQ_DATA['seq'].common_shape,
+                                 rng=SEQ_DATA['rng'])
+
+        # Extend with an empty list.
+        seq = SEQ_DATA['seq'].copy()  # Copy because of in-place modification.
+        coroutine = seq._extend_using_coroutine()
+        coroutine.send(None)
+        coroutine.close()
+        check_arr_seq(seq, SEQ_DATA['data'])
+
+        # Extend with a list of ndarrays.
+        seq = SEQ_DATA['seq'].copy()  # Copy because of in-place modification.
+        coroutine = seq._extend_using_coroutine()
+        coroutine.send(None)
+        for e in new_data:
+            coroutine.send(e)
+        coroutine.close()
+        check_arr_seq(seq, SEQ_DATA['data'] + new_data)
+
+        # Extend with elements of a different shape.
+        data = generate_data(nb_arrays=10,
+                             common_shape=SEQ_DATA['seq'].common_shape * 2,
+                             rng=SEQ_DATA['rng'])
+        seq = SEQ_DATA['seq'].copy()  # Copy because of in-place modification.
+        coroutine = seq._extend_using_coroutine()
+        coroutine.send(None)
+        assert_raises(ValueError, coroutine.send, data[0])
+
     def test_arraysequence_getitem(self):
         # Get one item
         for i, e in enumerate(SEQ_DATA['seq']):

nibabel/streamlines/trk.py

Lines changed: 1 addition & 1 deletion
@@ -425,7 +425,7 @@ def save(self, fileobj):
         property_name = np.zeros(MAX_NB_NAMED_PROPERTIES_PER_STREAMLINE,
                                  dtype='S20')
         for i, name in enumerate(data_for_streamline_keys):
-            # Use the last to bytes of the name to store the number of
+            # Use the last two bytes of the name to store the number of
             # values associated to this data_for_streamline.
            nb_values = data_for_streamline[name].shape[-1]
            property_name[i] = encode_value_in_name(nb_values, name)
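
The comment fixed above refers to how TRK stores the number of values per
named property: the count is smuggled into the fixed 20-byte (``S20``)
property-name field itself. The exact byte layout is defined by nibabel's
``encode_value_in_name``; the following is only an illustrative sketch with
hypothetical helpers, assuming a NUL separator between name and count::

    def pack_name_with_count(name, nb_values, max_len=20):
        # Hypothetical packer: append the count after a NUL byte when there
        # is more than one value, then pad to the fixed field width.
        packed = name if nb_values <= 1 else '%s\x00%d' % (name, nb_values)
        data = packed.encode('latin1')
        if len(data) > max_len:
            raise ValueError("Name too long to also carry the value count.")
        return data.ljust(max_len, b'\x00')

    def unpack_name_with_count(field):
        # Inverse of the sketch above: strip padding, split on the NUL.
        text = field.rstrip(b'\x00').decode('latin1')
        name, _, count = text.partition('\x00')
        return name, int(count) if count else 1

    field = pack_name_with_count('torsion', 3)
    print(unpack_name_with_count(field))  # ('torsion', 3)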
