gjbex
diff --git a/‎source-code/README.md
Lines changed: 1 addition & 0 deletions b/‎source-code/README.md
Lines changed: 1 addition & 0 deletions
diff --git a/‎source-code/iterators/README.md
Lines changed: 44 additions & 0 deletions b/‎source-code/iterators/README.md
Lines changed: 44 additions & 0 deletions
diff --git a/‎source-code/iterators/accumulator.py
Lines changed: 17 additions & 0 deletions b/‎source-code/iterators/accumulator.py
Lines changed: 17 additions & 0 deletions
diff --git a/‎source-code/iterators/count_downs.py
Lines changed: 55 additions & 0 deletions b/‎source-code/iterators/count_downs.py
Lines changed: 55 additions & 0 deletions
diff --git a/‎source-code/iterators/dataset.py
Lines changed: 183 additions & 0 deletions b/‎source-code/iterators/dataset.py
Lines changed: 183 additions & 0 deletions
@@ -16,6 +16,7 @@ was used to develop it.
    programming in Python.
 1. `introspection`: illustration of how to implement introspection in
    Python.
+1. `iterators`: illustrates iterators and functional programming concepts.
 1. `object-orientation`: illustrates some concepts of object-oriented
    programming in Python.
 1. `operators-functools`: illustrates some applications of the `operator`
 
@@ -0,0 +1,44 @@
+# Iterators
+An iterator is a nice concept since it makes it possible to create lazy
+sequences, i.e., sequences whose elements are computed only when they are
+requested by retrieving the next element.
+
+Python allows for two basic ways to implement iterators, either as
+functions that contain `yield` statements, or as classes that implement
+an `__iter__` and a `__next__` method.
+
+However, often it is not necessary to implement iterators from scratch,
+often they can be constructed by using the Python standard library's
+`itertools` functionality.
+
+## What is it?
+1. `accumulator.py`: illustrates the use of `itertools`'s `accumulate`
+    for various types of data and operators.
+1. `count_downs.py`: simple illustration of a class that implements an
+    iterable.
+1. `event_generate.py`: a sequence of `Event` objects is generated by
+    an instance of the `EventIter` class.  Events have a type, a start time,
+    and a duration.  Events of the same type can not overlap.  The
+    `EventIter` constructor takes a list of event types, and a start time.
+    It generates a sequence of events with random type, start time and
+    duration, until an event is generated that lasts beyond the stop time.
+1. `generators.ipynb`: Jupyter notebook illustrating generators.
+1. `people.py`: illustration of `itertools`'s `groupby`, and `operator`'s
+    `attrgetter` functions.  Note that `groupby` does not reorder the
+    original iterator's elements, but only groups consecutive elements that
+    have the same key.
+1. `primes.py`: this script will generate the sequence of prime numbers
+    until it is interrupted.  The iterator is implemented by a function with
+    a `yield` statement.
+1. `primes_multiple_calls.py`: illustrates that a function with `yield`
+    instantiates a generator when called, and hence "starts over" for
+    each `for`-loop.
+1. `primes_itertools.py`: this script also generates a potentially
+    infinite sequence of prime numbers, but it is implemented using
+    the `count` function of the `itertools` module in Python's standard
+    library, as well as the `filter` function.
+1. `dataset.py`: illustrates the `__iter__` and `__next__` methods, as well
+    as utilities of the `operator` module.
+1. `generating_data.py`: a retake of the data generation script in
+    Fundamentals, now using `itertools` and built-in Python functional
+    features.
@@ -0,0 +1,17 @@
+#!/usr/bin/env python
+
+from itertools import accumulate
+from operator import add, mul, concat
+
+if __name__ == '__main__':
+    data = range(10)
+    for x in accumulate(data, add):
+        print(x)
+    for x in accumulate(data[1:], mul):
+        print(x)
+    for x in ([y] for y in data):
+        print(x)
+    for x in accumulate(([y] for y in data), concat):
+        print(x)
+    for fragment in accumulate('hello world!', concat):
+        print(fragment)
@@ -0,0 +1,55 @@
+#!/usr/bin/env python
+
+
+class CountDown(object):
+    '''Class implementign a counter that goes from a start value to 0'''
+
+    def __init__(self, n):
+        '''Constructor setting the value to count down from'''
+        self._n = n
+        self._current = n
+
+    @property
+    def n(self):
+        '''Returns value that this counter will count down frmo'''
+        return self._n
+
+    def __iter__(self):
+        '''Initialize and return the iterator, this method is called
+        each time the object is used as an iterator'''
+        self._current = self.n
+        return self
+
+    def __next__(self):
+        '''Returns the next value, and changes state, called in each
+        iteration'''
+        if self._current >= 0:
+            value = self._current
+            self._current -= 1
+            return value
+        else:
+            raise StopIteration()
+
+    def __str__(self):
+        return 'count down at {c:d} from {n:d}'.format(self._current,
+                                                       self.n)
+
+
+if __name__ == '__main__':
+    count_down = CountDown(5)
+    print('first iteration')
+    for i in count_down:
+        print(i)
+    print('second iteration')
+    for i in count_down:
+        print(i)
+    for i in count_down:
+        print(i)
+    count_down1 = CountDown(10)
+    count_down2 = CountDown(8)
+    print('zip for 10, 8')
+    for i, j in zip(count_down1, count_down2):
+        print(i, j)
+    print('zip for same iterator, will not work')
+    for i, j in zip(count_down, count_down):
+        print(i, j)
@@ -0,0 +1,183 @@
+#!/usr/bin/env python
+'''dataset implements a poor man's version of pandas data frames, it is
+   only intended to illustrate a number of concepts about iterators
+   and can be used when dependencies on third party libraries should
+   be avoided'''
+
+import collections
+import operator
+
+ColumnDef = collections.namedtuple('ColumnSpecs', ['name', 'type'])
+
+
+class DatasetError(Exception):
+    '''Base class for Dataset exceptions'''
+
+    pass
+
+
+class DataLenError(DatasetError):
+    '''Exception indicating that a list of data is being appended with
+       a length different from the number of headers of the data set'''
+
+    pass
+
+
+class ConversionError(DatasetError):
+    '''Exception indicating that a type conversion failed, i.e., a
+       value is appended that can not be converted to its column's
+       type'''
+
+    pass
+
+
+class ColumnOverwriteError(DataLenError):
+    '''Exception indicating that a new column would overwrite an
+       existing one.'''
+
+    pass
+
+
+class UndefinedColumnError(DataLenError):
+    '''Exception indicating that a column does not exist in the dataset'''
+
+    pass
+
+
+class ComputeError(DataLenError):
+    '''Exception indicating that a computation failed'''
+
+    pass
+
+
+class Dataset(object):
+    '''Class representing data sets'''
+
+    def __init__(self, col_defs):
+        '''Constructor that optonally takes the data set headers'''
+        self._headers = [col_def.name for col_def in col_defs]
+        self._type_map = {col_def.name: col_def.type
+                          for col_def in col_defs}
+        self._data = {header: [] for header in self._headers}
+        self._nr_data = 0
+        self._next = 0
+
+    @property
+    def headers(self):
+        '''get the list of headers for the data set'''
+        return list(self._headers)
+
+    @property
+    def nr_columns(self):
+        '''returns number of columns in the dataset'''
+        return len(self._headers)
+
+    @property
+    def column_defs(self):
+        '''retrieve the column definitions of the dataset'''
+        col_defs = []
+        for header in self._headers:
+            col_defs.append(ColumnDef(header, self._type_map[header]))
+        return col_defs
+
+    def __len__(self):
+        '''retrieve the length of the data set'''
+        return self._nr_data
+
+    def _convert(self, header, value):
+        '''convert the value to the appropriate data type'''
+        return self._type_map[header](value)
+
+    def append(self, data):
+        '''append a row of data to the set'''
+        if len(data) != len(self._headers):
+            msg = '{0:d} headers, {1:d} items'.format(len(self._headers),
+                                                      len(data))
+            raise DataLenError(msg)
+        for i, header in enumerate(self._headers):
+            try:
+                value = self._convert(header, data[i])
+            except ValueError as error:
+                msg = 'type conversion failed: {0}'.format(str(error))
+                raise ConversionError(msg)
+            self._data[header].append(value)
+        self._nr_data += 1
+
+    def __iter__(self):
+        '''iterator over the data values in the data set, each returning
+           a list ordered according to the headers of the data set'''
+        self._RowTuple = collections.namedtuple('RowTuple', self._headers)
+        self._next = 0
+        return self
+
+    def __next__(self):
+        '''return next data value when dataset is used as an iterator'''
+        if self._next < self._nr_data:
+            values = self._RowTuple._make((self._data[header][self._next]
+                                           for header in self._headers))
+            self._next += 1
+            return values
+        else:
+            self._next = 0
+            raise StopIteration
+
+    def compute(self, col_defs, args, function):
+        '''perform a computation producing extra columns by applying a
+           function using the specified argument names'''
+        for col_def in col_defs:
+            if col_def.name in self._headers:
+                msg = 'column {0} already exists'.format(col_def.name)
+                raise ColumnOverwriteError(msg)
+            self._data[col_def.name] = []
+        for name in args:
+            if name not in self._headers:
+                msg = 'no column {0} in dataset'.format(name)
+                raise UndefinedColumnError(msg)
+        arg_idx = tuple(self._headers.index(name) for name in args)
+        selector = operator.itemgetter(*arg_idx)
+        names = [col_def.name for col_def in col_defs]
+        for row in self:
+            args = selector(row)
+            try:
+                values = function(*args)
+            except Exception as error:
+                args_str = ', '.join([str(arg) for arg in args])
+                msg = "computation for '{0}' failed: {1}".format(args_str,
+                                                                 str(error))
+                raise ComputeError(msg)
+            for name, value in zip(names, values):
+                self._data[name].append(value)
+        for col_def in col_defs:
+            self._headers.append(col_def.name)
+            self._type_map[col_def.name] = col_def.type
+
+    def __str__(self):
+        '''create string representation of the data set'''
+        str_repr = ', '.join(self._headers)
+        for row in self:
+            str_repr += '\n' + ', '.join([str(x) for x in row])
+        return str_repr
+
+
+if __name__ == '__main__':
+    data = Dataset([
+        ColumnDef('x', int),
+        ColumnDef('y', int),
+        ColumnDef('z', int),
+    ])
+    for x in range(10):
+        data.append((x, x**2, x**3))
+    print(data)
+    data.compute([ColumnDef('sum', int), ColumnDef('prod', int)], ['x', 'y'],
+                 lambda x, y: (x + y, x*y))
+    print(data)
+    for row in data:
+        print('{0:d} + {1:d} = {2:d}'.format(row.x, row.y, row.sum))
+    print('{0:d} data items'.format(len(data)))
+    data.compute([ColumnDef('substr', int)], ['x', 'y'],
+                 lambda x, y: (y - x, ))
+    print(data)
+    try:
+        data.append(['bla'] * data.nr_columns)
+    except Exception as error:
+        print('### error: {0}'.format(error))