AlvarBer
diff --git a/‎docs/Makefile‎
Lines changed: 8 additions & 8 deletions b/‎docs/Makefile‎
Lines changed: 8 additions & 8 deletions
diff --git a/‎docs/graphs/hierarchical.tex‎
Lines changed: 14 additions & 0 deletions b/‎docs/graphs/hierarchical.tex‎
Lines changed: 14 additions & 0 deletions
diff --git a/‎docs/graphs/logical.tex‎
Lines changed: 24 additions & 0 deletions b/‎docs/graphs/logical.tex‎
Lines changed: 24 additions & 0 deletions
diff --git a/‎docs/persimmon.bib‎
Lines changed: 15 additions & 0 deletions b/‎docs/persimmon.bib‎
Lines changed: 15 additions & 0 deletions
diff --git a/‎docs/src/evaluation.md‎
Lines changed: 45 additions & 0 deletions b/‎docs/src/evaluation.md‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎docs/src/implementation.md‎
Lines changed: 120 additions & 6 deletions b/‎docs/src/implementation.md‎
Lines changed: 120 additions & 6 deletions
diff --git a/‎docs/src/interface.md‎
Lines changed: 38 additions & 0 deletions b/‎docs/src/interface.md‎
Lines changed: 38 additions & 0 deletions
@@ -1,9 +1,9 @@
 PDF := persimmon.pdf  # PDF Main Target
-MARKDOWN := introduction.md state_of_the_art.md workflow.md milestones.md \
-	risk_analysis.md interface.md implementation.md type_checking.md \
-	postmortem.md  # Markdown files
-MARKDOWN_COMPLUTENSE := introduction.md focus.md state_of_the_art.md \
-	workflow.md milestones.md risk_analysis.md interface.md implementation.md \
+MARKDOWN := introduction.md literature.md workflow.md milestones.md \
+	risk.md interface.md implementation.md type_checking.md \
+	evaluation.md postmortem.md  # Markdown files
+MARKDOWN_COMPLUTENSE := introduction.md focus.md literature.md \
+	workflow.md milestones.md risk.md interface.md implementation.md \
 	type_checking.md analysis.md postmortem.md
 APPENDICES := package_organization.md how.md  # Appendix after bibliography
 METADATA := metadata.yaml  # Metadata files (Author, Date, Title, etc..)
@@ -30,7 +30,7 @@ $(PDF): $(MARKDOWN) $(APPENDIX) $(TEMPLATE) $(IMAGES) $(BIBLIOGRAPHY) $(CSL) $(M
 	pandoc --smart --standalone --latex-engine xelatex --template $(TEMPLATE) \
 		--bibliography $(BIBLIOGRAPHY) --csl $(CSL) --table-of-contents \
 		--top-level-division chapter --metadata date:"$(shell date +%Y/%m/%d)" \
-		--metadata sansfont:"Helvetica Neue LT Com" \
+		--metadata sansfont:"Helvetica Neue LT Com" --highlight-style breezedark \
 		$(METADATA) $(MARKDOWN) --include-after-body $(APPENDIX) -o $@
 
 complutense: $(MARKDOWN_COMPLUTENSE) $(APPENDIX) $(TEMPLATE) $(IMAGES) $(BIBLIOGRAPHY) $(CSL) $(METADATA)
@@ -54,8 +54,8 @@ twocol: $(MARKDOWN) $(APPENDIX) $(TEMPLATE) $(IMAGES) $(BIBLIOGRAPHY) $(CSL) $(M
 # For standalone images
 images/%.pdf: graphs/%.tex
 	xelatex $< > /dev/null
-	mv $*.pdf images/
-	rm -f $*.log $*.aux
+	@mv $*.pdf images/
+	@rm -f $*.log $*.aux
 
 $(APPENDIX): $(APPENDICES)
 	pandoc --smart --no-tex-ligatures --top-level-division chapter $(APPENDICES) -o $@
 
@@ -0,0 +1,14 @@
+\documentclass{standalone}
+
+\usepackage{tikz}
+
+\begin{document}
+  \begin{tikzpicture}[sibling distance=5em]
+    \node {Blackboard}
+      child { node {Block α} 
+        child { node {OutPin} } }
+      child { node {Connection} }
+      child { node {Block β} 
+        child { node {InPin} } };
+  \end{tikzpicture}
+\end{document}
@@ -0,0 +1,24 @@
+\documentclass{standalone}
+
+\usepackage{tikz}
+\usetikzlibrary{positioning}
+
+\begin{document}
+  \begin{tikzpicture}
+    \node at (0, 0) (c) {Connection};
+    \node [left = 1cm of c] (alpha) {Block α};
+    \node [below = 1cm of alpha] (o) {OutPin};
+    \draw [<->] (alpha) -- (o);
+    \node [below left = 1cm and -1cm of c] (e) {end};
+    \draw [<-] (o) -- (e);
+    \node [right = 1cm of c] (beta) {Block β};
+    \node [below = 1cm of beta] (i) {InPin};
+    \draw [<->] (beta) -- (i);
+    \node [below right = 1cm and -1cm of c] (s) {start};
+    \draw [->] (s) -- (i);
+    \draw [->] (c) -- (e);
+    \draw [->] (c) -- (s);
+    \draw [->] (o) -- (c);
+    \draw [->] (i) -- (c);
+  \end{tikzpicture}
+\end{document}
@@ -41,6 +41,21 @@ @online{sexy
   urldate = {2017-02-25},
 }
 
+@online{hunt,
+  title = {The Hunt For Unicorn Data Scientists Lifts Salaries For All Data Analytics Professionals},
+  author = {Gil Press},
+  url = {https://www.forbes.com/sites/gilpress/2015/10/09/the-hunt-for-unicorn-data-scientists-lifts-salaries-for-all-data-analytics-professionals/#38147ccc5258},
+  year = {2015},
+  urldate = {2017-04-03},
+}
+
+@online{unicorn,
+  title = {Data scientists: 'As rare as unicorns'},
+  author = {Jeanne G. Harris and Ray Eitel-Porter},
+  url = {https://www.theguardian.com/media-network/2015/feb/12/data-scientists-as-rare-as-unicorns},
+  year = {2015},
+  urldate = {2017-04-03},
+}
 
 % Data Visualization
 @online{principles,
 
@@ -0,0 +1,45 @@
+Evaluation
+==========
+
+In this chapter the evaluation process and the design of the survey are
+explained.
+
+Method
+------
+Based on in place recollection, mainly based on a questionnaire, plus some
+additional information that is harvested by the system (mainly timings).
+
+The questionnaire selected is the System Usability Scale.
+
+
+Proposed tasks
+--------------
+The evaluation is composed of three different closed tasks.
+
+* First task is the creation of a simple workflow, the objective of
+    this task being to introduce Persimmon to the participants in the simplest
+    terms.
+    - First the participants have to load the iris file, using the csv input
+        block and navigating the filesystem to get the file `iris.csv`.
+    - Then they have to spawn the SVM block and connect the previous input
+        block to this block, they do not need to change any of the parameters
+        of the block.
+    - After the SVM block has been placed a cross validation block has to be
+        spawned and connected to the result of the SVM block.
+    - Finally the result of the cross validation has to be connected to a
+        print output block.
+* Second task is modifying the previous workflow to create a more complex
+    workflow. It is only slightly more complex than the previous one, but it
+    introduces the concept of re-cabling to the participants.
+    - Add a prediction block.
+    - Save to file.
+* Third and final task. This one involves adding hyper-parameter tuning,
+    which in turn means providing a dictionary with desired parameters.
+<!--
+    - Create an entirely new workflow, either by putting it on the same
+        blackboard or on a new one.
+-->
+    - Use `gridsearch` for hyper-parameter tuning.
+    - Use print output block again to return best hyper-parameters.
+
+<!-- Actual evaluation -->
@@ -1,12 +1,13 @@
 Implementation
 ==============
-<!-- High level overview + low level overview -->
+
+The system is implemented in python, using the `Kivy` framework for the
+frontend and multiple scientific tools such as `Numpy`, `Scipy`, `Pandas` and
+most important `scikit-learn` for the backend.
 
 
 First Iteration
 ---------------
-![Sketch of the first interface](images/sketch_1.png)
-
 For the first iteration the priority was to get a proof of concept in order to
 see where the difficulties can appear, with a few simple classifiers and
 cross-validation techniques. As such a button-based interface with very limited
@@ -20,7 +21,7 @@ Trees, but gives good results in wide variety of problems.
 All these classifiers have few parameters on their respective sklearn
 implementations, and for this prototype the interface did not allow modifying
 any of them, as the it would have cluttered and it was not a necessary feature.
-Also all of them are classifiers, as it simplies the interface, since
+Also all of them are classifiers, as it simplifies the interface, since
 regressors and clustering have some incompatibilities.
 
 Apart from the temporary interface the backend had to be built. Since the
@@ -33,8 +34,6 @@ executed those.
 
 Second Iteration
 ----------------
-![Sketch of the second interface](images/sketch_2.png)
-
 For the second interface the drag and drop feel was the main priority.
 As such after developing the tab panel draggable boxes were developed, these
 boxes needed to be connected through pins.
@@ -100,6 +99,121 @@ receives it).
 
 For more information about internal package distribution check appendix A.
 
+
+Making a Connection
+-------------------
+One of the most complex parts is the connection, reconnection and deletion of
+connections between blocks, it involves several actors, asynchronous callbacks
+and a very strong coupling between all elements.
+
+![Widget Tree](images/hierarchical.pdf)
+
+In order to understand how connections are made it is necessary to understand
+how `Kivy` handles input.
+At surface level `Kivy` follows the traditional event-based input management,
+with the event propagating downwards from the root.
+However while traditionally input events are only passed down to components
+that are on the event position, `Kivy` passes the events to almost all children
+by default, this is done because in phones (one of `Kivy` targets is Android)
+gestures tend to start outside the actual widget they intend to affect.
+
+On `Kivy` there are three main input events, `on_touch_down` that gets called
+when a key is pressed, `on_touch_move` that is notified when the touch is
+moved, i.e. a finger moves across the screen, or in this case when the mouse
+moves, and `on_touch_up` that is fired when the touch is released.
+
+Let's represent the possible actions as use cases, the \* represents
+`on_touch_down`, - represents `on_touch_move`, and the inner \* `on_touch_up`:
+
+* (On pin) Start a connection
+* (On connection) Modify a connection
+    - Follow cursor
+    - (On pin) Typecheck
+        * (On a pin) Establish connection if possible
+        * (Elsewhere) Remove connection
+
+Logic is split in two big cases, creating a connection and modifying an
+existing one.
+Creating a connection involves creating one end of the connection, both
+visually and logically and preparing the line that will follow the cursor.
+On the other hand modifying a connection means removing the end that is being
+touched.
+These two cases can be handled by different classes, pin in the first case and
+connection in the last.
+Moving and finishing the connection are the same.
+
+Without getting too deep into implementation details ends cannot just be
+removed, there are visual binds that have to be unbound, and when a connection
+is destroyed (this only happens inside `on_touch_up`, but it can be either
+the pins or the blackboard `on_touch_up` depending if the connection is
+destroyed because the pin violates type safety or there is no pin under the
+cursor respectively) it has to unbind the logical connections of the pins
+themselves.
+For this reason connection has high-level functions that do the unbind, rebind
+and deletion of ends, as long as the necessary elements are passed (dependency
+injection pattern).
+
+![Connections between elements](images/logical.pdf)
+
+
+Intermediate Representation
+---------------------------
+The visual blocks represent a visual-dataflow language, however the backend
+uses a simpler representation of the relations between the blocks, this in turn
+helps decoupling backend and frontend.
+
+The frontend blocks are translated in the function `to_ir`, which merely performs
+trivial transformations to achieve the desired intermediate representation
+and runs in $\mathcal{O}(n)$ with n being the number of pins.
+
+Let's represent the types on a more strongly typed language than Python.
+
+~~~haskell
+type Id = Int -- The hash is an integer
+data Inputs = Inputs {origin :: Id, block :: Id}
+data Blocks = Blocks {inputs :: [Id], function :: IO a -> IO a,
+                      outputs :: [Id]}
+data Outputs = Outputs {destinations :: [Id], block :: Id}
+data IR = IR {inputs :: Map Id Inputs, blocks :: Map Id Blocks,
+              outputs :: Map Id Outputs}
+~~~
+
+As we can see in the Haskell definition the intermediate representation is
+just three Maps, one for blocks, one for input pins and one for output pins.
+But the maps do not contain pins themselves, merely unique hashes (Int in
+this case).
+This reflects the fact that pins model only relationships, not state.
+The only non-hash value on `IR` are the blocks functions.
+These functions are indeed impure, but earlier in the literature review it was
+established that dataflow programming was mainly side-effect free, so why do
+they involve side effects?
+
+There are actually two reasons. First, in the actual Python programs these
+types do not exist, at least not in an enforceable way, so when translating
+them to Haskell the `function` field represents the "worst case", that is to
+say only a few functions will actually end up producing side-effects.
+The second and more important reason is that blocks actually execute
+themselves, meaning the block function does not have parameters, it relies on
+getting the values from the input pins and sets the values of the output
+pins, leaving us with the work of setting those input pins and retrieving
+results from the output pins.
+
+This goes against the previously stated "pins represent relationships, not
+state", in fact an alternative implementation was created in which the
+function returned a tuple of results, and it was the compiler's job to
+associate the output pins to each of the elements on the tuple. This was done
+using the same current mechanism, saving into a dictionary, the difference
+being that while currently the values appear on the output pins and have to be
+moved into the dictionary (or otherwise a reference to the pin itself must be
+kept on the dictionary) on this case the values were fed directly to the
+algorithm.
+However this proved limiting, as code became more complex since more checks had
+to be done, there was no obvious advantage and side-effects did not disappear
+but merely were harder to do.
+
+<!-- Talk about function composition -->
+
+
 [^blackboard]: Blackboard is how the canvas where the blocks and connections
     are lay down.
 [^MVC]: Model View Controller is a software pattern.
 
@@ -1,11 +1,49 @@
 Interface Design
 ================
 
+The main way users interact with the system is through the visual interface, and
+as such it is very important that all the information and operations available
+are easily accessible in an intuitive manner, removing the need for extensive
+training with the software.
+
 Colour Palette
 --------------
+<!-- Talk about hsv and all that fluff, color brewer 2? -->
 
 Typography
 ----------
+The default font for kivy is Roboto, and for a good reason, as one of Kivy
+targets is Android, which has Roboto as the most commonly used font.
+Roboto is a neo-grotesque sans-serif with a modern robotic feel, it really
+feels at home on mobile screens, and it is also used on other Google's products
+and websites.
+However on the desktop it feels a bit too cold and ubiquitous, as John Gruber
+calls it "Google's Arial".
+The better solution would be platform-dependent, as Mac default choice,
+Helvetica, has trouble rendering in some Windows and Linux desktop environments.
+For this reason Roboto was left as the choice for font rendering.
+
 
 Sketches
 --------
+![Sketch of the first interface](images/sketch_1.png)
+
+On the first interface there was a focus on getting a model done as soon as
+possible. For this reason the interface had to be easy to implement and easy
+to use, with few navigation steps required to perform all possible actions
+as to allow for quick debugging.
+This meant sacrificing flexibility in favour of usability, because the
+algorithms implemented were so few the button-based interface worked as intended
+for this prototype.
+No special considerations were taken for color palettes,
+shapes or any other kind of visual aid.
+
+![Sketch of the second interface](images/sketch_2.png)
+For the second iteration however the extensibility had to be present, meaning
+the old interface was not reusable for the new functionality.
+The block based interface gives a lot more of control to the final user, still
+some underlying mechanisms such as optional parameters or saving into file were
+not present.
+
+<!-- Third interface: drag and drop blocks? Bubble? Code execution
+     visualization? Type safety indicators? -->