adding introduction

pascalwhoop · pascalwhoop · commit 0293bd1c4f4d · 2018-05-29T17:00:11.000+02:00
diff --git a/src/bibliography.bib b/src/bibliography.bib
@@ -1,7 +1,111 @@
+@misc{roberts_2016,
+    title     = {Why the "duck curve" created by solar power is a problem for utilities},
+    url       = {https://www.vox.com/2016/2/10/10960848/solar-energy-duck-curve},
+    journal   = {Vox},
+    publisher = {Vox},
+    author    = {Roberts,
+                 David},
+    year      = {2016},
+    month     = {Feb}
+}
+
+@misc{crawford_2015,
+    title     = {The California `Duck Curve' That Will Jolt Its Power Grid},
+    url       = {https://www.bloomberg.com/news/articles/2015-10-21/california-s-duck-curve-is-about-to-jolt-the-electricity-grid},
+    journal   = {Bloomberg.com},
+    publisher = {Bloomberg},
+    author    = {Crawford, Jonathan},
+    year      = {2015},
+    month     = {Oct}}
+
+@inproceedings{Molderink:2009:SEE:1995456.1995665,
+
+    author    = {Molderink, Albert and Bosman, Maurice G. C. and Bakker, Vincent and Hurink, Johann L. and Smit, Gerard J.
+                 M.},
+    title     = {Simulating the Effect on the Energy Efficiency of Smart Grid Technologies},
+    booktitle = {Winter Simulation Conference},
+    series    = {WSC '09},
+    year      = {2009},
+    isbn      = {978-1-4244-5771-7},
+    location  = {Austin, Texas},
+    pages     = {1530--1541},
+    numpages  = {12},
+    url       = {http://dl.acm.org/citation.cfm?id=1995456.1995665},
+    acmid     = {1995665},
+    publisher = {Winter Simulation Conference},
+}
+
+@article{Orgerie:2014:STI:2597757.2532637,
+    author     = {Orgerie, Anne-Cecile and Assuncao, Marcos Dias de and Lefevre, Laurent},
+    title      = {A Survey on Techniques for Improving the Energy Efficiency of Large-scale Distributed Systems},
+    journal    = {ACM Comput. Surv.},
+    issue_date = {April 2014},
+    volume     = {46},
+    number     = {4},
+    month      = mar,
+    year       = {2014},
+    issn       = {0360-0300},
+    pages      = {47:1--47:31},
+    articleno  = {47},
+    numpages   = {31},
+    url        = {http://doi.acm.org/10.1145/2532637},
+    doi        = {10.1145/2532637},
+    acmid      = {2532637},
+    publisher  = {ACM},
+    address    = {New York, NY, USA},
+    keywords   = {Energy efficiency, computing, distributed systems, networking},
+}
+
+@article{DePaola:2014:IMS:2620784.2611779,
+    author     = {De Paola, Alessandra and Ortolani, Marco and Lo Re, Giuseppe and Anastasi, Giuseppe and Das, Sajal K.},
+    title      = {Intelligent Management Systems for Energy Efficiency in Buildings: A Survey},
+    journal    = {ACM Comput. Surv.},
+    issue_date = {July 2014},
+    volume     = {47},
+    number     = {1},
+    month      = jun,
+    year       = {2014},
+    issn       = {0360-0300},
+    pages      = {13:1--13:38},
+    articleno  = {13},
+    numpages   = {38},
+    url        = {http://doi.acm.org/10.1145/2611779},
+    doi        = {10.1145/2611779},
+    acmid      = {2611779},
+    publisher  = {ACM},
+    address    = {New York, NY, USA},
+    keywords   = {Building management systems, ambient intelligence, energy saving},
+}
+
+@article{ketter2015competitive,
+    title      = {Competitive benchmarking: an IS research approach to address wicked problems with big data and analytics},
+    author     = {Ketter, Wolfgang and Peters, Markus and Collins, John and Gupta, Alok},
+    year       = {2015}
+}
+
+@misc{mozur_markoff_2017,
+    title     = {Is China Outsmarting America in A.I.?},
+    url       = {https://www.nytimes.com/2017/05/27/technology/china-us-ai-artificial-intelligence.html},
+    journal   = {The New York Times},
+    publisher = {The New York Times},
+    author    = {Mozur, Paul and Markoff, John},
+    year      = {2017},
+    month     = {May}
+}
+
+@misc{faznetchina_2018,
+    title     = {Merkel in China: Die Kanzlerin kündigt Großes an},
+    url       = {http://www.faz.net/aktuell/wirtschaft/merkel-die-kooperation-mit-china-muss-jetzt-auf-ganz-neue-fuesse-gestellt-werden-15607145.html},
+    journal   = {FAZ.NET},
+    publisher = {Frankfurter Allgemeine Zeitung},
+    year      = {2018},
+    month     = {May}
+}
+
 @article{lillicrap2015continuous,
     title   = {Continuous control with deep reinforcement learning},
     author  = {Lillicrap, Timothy P and Hunt, Jonathan J and Pritzel, Alexander and Heess, Nicolas and Erez, Tom and
-              Tassa, Yuval and Silver, David and Wierstra, Daan},
+               Tassa, Yuval and Silver, David and Wierstra, Daan},
     journal = {arXiv preprint arXiv:1509.02971},
     year    = {2015}
 }
diff --git a/src/body.tex b/src/body.tex
@@ -1,13 +1,85 @@
 \chapter{Introduction}
 
-TODO Intro comes at the end
+Over the last few years, the field of \ac {AI} has seen a massive rise in publications and overall interest in the field
+\cite[]{arulkumaran2017brief, russell2016artificial}.
+It has been discussed as a key future challenge for nation states and companies alike 
+\cite[]{mozur_markoff_2017, faznetchina_2018}. Recent years have produced a large corpus of research focusing on visual data learning such
+as image recognition, audio and text based language recognition and robotics. In the field of \ac {RL}, many recent
+breakthroughs were achieved in robotics as well as common game challenges such as solving Atari games or playing Go
+\cite[]{arulkumaran2017brief}. 
+
+However, there are many other problem fields that can also benefit from such technologies. One such field is that of the
+global energy markets. These are expected to shift radically in the upcoming decades, adapting to new problems related to global warming and alternative
+energy sources. New problem solving techniques are required to solve such \emph{wicked problems}, because they depend on
+numerous impact factors such as economic, social, political and technical factors
+\cite[]{ketter2015competitive}. 
+
+On a local scale, appliances need to improve their efficiency and machines need to deliver their performance with
+minimal energy requirements. Cars, fridges, water heating appliances, dishwashers and entertainment systems alike have
+all shown improvements in their efficiency, which has become a key component of a customer's purchasing choice.
+Similarly, large distributed IT systems as well as building management systems are adapted to more efficiently make use
+of the energy they require
+\cite[]{Orgerie:2014:STI:2597757.2532637, DePaola:2014:IMS:2620784.2611779}.
+
+On a regional and even national and international scale, the problem is equally complex. Energy systems were
+conventionally not built to contain \emph{energy buffers}. Energy always needed to be produced to match the demand. This
+is expected to change over the coming years due to an increasing number of electric vehicles and smart appliances. In
+addition, decentralized solar energy production changes the demand curve of macro-level energy supply. California is
+currently suffering from an oversupply of energy during sunny summer days while lacking energy when wind and solar energy
+output drops due to a lack of wind or sunshine. This puts previously unseen stress on the transport systems which were
+constructed to deliver large amounts of energy from few sources to many consumers instead of having many small producers
+distributed throughout the system
+\cite[]{roberts_2016}.
+
+\ac {PowerTAC}, a competitive simulation of future energy markets, attempts to solve the planning dilemma of such
+complex systems. It allows researchers to experiment with  numerous alternative scenarios, adapt the system dynamics to
+incentivize participants to behave in alignment with the greater interests and observe the interaction of a variety of
+market participants using different technologies to automatically generate profit. Researchers are invited to participate
+in this simulation by supplying usage models for appliances and developing \emph{brokers} that participate in the game.
+Brokers trade energy, offer contracts and coordinate storage capacities within their own customer network as well as
+with the overall market. 
+
+The simulation offers opportunities for several interesting fields of research: Game design, energy demand forecasting,
+intelligent contract design, commodity trading and of course general simulation and software design questions. 
+
+Brokers can be developed by anyone. This means that some broker developers have years of experience while others have
+not participated in a single competition. Each simulation takes approximately two to three hours to complete and each
+time-step takes five seconds. Previous researchers have identified the problem as a \ac {POMDP}, a common model of \ac
+{RL} literature \cite[]{tactexurieli2016mdp}. Deep \ac {NN} architectures have proven to be very successful in solving
+games in a variety of instances. It is therefore intuitive to attempt to apply such architectures to the problems posed
+by the \ac {PowerTAC} simulation. Unfortunately, most such implementations are only available in Python and \ac{PowerTAC}
+is almost exclusively based on Java. An extension of the current communication protocols to other languages may
+therefore benefit the overall reach of the simulation and motivate newcomers to join the competition with their Python
+based \ac {NN} architectures. 
+
+Finally, a subfield of \ac {RL} research has identified a problem in the transfer of knowledge from previously trained
+networks to newly developed iterations. Because \ac {NN} are mostly black boxes to researchers, it is difficult to
+extract knowledge and transfer this to another architecture. Especially when architectures differ in their
+hyperparameters, the learned weights of a \ac {NN} cannot easily be transferred. The field of transfer learning has
+shown many interesting approaches for solving this problem. Agents with access to previously developed models may pass
+their observations to the \emph{teacher agent} and initially attempt to align their decisions to those that their teacher
+would make \cite[]{schmitt2018kickstarting}. More general problem solving agents may be trained by first training several
+small narrow focus agent networks on subproblems and then training the general agent on the actions of the narrow focus
+agents \cite[]{parisotto2015actor}. For problems where a reward function is difficult to construct, \emph{inverse
+reinforcement learning} can be used to train an agent to behave similarly to an observable expert. The policy function of
+the agent shows good performance despite lacking a specific reward function \cite[]{NG2004Apprentice}. 
+
+To allow new brokers in the \ac {PowerTAC} setting to quickly catch up to previously developed competitor brokers,
+porting such learning transfer methods and their underlying deep architectures to the problem scope of \ac {PowerTAC}
+may be beneficial. The stated research question for this work therefore goes as follows:
+
+\emph{Can \ac {RL} agents learn from actions of other agents in the \ac {PowerTAC} environment? If so, how? Can imitation allow for
+boosted performance of reinforcement learning algorithms within a competitive simulation environment?} 
+
+%TODO anything from the proposal that can be stolen?
 
 % intro structuring basing on style from https://explorationsofstyle.com/2013/01/22/introductions/
 %Intro short:
+% - recent developments of A.I. and machine learning
+% - most research problems applied to image recognition, translation and in the RL space to games and robotics. 
 % - global warming, lots of problems
 % - reinvent the energy grid, lots of changes to the structure
 %   - very difficult to construct such a highly complex, globally spanning, must-never-fail system
-% - recent developments of of A.I. and machine learnin
 % - combine the two
 
 %Intro long
@@ -25,30 +97,31 @@ \chapter{Introduction}
 %allow for boosted performance of reinforcement algorithms within a competitive simulation environment?}
 %------------------------------------------------------------------------------- 
 
-Global warming is a key challenge of the near and medium future. Without proper action, entire continents will see
-%TODO END
-
-Global warming, if not combated, will change the face of the planet. Billions will be impacted, entire coastlines will
-be changed and cities all over the global will have to either be retrofitted to handle sub-sea level positioning or
-abandoned and relocated. (global warming report)
-
-
-One key component to avoid such disastrous effects is the reinvention of the energy systems of the world. While
-appliances on an individual level need to become ever more efficient, globally it is necessary to shift the
-transportation sector towards renewable energy sources.
-Solar and wind
-are required. But The future of energy is difficult (--> MISQ paper argumentation line)
-
-Smart grids need decentralized intelligence where appliance level evaluation of the grid status impacts how energy is
-consumed. When such intelligence shifting is happening towards the \emph{edge} of the grid, it can be intelligent to
-introduce intermediate broker entities that mediate between the two extremes, the end-consumers and the wholesale
-market.
-
-At the same time, current developments in AI and machine learning allow for highly sophisticated learning machines that
-can help manage complex tasks and systems. (citing some sexy AI papers)
 
-Bringing these two developments together, it is intuitive to apply some of the recently developed technologies of 
-\ac {AI} research to solve the coordination issues of contemporary, frankly crude energy networks. 
+% Global warming is a key challenge of the near and medium future. Without proper action, entire continents will see
+% %TODO END
+% 
+% Global warming, if not combated, will change the face of the planet. Billions will be impacted, entire coastlines will
+% be changed and cities all over the global will have to either be retrofitted to handle sub-sea level positioning or
+% abandoned and relocated. (global warming report)
+% 
+% 
+% One key component to avoid such disastrous effects is the reinvention of the energy systems of the world. While
+% appliances on an individual level need to become ever more efficient, globally it is necessary to shift the
+% transportation sector towards renewable energy sources.
+% Solar and wind
+% are required. But The future of energy is difficult (--> MISQ paper argumentation line)
+% 
+% Smart grids need decentralized intelligence where appliance level evaluation of the grid status impacts how energy is
+% consumed. When such intelligence shifting is happening towards the \emph{edge} of the grid, it can be intelligent to
+% introduce intermediate broker entities that mediate between the two extremes, the end-consumers and the wholesale
+% market.
+% 
+% At the same time, current developments in AI and machine learning allow for highly sophisticated learning machines that
+% can help manage complex tasks and systems. (citing some sexy AI papers)
+% 
+% Bringing these two developments together, it is intuitive to apply some of the recently developed technologies of 
+% \ac {AI} research to solve the coordination issues of contemporary, frankly crude energy networks. 
 
 
 \section{Methodology}
@@ -641,6 +714,8 @@ \subsection{Deep Learning in Reinforcement Settings}%
 
 \section{PowerTAC: A Competitive Simulation}
 
+%TODO alternative sources / implementations like powertac
+% Simulating the effect on the energy efficiency of smart grid technologies.pdf
 In the following chapter, I will introduce the \acf{PowerTAC}. It's simulating a liberalized retail electrical energy
 market where multiple autonomous agents compete in different markets. Firstly, a retail market where agents, or
 \emph{brokers}, compete for numerous end-users through the offering of tariff contracts. Secondly, a wholesale market in
diff --git a/thesis.vim b/thesis.vim
@@ -1,27 +1,27 @@
 ab ---      %-------------------------------------------------------------------------------
 ab ===      %===============================================================================
-ab RL       \ac {RL}
-ab GRPC     \ac {GRPC}
-ab UL       \ac {UL}
-ab kWh      \ac {kWh}
-ab SL       \ac {SL}
-ab RNN      \ac {RNN}
-ab LSTM     \ac {LSTM}
-ab DRL      \ac {Deep RL}
-ab JMS      \ac {JMS}
-ab XML      \ac {XML}
-ab DU       \ac {DU}
-ab CHP      \ac {CHP}
-ab NN       \ac {NN}
-ab SARSA    \ac {SARSA}
-ab MDP      \ac {MDP}
-ab POMDP    \ac {POMDP}
-ab AI       \ac {AI}
-ab PPO      \ac {PPO}
-ab POMDP    \ac {POMDP}
-ab GPU      \ac {GPU}
-ab CPU      \ac {CPU}
-ab TF       \ac {TF}
-ab TPU      \ac {TPU}
-ab SOTA     \ac {SOTA}
-ab PowerTAC \ac {PowerTAC}
+ab RL       \ac{RL}
+ab GRPC     \ac{GRPC}
+ab UL       \ac{UL}
+ab kWh      \ac{kWh}
+ab SL       \ac{SL}
+ab RNN      \ac{RNN}
+ab LSTM     \ac{LSTM}
+ab DRL      \ac{Deep RL}
+ab JMS      \ac{JMS}
+ab XML      \ac{XML}
+ab DU       \ac{DU}
+ab CHP      \ac{CHP}
+ab NN       \ac{NN}
+ab SARSA    \ac{SARSA}
+ab MDP      \ac{MDP}
+ab POMDP    \ac{POMDP}
+ab AI       \ac{AI}
+ab PPO      \ac{PPO}
+ab POMDP    \ac{POMDP}
+ab GPU      \ac{GPU}
+ab CPU      \ac{CPU}
+ab TF       \ac{TF}
+ab TPU      \ac{TPU}
+ab SOTA     \ac{SOTA}
+ab PowerTAC \ac{PowerTAC}