robot.bib

@misc{LinMartiusOettel2019:DFTML,
  author = {Shang-Chun Lin and Georg Martius and Martin Oettel},
  title  = {Analytical classical density functionals from an equation learning network},
  note   = {arXiv preprint \url{https://arxiv.org/abs/1910.12752}},
  year   = {2019}
}

@incollection{BlaesVlastelicaZhuMartius2019:CWYC,
  author    = {Sebastian Blaes and Marin Vlastelica and Jia-Jie Zhu and Georg Martius},
  title     = {Control {W}hat {Y}ou {C}an: {I}ntrinsically Motivated Task-Planning Agent},
  booktitle = {Advances in Neural Information Processing Systems 32 (NeurIPS'19)},
  publisher = {Curran Associates, Inc.},
  year      = {2019},
  note      = {in press},
  url2      = {http://papers.nips.cc/paper/}
}

@inproceedings{BaumannZhuMartiusTrimpe2018:DeepRL-ETC,
  author    = {Baumann, Dominik and Zhu, Jia-Jie and Martius, Georg and Trimpe, Sebastian},
  title     = {Deep Reinforcement Learning for Event-Triggered Control},
  booktitle = {2018 IEEE Conference on Decision and Control (CDC)},
  year      = {2018},
  pages     = {943--950},
  keywords  = {control engineering computing;learning (artificial intelligence);multi-agent systems;networked control systems;nonlinear control systems;multiple control tasks;model-based ETC designs;event-triggered control methods;high-performance control;usual time-triggered methods;mathematical model;controller;deep reinforcement learning algorithms;DRL approach;Mathematical model;Reinforcement learning;Heuristic algorithms;Aerospace electronics;Sensors;Task analysis;Numerical models},
  doi       = {10.1109/CDC.2018.8619335},
  url       = {http://al.is.tuebingen.mpg.de/publications/baumann2018deep}
}

@inproceedings{RolinekZietlowMartius2019:VAEPCA,
  author    = {Rol{\'i}nek, Michal and Zietlow, Dominik and Martius, Georg},
  title     = {Variational Autoencoders Pursue {PCA} Directions (by Accident)},
  booktitle = {Conference on Computer Vision and Pattern Recognition (CVPR'19)},
  month     = jun,
  pages     = {12406--12415},
  year      = {2019}
}

@inproceedings{RolinekMartius2018:L4,
  author    = {Rol{\'i}nek, Michal and Martius, Georg},
  title     = {L4: {P}ractical loss-based stepsize adaptation for deep learning},
  booktitle = {Advances in Neural Information Processing Systems 31 (NeurIPS'18)},
  editor    = {S. Bengio and H. Wallach and H. Larochelle and K. Grauman and N. Cesa-Bianchi and R. Garnett},
  pages     = {6434--6444},
  publisher = {Curran Associates, Inc.},
  year      = {2018},
  suppl     = {http://al.is.tuebingen.mpg.de/publications/rolinekmartius2018-l4},
  url       = {http://papers.nips.cc/paper/7879-l4-practical-loss-based-stepsize-adaptation-for-deep-learning.pdf}
}

@inproceedings{bogomolovEtAl2019:falsification_nlopt,
  author    = {Sergiy Bogomolov and Goran Frehse and Amit Gurung and Dongxu Li and Georg Martius and Rajarshi Ray},
  title     = {Falsification of Hybrid Systems using Symbolic Reachability and Trajectory Splicing},
  booktitle = {22nd ACM Intl.~Conf.~on Hybrid Systems: Computation and Control (HSCC 2019)},
  year      = {2019},
  pages     = {1--10}
}

@inproceedings{SunMartius2018:SingleTouchSensation,
  author    = {Sun, Huanbo and Martius, Georg},
  title     = {Robust Affordable {3D} Haptic Sensation via Learning Deformation Patterns},
  booktitle = {Proceedings International Conference on Humanoid Robots (IEEE Humanoids)},
  pages     = {846--853},
  publisher = {IEEE},
  address   = {New York, NY, USA},
  year      = {2018},
  note      = {Oral Presentation},
  url       = {http://al.is.tuebingen.mpg.de/publications/sunmartius2018-singletouchsensation}
}

@article{SunMartius2019:ML4haptics,
  author   = {Sun, Huanbo and Martius, Georg},
  title    = {Machine Learning for Haptics: Inferring Multi-Contact Stimulation From Sparse Sensor Configuration},
  journal  = {Frontiers in Neurorobotics},
  year     = {2019},
  volume   = {13},
  pages    = {51},
  doi      = {10.3389/fnbot.2019.00051},
  issn     = {1662-5218},
  url      = {https://www.frontiersin.org/article/10.3389/fnbot.2019.00051},
  abstract = {Robust haptic sensation systems are essential for obtaining dexterous robots. Currently, we have solutions for small surface areas, such as fingers, but affordable and robust techniques for covering large areas of an arbitrary 3D surface are still missing. Here, we introduce a general machine learning framework to infer multi-contact haptic forces on a 3D robot's limb surface from internal deformation measured by only a few physical sensors. The general idea of this framework is to predict first the whole surface deformation pattern from the sparsely placed sensors and then to infer number, locations, and force magnitudes of unknown contact points. We show how this can be done even if training data can only be obtained for single-contact points using transfer learning at the example of a modified limb of the Poppy robot. With only 10 strain-gauge sensors we obtain a high accuracy also for multiple-contact points. The method can be applied to arbitrarily shaped surfaces and physical sensor types, as long as training data can be obtained.}
}

@inproceedings{PinneriMartius2018:Repeller,
  author    = {Cristina Pinneri and Georg Martius},
  title     = {Systematic self-exploration of behaviors for robots in a dynamical systems framework},
  booktitle = {Proc.\ 2018 Conference on Artificial Life ({ALIFE} 2018)},
  year      = {2018},
  publisher = {MIT Press, Cambridge, MA},
  pages     = {319--326},
  doi       = {10.1162/isal\_a\_00062},
  url       = {https://www.mitpressjournals.org/doi/abs/10.1162/isal_a_00062},
  abstract  = { One of the challenges of this century is to understand the neural mechanisms behind cognitive control and learning. Recent investigations propose biologically plausible synaptic mechanisms for self-organizing controllers, in the spirit of Hebbian learning. In particular, differential extrinsic plasticity (DEP) has proven to enable embodied agents to self-organize their individual sensorimotor development, and generate highly coordinated behaviors during their interaction with the environment. These behaviors are attractors of a dynamical system. In this paper, we use the DEP rule to generate attractors and we combine it with a “repelling potential” which allows the system to actively explore all its attractor behaviors in a systematic way. With a view to a selfdetermined exploration of goal-free behaviors, our framework enables switching between different motion patterns in an autonomous and sequential fashion. Our algorithm is able to recover all the attractor behaviors in a toy system and it is also effective in two simulated environments. A spherical robot discovers all its major rolling modes and a hexapod robot learns to locomote in 50 different ways in 30min. }
}

@inproceedings{SahooLampertMartius2018:EQLDiv,
  author    = {Subham S. Sahoo and Christoph H. Lampert and Georg Martius},
  title     = {Learning equations for extrapolation and control},
  booktitle = {Proc.\ 35th International Conference on Machine Learning, {ICML} 2018, Stockholm, Sweden},
  editor    = {Dy, Jennifer and Krause, Andreas},
  pages     = {4442--4450},
  series    = {Proceedings of Machine Learning Research},
  volume    = {80},
  publisher = {{PMLR}},
  year      = {2018},
  pdf       = {http://proceedings.mlr.press/v80/sahoo18a/sahoo18a.pdf},
  url       = {http://proceedings.mlr.press/v80/sahoo18a.html},
  abstract  = {We present an approach to identify concise equations from data using a shallow neural network approach. In contrast to ordinary black-box regression, this approach allows understanding functional relations and generalizing them from observed data to unseen parts of the parameter space. We show how to extend the class of learnable equations for a recently proposed equation learning network to include divisions, and we improve the learning and model selection strategy to be useful for challenging real-world data. For systems governed by analytical expressions, our method can in many cases identify the true underlying equation and extrapolate to unseen domains. We demonstrate its effectiveness by experiments on a cart-pendulum system, where only 2 random rollouts are required to learn the forward dynamics and successfully achieve the swing-up task.}
}

@article{BotellaSolerEtAl2018:NonlinearRetinaDecoding,
  author    = {Botella-Soler, Vicente and Deny, St{\'e}phane and Martius, Georg and Marre, Olivier and Tka{\v{c}}ik, Ga{\v{s}}per},
  title     = {Nonlinear decoding of a complex movie from the mammalian retina},
  journal   = {PLOS Computational Biology},
  publisher = {Public Library of Science},
  year      = {2018},
  month     = may,
  volume    = {14},
  number    = {5},
  pages     = {1--27},
  doi       = {10.1371/journal.pcbi.1006057},
  url       = {https://doi.org/10.1371/journal.pcbi.1006057},
  abstract  = {Author summary Neurons in the retina transform patterns of incoming light into sequences of neural spikes. We recorded from ∼100 neurons in the rat retina while it was stimulated with a complex movie. Using machine learning regression methods, we fit decoders to reconstruct the movie shown from the retinal output. We demonstrated that retinal code can only be read out with a low error if decoders make use of correlations between successive spikes emitted by individual neurons. These correlations can be used to ignore spontaneous spiking that would, otherwise, cause even the best linear decoders to “hallucinate” nonexistent stimuli. This work represents the first high resolution single-trial full movie reconstruction and suggests a new paradigm for separating spontaneous from stimulus-driven neural activity.}
}

@misc{MartiusLampert2017:EQL,
  author = {Georg Martius and Christoph H. Lampert},
  title  = {Extrapolation and learning equations},
  year   = {2016},
  note   = {arXiv preprint \url{https://arxiv.org/abs/1610.02995}}
}

@inproceedings{MartiusHostettlerKnollDer2016:IROS-MyoArm,
  author    = {Martius, Georg and Hostettler, Rafael and Knoll, Alois and Der, Ralf},
  title     = {Compliant control for soft robots: emergent behavior of a tendon driven anthropomorphic arm},
  booktitle = {2016 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
  year      = {2016},
  pages     = {767--773},
  keywords  = {Control systems;Muscles;Robot kinematics;Robot sensing systems;Springs;Tendons},
  doi       = {10.1109/IROS.2016.7759138},
  pdf       = {http://robot.informatik.uni-leipzig.de/research/publications/2016/MartiusHostettlerKnollDer:IROS_watermark.pdf},
  suppl     = {http://playfulmachines.com/MyoArm-2}
}

@article{Der2016:InSearch,
  author  = {Der, Ralf},
  title   = {In search for the neural mechanisms of individual development: behavior-driven differential Hebbian learning},
  journal = {Frontiers in Robotics and AI},
  volume  = {2},
  pages   = {37},
  year    = {2016},
  url     = {http://www.frontiersin.org/computational_intelligence/10.3389/frobt.2015.00037},
  doi     = {10.3389/frobt.2015.00037},
  issn    = {2296-9144}
}

@inproceedings{DerMartius2016:ICDL-dyn-self-consistency,
  author    = {Ralf Der and Georg Martius},
  title     = {Dynamical self-consistency leads to behavioral development and emergent social interactions in robots},
  booktitle = {2016 Joint IEEE International Conference on Development and Learning and Epigenetic Robotics (ICDL-EpiRob)},
  year      = {2016},
  month     = sep,
  pages     = {49--56},
  publisher = {IEEE},
  doi       = {10.1109/DEVLRN.2016.7846789},
  pdf       = {http://robot.informatik.uni-leipzig.de/research/publications/2016/DerMartius2016:ICDL-dyn-self-consistency.pdf},
  suppl     = {http://playfulmachines.com/ICDL2016},
  comment   = {distinguished oral paper award}
}

@article{DerMartius2017:SOMusculo,
  author  = {Der, Ralf and Martius, Georg},
  title   = {Self-Organized Behavior Generation for Musculoskeletal Robots},
  journal = {Frontiers in Neurorobotics},
  year    = {2017},
  volume  = {11},
  pages   = {8},
  doi     = {10.3389/fnbot.2017.00008},
  issn    = {1662-5218},
  url     = {http://journal.frontiersin.org/article/10.3389/fnbot.2017.00008},
  note    = {arXiv preprint \url{http://arxiv.org/abs/1602.02990}},
  suppl   = {http://playfulmachines.com/MyoArm-1}
}

@article{DerMartius2015:DEP,
  author   = {Der, Ralf and Martius, Georg},
  title    = {Novel plasticity rule can explain the development of sensorimotor intelligence},
  journal  = {Proceedings of the National Academy of Sciences},
  volume   = {112},
  number   = {45},
  pages    = {E6224--E6232},
  year     = {2015},
  doi      = {10.1073/pnas.1508400112},
  abstract = {Grounding autonomous behavior in the nervous system is a fundamental challenge for neuroscience. In particular, self-organized behavioral development provides more questions than answers. Are there special functional units for curiosity, motivation, and creativity? This paper argues that these features can be grounded in synaptic plasticity itself, without requiring any higher-level constructs. We propose differential extrinsic plasticity (DEP) as a new synaptic rule for self-learning systems and apply it to a number of complex robotic systems as a test case. Without specifying any purpose or goal, seemingly purposeful and adaptive rhythmic behavior is developed, displaying a certain level of sensorimotor intelligence. These surprising results require no system-specific modifications of the DEP rule. They rather arise from the underlying mechanism of spontaneous symmetry breaking, which is due to the tight brain body environment coupling. The new synaptic rule is biologically plausible and would be an interesting target for neurobiological investigation. We also argue that this neuronal mechanism may have been a catalyst in natural evolution.},
  url      = {http://www.pnas.org/content/112/45/E6224.abstract},
  eprint   = {http://www.pnas.org/content/112/45/E6224.full.pdf},
  suppl    = {http://playfulmachines.com/DEP}
}

@article{MartiusOlbrich2015:QuantBehavior,
  author  = {Martius, Georg and Olbrich, Eckehard},
  title   = {Quantifying Emergent Behavior of Autonomous Robots},
  journal = {Entropy},
  year    = {2015},
  volume  = {17},
  number  = {10},
  pages   = {7266},
  doi     = {10.3390/e17107266},
  issn    = {1099-4300},
  url     = {http://www.mdpi.com/1099-4300/17/10/7266},
  suppl   = {http://playfulmachines.com/QuantBeh2015}
}

@article{ay2012information,
  author    = {Ay, Nihat and Bernigau, Holger and Der, Ralf and Prokopenko, Mikhail},
  title     = {Information-driven self-organization: the dynamical system approach to autonomous robot behavior},
  journal   = {Theory in Biosciences},
  publisher = {Springer},
  year      = {2012},
  volume    = {131},
  number    = {3},
  pages     = {161--179}
}

@article{ay08:predinf_explore_behavior,
  author  = {N. Ay and N. Bertschinger and R. Der and F. G{\"u}ttler and E. Olbrich},
  title   = {Predictive information and explorative behavior of autonomous robots},
  journal = {The European Physical Journal B},
  volume  = {63},
  number  = {3},
  pages   = {329--339},
  year    = {2008},
  doi     = {10.1140/epjb/e2008-00175-0},
  url     = {http://www.springerlink.com/content/d410227j49136551},
  pdf     = {http://www.informatik.uni-leipzig.de/~der/Veroeff/journphysics.pdf}
}

@incollection{DerGSO2012,
  author      = {Der, Ralf},
  title       = {On the role of embodiment for self-organizing robots: behavior as broken symmetry},
  booktitle   = {Guided Self-Organization: Inception},
  editor      = {Prokopenko, Mikhail},
  publisher   = {Springer},
  year        = {2014},
  volume      = {9},
  pages       = {193--221},
  series      = {Emergence, Complexity and Computation},
  affiliation = {Max Planck Institute for Mathematics in the Sciences},
  file        = {GSO2012.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2013/GSO2012.pdf:PDF},
  pdf         = {http://robot.informatik.uni-leipzig.de/research/publications/2013/GSO2012.pdf},
  suppl       = {http://robot.informatik.uni-leipzig.de/research/supplementary/GSO2012}
}

@article{ZahediAyDer2010:HigherCoordination,
  author    = {Zahedi, Keyan and Ay, Nihat and Der, Ralf},
  title     = {Higher Coordination With Less Control -- {A} Result of Information Maximization in the Sensorimotor Loop},
  journal   = {Adaptive Behavior},
  volume    = {18},
  number    = {3--4},
  pages     = {338--355},
  year      = {2010},
  doi       = {10.1177/1059712310375314},
  abstract  = {This work presents a novel learning method in the context of embodied artificial intelligence and self-organization, which has as few assumptions and restrictions as possible about the world and the underlying model. The learning rule is derived from the principle of maximizing the predictive information in the sensorimotor loop. It is evaluated on robot chains of varying length with individually controlled, noncommunicating segments. The comparison of the results shows that maximizing the predictive information per wheel leads to a higher coordinated behavior of the physically connected robots compared with a maximization per robot. Another focus of this article is the analysis of the effect of the robot chain length on the overall behavior of the robots. It will be shown that longer chains with less capable controllers outperform those of shorter length and more complex controllers. The reason is found and discussed in the information-geometric interpretation of the learning process.},
  hyperlink = {http://adb.sagepub.com/content/18/3-4/338.abstract},
  eprint    = {http://adb.sagepub.com/content/18/3-4/338.full.pdf+html},
  pdf       = {http://arxiv.org/abs/0910.2039}
}

@article{der01,
  author  = {Ralf Der},
  title   = {Self-Organized Acquisition of Situated Behaviors},
  journal = {Theory in Biosciences},
  year    = {2001},
  volume  = {120},
  pages   = {179--187}
}

@misc{der98hk_nocite,
  author = {Ralf Der},
  title  = {Self-Organized Robot Behavior from the Principle of Homeokinesis},
  year   = {1999},
  file   = {derpantz1.ps:http\://www.informatik.uni-leipzig.de/~der/Veroeff/derpantz1.ps:PostScript}
}

@inproceedings{DerGuettlerAy08:predinf,
  author               = {Der, R. and G{\"u}ttler, F. and Ay, N.},
  title                = {Predictive information and emergent cooperativity in a chain of mobile robots},
  booktitle            = {Proc.\ Artificial Life XI},
  editor               = {Bullock, S. and Noble, J. and Watson, R. and Bedau, M. A.},
  publisher            = {MIT Press, Cambridge, MA},
  year                 = {2008},
  pages                = {166--172},
  url                  = {http://www.alifexi.org/papers/ALIFExi_pp166-172.pdf},
  pdf                  = {http://www.informatik.uni-leipzig.de/%7Eder/Veroeff/AlifeXI.pdf},
  citeulike-article-id = {3365910},
  citeulike-linkout-0  = {http://www.alifexi.org/papers/ALIFExi_pp166-172.pdf}
}

@inproceedings{DerGuettAy08,
  author    = {Ralf Der and Frank G{\"u}ttler and Nihat Ay},
  title     = {Predictive Information and Emergent Cooperativity in a Chain of Mobile Robots},
  booktitle = {Proc.\ Artificial Life XI},
  year      = {2008},
  pages     = {166--172},
  publisher = {MIT Press},
  file      = {AlifeXI.pdf:http\://www.informatik.uni-leipzig.de/%7Eder/Veroeff/AlifeXI.pdf:PDF}
}

@inproceedings{derherrmann96rl,
  author    = {Ralf Der and Michael Herrmann},
  title     = {Self-adjusting reinforcement learning},
  booktitle = {{N}onlinear {T}heory and {A}pplications - {NOLTA} 96},
  year      = {1996},
  pages     = {441--444},
  file      = {nolta96.ps.gz:http\://www.informatik.uni-leipzig.de/~der/Veroeff/nolta96.ps.gz:PostScript}
}

@inproceedings{derherr95rl,
  author    = {Ralf Der and Michael Herrmann},
  title     = {Efficient {Q}-Learning by division of labour},
  booktitle = {Proc.\ Intl.\ Conf.\ on Artificial Neural Networks - ICANN95},
  year      = {1995},
  pages     = {129--134},
  file      = {div.labour.ps.gz:http\://www.informatik.uni-leipzig.de/~der/Veroeff/div.labour.ps.gz:PostScript}
}

@article{derherrhol02,
  author  = {Ralf Der and Michael Herrmann and M. Holicki},
  title   = {Self-organization in sensor-motor loops by the homeokinetic principle},
  journal = {Verhandlungen der Deutschen Physikalischen Gesellschaft},
  pages   = {510},
  month   = jan,
  year    = {2002}
}

@techreport{derself-referential05,
  author      = {Der, Ralf and Hesse, Frank and Liebscher, Ren{\'e}},
  title       = {Contingent Robot Behavior Generated by Self-Referential Dynamical Systems},
  institution = {University of Leipzig},
  year        = {2005},
  file        = {autorob.pdf:http\://www.informatik.uni-leipzig.de/~der/Veroeff/autorob.pdf:PDF}
}

@inproceedings{derfeeling05,
  author    = {Ralf Der and Frank Hesse and Georg Martius},
  title     = {Learning to Feel the Physics of a Body},
  booktitle = {Computational Intelligence for Modelling, Control and Automation, CIMCA 2005},
  year      = {2005},
  address   = {Washington, DC, USA},
  pages     = {252--257},
  volume    = {2},
  abstract  = {Despite the tremendous progress in robotic hardware and in both sensorial and computing efficiencies the performance of contemporary autonomous robots is still far below that of simple animals. This has triggered an intensive search for alternative approaches to the control of robots. The present paper exemplifies a general approach to the self-organization of behavior which has been developed and tested in various examples in recent years. We apply this approach to an underactuated snake like artifact with a complex physical behavior which is not known to the controller. Due to the weak forces available, the controller so to say has to develop a kind of feeling for the body which is seen to emerge from our approach in a natural way with meandering and rotational collective modes being observed in computer simulation experiments.},
  file      = {feelphysics.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2005/feelphysics.pdf:PDF},
  isbn      = {0-7695-2504-0}
}

@inproceedings{derlieb02,
  author    = {Ralf Der and Ren{\'e} Liebscher},
  title     = {True autonomy from self-organized adaptivity},
  booktitle = {Proc.\ Workshop Biologically Inspired Robotics},
  year      = {2002},
  address   = {Bristol},
  file      = {bristol.pdf:http\://www.informatik.uni-leipzig.de/~der/Veroeff/bristol.pdf:PDF}
}

@inproceedings{dermartius:babble06,
  author    = {Ralf Der and Georg Martius},
  title     = {From Motor Babbling to Purposive Actions: Emerging Self-exploration in a Dynamical Systems Approach to Early Robot Development},
  booktitle = {Proc.\ From Animals to Animats 9, SAB 2006},
  year      = {2006},
  editor    = {Stefano Nolfi and Gianluca Baldassarre and Raffaele Calabretta and John C. T. Hallam and Davide Marocco and Jean-Arcady Meyer and Orazio Miglino and Domenico Parisi},
  pages     = {406--421},
  publisher = {Springer},
  series    = {LNCS},
  volume    = {4095},
  abstract  = {Self-organization and the phenomenon of emergence play an essential role in living systems and form a challenge to artificial life systems. This is not only because systems become more lifelike, but also since self-organization may help in reducing the design efforts in creating complex behavior systems. The present paper studies self-exploration based on a general approach to the self-organization of behavior, which has been developed and tested in various examples in recent years. This is a step towards autonomous early robot development. We consider agents under the close sensorimotor coupling paradigm with a certain cognitive ability realized by an internal forward model. Starting from tabula rasa initial conditions we overcome the bootstrapping problem and show emerging self-exploration. Apart from that, we analyze the effect of limited actions, which lead to deprivation of the world model. We show that our paradigm explicitly avoids this by producing purposive actions in a natural way. Examples are given using a simulated simple wheeled robot and a spherical robot driven by shifting internal masses.},
  file      = {babble2purpos06.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2006/babble2purpos06.pdf:PDF},
  isbn      = {3-540-38608-4}
}

@incollection{DerMartius13,
  author      = {Ralf Der and Georg Martius},
  title       = {Behavior as broken symmetry in embodied self-organizing robots},
  booktitle   = {Advances in Artificial Life, ECAL 2013},
  publisher   = {MIT Press},
  year        = {2013},
  pages       = {601--608},
  affiliation = {Max Planck Institute for Mathematics in the Sciences},
  pdf         = {http://robot.informatik.uni-leipzig.de/research/publications/2013/ECAL2013.pdf},
  suppl       = {http://robot.informatik.uni-leipzig.de/research/supplementary/ECAL2013}
}

@book{DerMartius11,
  author    = {Der, Ralf and Martius, Georg},
  title     = {{T}he {P}layful {M}achine - {T}heoretical Foundation and Practical Realization of Self-Organizing Robots},
  publisher = {Springer},
  address   = {Berlin Heidelberg},
  year      = {2012},
  isbn      = {978-3-642-20252-0},
  url       = {http://playfulmachines.com},
  pdf       = {http://robot.informatik.uni-leipzig.de/research/publications/2012/the-playful-machine.pdf},
  abstract  = {Autonomous robots may become our closest companions in the near future. While the technology for physically building such machines is already available today, a problem lies in the generation of the behavior for such complex machines. Nature proposes a solution: young children and higher animals learn to master their complex brain-body systems by playing. Can this be an option for robots? How can a machine be playful? The book provides answers by developing a general principle---homeokinesis, the dynamical symbiosis between brain, body, and environment---that is shown to drive robots to self-determined, individual development in a playful and obviously embodiment-related way: a dog-like robot starts playing with a barrier, eventually jumping or climbing over it; a snakebot develops coiling and jumping modes; humanoids develop climbing behaviors when fallen into a pit, or engage in wrestling-like scenarios when encountering an opponent. The book also develops guided self-organization, a new method that helps to make the playful machines fit for fulfilling tasks in the real world.}
}

@misc{TutorialPlayfulmachines,
  author       = {Der, Ralf and Martius, Georg },
  title        = {Playful {M}achines: {T}utorial},
  year         = {2010},
  howpublished = {\url{http://robot.informatik.uni-leipzig.de/tutorial?lang=en}}
}

@inproceedings{derspherical06,
  author    = {Ralf Der and Georg Martius and Frank Hesse},
  title     = {Let It Roll -- Emerging Sensorimotor Coordination in a Spherical Robot},
  booktitle = {Proc.\ Artificial Life X},
  year      = {2006},
  editor    = {L. M. Rocha and L. S. Yaeger and M. A. Bedau and D. Floreano and R. L. Goldstone and A. Vespignani},
  month     = aug,
  pages     = {192--198},
  publisher = {Intl.~Society for Artificial Life, MIT Press},
  abstract  = {Self-organization and the phenomenen of emergence play an essential role in living systems and form a challenge to artificial life systems. This is not only because systems become more life like but also since self-organization may help in reducing the design efforts in creating complex behavior systems. The present paper exemplifies a general approach to the self-organization of behavior which has been developed and tested in various examples in recent years. We apply this approach to a spherical robot driven by shifting internal masses. The complex physics of this robotic object is completely unknown to the controller. Nevertheless after a short time the robot develops systematic rolling movements covering large distances with high velocity. In a hilly landscape it is capable of manoeuvering out of the basins and in landscapes with a fixed rotational geometry the robot more or less adatps its movements to this geometry -- the controller so to say develops a kind of feeling for its environment although there are no sensors for measuring the positions or the velocity of the robot. We argue that this behavior is a result of the spontaneous symmetry breaking effects which are responsible for the emergence of behavior in our approach.},
  file      = {letitroll_alifex06.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2006/letitroll_alifex06.pdf:PDF}
}

@inproceedings{dersteinpas99,
  author    = {Ralf Der and U. Steinmetz and Frank Pasemann},
  title     = {Homeokinesis - {A} new principle to back up evolution with learning},
  booktitle = {Proc.\ Intl.\ Conf.\ on Computational Intelligence for Modelling, Control and Automation (CIMCA 99)},
  year      = {1999},
  address   = {Amsterdam},
  pages     = {43--47},
  publisher = {IOS Press},
  series    = {Concurrent Systems Engineering Series},
  volume    = {55},
  file      = {wienfin3.ps:http\://www.informatik.uni-leipzig.de/~der/Veroeff/wienfin3.ps:PostScript},
  url       = {http://citeseer.ist.psu.edu/der99homeokinesis.html}
}

@mastersthesis{guettler:07:diplom,
  author = {Frank G{\"u}ttler},
  title  = {Realit{\"a}tsnahe {Simulationsumgebung} einer selbstorganisierenden {Roboterwelt}},
  school = {University of Leipzig},
  year   = {2007},
  url    = {http://lips.informatik.uni-leipzig.de/pub/2007-8}
}

@phdthesis{hamed06,
  author = {Naglaa Hamed},
  title  = {Self-Referential Dynamical Systems and Developmental Robotics},
  school = {University of Leipzig},
  year   = {2007},
  file   = {ThesisHamed.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2007/ThesisHamed.pdf:PDF}
}

@article{Herrmann01,
  author  = {J. M. Herrmann},
  title   = {Dynamical Systems for Predictive Control of Autonomous Robots},
  journal = {Theory in Biosciences},
  year    = {2001},
  volume  = {120},
  pages   = {241--252}
}

@inproceedings{herrholickider04,
  author    = {Michael Herrmann and Michael Holicki and Ralf Der},
  title     = {On {Ashby's} Homeostat: A Formal Model of Adaptive Regulation},
  booktitle = {Proc.\ From Animals to Animats 8 (SAB 2004)},
  year      = {2004},
  editor    = {S. Schaal},
  pages     = {324--333},
  publisher = {MIT Press},
  file      = {homeostat_final.pdf:http\://www.informatik.uni-leipzig.de/~der/Veroeff/homeostat_final.pdf:PDF}
}

@phdthesis{hesse09:diss,
  author = {Frank Hesse},
  title  = {Self-Organizing Control for Autonomous Robots},
  school = {University of G{\"o}ttingen, Institute for Nonlinear Dynamics},
  year   = {2009}
}

@inproceedings{hesse:reflexfromselforg07,
  author    = {Frank Hesse and Ralf Der and J. Michael Herrmann},
  title     = {Reflexes from Self-Organizing Control in Autonomous Robots},
  booktitle = {Proc.\ 7th Intl.\ Conf.\ on Epigenetic Robotics},
  year      = {2007},
  editor    = {Luc Berthouze and Christopher G. Prince and Michael Littman and Hideki Kozima and Christian Balkenius},
  pages     = {37--44},
  publisher = {Lund University},
  series    = {Cognitive Studies},
  volume    = {134},
  abstract  = {Homeokinetic learning provides a route to the self-organization of elementary behaviors in autonomous robots by establishing low-level sensomotoric loops. Strength and duration of the internal parameter changes which are caused by the homeokinetic adaptation provide a natural evaluation of external states, which can be used to incorporate information from additional sensory inputs and to extend the function of the low-level behavior to more general situations. We illustrate the approach by two examples, a mobile robot and a human-like hand which are driven by the same low-level scheme, but use the second-order information in different ways to achieve either risk avoidance and unconstrained movement or constrained movement. While the low-level adaptation follows a set of rigid learning rules, the second-order learning exerts a modulatory effect to the elementary behaviors and to the distribution of their inputs.},
  file      = {reflexfromselforg.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2007/reflexfromselforg.pdf:PDF},
  isbn      = {91-974741-8-5}
}

@article{HesseDerHerrmann2009,
  author   = {Hesse, Frank and Der, Ralf and Herrmann, J. Michael},
  title    = {Modulated Exploratory Dynamics Can Shape Self-Organized Behavior},
  journal  = {Advances in Complex Systems},
  year     = {2009},
  volume   = {12},
  number   = {03},
  pages    = {273},
  abstract = {We study an adaptive controller that adjusts its internal parameters by self-organization of its interaction with the environment. We show that the parameter changes that occur in this low-level learning process can themselves provide a source of information to a higher-level context-sensitive learning mechanism. In this way the context is interpreted in terms of the concurrent low-level learning mechanism. The dual learning architecture is studied in realistic simulations of a foraging robot and of a humanoid hand that manipulated an object. Both systems are driven by the same low-level scheme, but use the second-order information in different ways. While the low-level adaptation continues to follow a set of rigid learning rules, the second-order learning modulates the elementary behaviors and affects the distribution of the sensory inputs via the environment.},
  doi      = {10.1142/S0219525909002258},
  file     = {HesseDerHerrmann2009.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2009/HesseDerHerrmann2009.pdf:PDF},
  issn     = {0219-5259},
  pdf      = {http://robot.informatik.uni-leipzig.de/research/publications/2009/HesseDerHerrmann2009.pdf},
  url      = {http://www.worldscinet.com/acs/12/1203/S0219525909002258.html}
}

@article{hesse:sensorbased09,
  title = {A Sensor-Based Learning Algorithm for the Self-Organization of Robot Behavior},
  author = {Frank Hesse and Georg Martius and Ralf Der and J. Michael Herrmann},
  journal = {Algorithms},
  year = {2009},
  number = {1},
  pages = {398--409},
  volume = {2},
  abstract = {Ideally, sensory information forms the only source of information to a robot. We consider an algorithm for the self-organization of a controller. At short timescales the controller is merely reactive but the parameter dynamics and the acquisition of knowledge by an internal model lead to seemingly purposeful behavior on longer timescales. As a paradigmatic example, we study the simulation of an underactuated snake-like robot. By interacting with the real physical system formed by the robotic hardware and the environment, the controller achieves a sensitive and body-specific actuation of the robot.},
  authorurls = {http://www.nld.ds.mpg.de/nldpeoplefolder.2007-07-17.7548289764/nldperson.2007-12-17.7160605945 and http://www.nld.ds.mpg.de/nldpeoplefolder.2007-07-17.7548289764/nldperson.2007-12-17.4790408658 and and http://www.nld.ds.mpg.de/nldpeoplefolder.2007-07-17.7548289764/nldperson.2007-12-11.8055420465},
  url = {http://www.mdpi.com/1999-4893/2/1/398}
}

@article{Martius2012,
  author   = {Georg Martius},
  title    = {Robustness of guided self-organization against sensorimotor disruptions},
  journal  = {Advances in Complex Systems},
  volume   = {16},
  number   = {02n03},
  pages    = {1350001},
  year     = {2013},
  doi      = {10.1142/S021952591350001X},
  eprint   = {http://www.worldscientific.com/doi/pdf/10.1142/S021952591350001X},
  pdf      = {http://robot.informatik.uni-leipzig.de/research/publications/2012/martius_robustness_of_gso_12_watermark.pdf},
  file     = {martius_robustness_of_gso_12_watermark.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2012/martius_robustness_of_gso_12_watermark.pdf:PDF},
  abstract = {Self-organizing processes are crucial for the development of living beings. Practical applications in robots may benefit from the self-organization of behavior, e.g.~to increase fault tolerance and enhance flexibility, provided that external goals can also be achieved. We present results on the guidance of self-organizing control by visual target stimuli and show a remarkable robustness to sensorimotor disruptions. In a proof of concept study an autonomous wheeled robot is learning an object finding and ball-pushing task from scratch within a few minutes in continuous domains. The robustness is demonstrated by the rapid recovery of the performance after severe changes of the sensor configuration.}
}

@phdthesis{martius:diss10,
  title = {Goal-Oriented Control of Self-Organizing Behavior in Autonomous Robots},
  author = {Georg Martius},
  school = {Georg-August-Universit{\"a}t G{\"o}ttingen},
  year = {2010},
  url = {http://resolver.sub.uni-goettingen.de/purl/?webdoc-2459}
}

@article{MartiusDerAy2013,
  author    = {Georg Martius and Ralf Der and Nihat Ay},
  title     = {Information Driven Self-Organization of Complex Robotic Behaviors},
  journal   = {PLoS ONE},
  publisher = {Public Library of Science},
  volume    = {8},
  number    = {5},
  pages     = {e63400},
  year      = {2013},
  doi       = {10.1371/journal.pone.0063400},
  url       = {http://dx.doi.org/10.1371/journal.pone.0063400},
  preprint  = {http://arxiv.org/abs/1301.7473},
  suppl     = {http://playfulmachines.com/TiPI},
  abstract  = {Information theory is a powerful tool to express principles to drive autonomous systems because it is domain invariant and allows for an intuitive interpretation. This paper studies the use of the predictive information (PI), also called excess entropy or effective measure complexity, of the sensorimotor process as a driving force to generate behavior. We study nonlinear and nonstationary systems and introduce the time-local predicting information (TiPI) which allows us to derive exact results together with explicit update rules for the parameters of the controller in the dynamical systems framework. In this way the information principle, formulated at the level of behavior, is translated to the dynamics of the synapses. We underpin our results with a number of case studies with high-dimensional robotic systems. We show the spontaneous cooperativity in a complex physical system with decentralized control. Moreover, a jointly controlled humanoid robot develops a high behavioral variety depending on its physics and the environment it is dynamically embedded into. The behavior can be decomposed into a succession of low-dimensional modes that increasingly explore the behavior space. This is a promising way to avoid the curse of dimensionality which hinders learning systems to scale well.}
}

@incollection{MartiusDerHerrmann14,
  title = {Robot Learning by Guided Self-Organization},
  author = {Martius, Georg and Der, Ralf and Herrmann, J. Michael},
  booktitle = {Guided Self-Organization: Inception},
  publisher = {Springer Berlin Heidelberg},
  year = {2014},
  editor = {Prokopenko, Mikhail},
  pages = {223--260},
  series = {Emergence, Complexity and Computation},
  volume = {9},
  doi = {10.1007/978-3-642-53734-9_8},
  isbn = {978-3-642-53733-2},
  url = {http://dx.doi.org/10.1007/978-3-642-53734-9_8}
}

@inproceedings{martius:struct_behav08,
  title = {{S}tructure from {B}ehavior in {A}utonomous {A}gents},
  author = {Georg Martius and Katja Fiedler and J.~Michael Herrmann},
  booktitle = {Proc.\ IEEE Intl.\ Conf.\ Intelligent Robots and Systems (IROS 2008)},
  year = {2008},
  pages = {858--862},
  doi = {10.1109/IROS.2008.4651231},
  file = {mfhIROS08.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2008/mfhIROS08.pdf:PDF}
}

@incollection{martiusherrmann:taming10,
  title = {Taming the Beast: Guided Self-organization of Behavior in Autonomous Robots},
  author = {Martius, Georg and Herrmann, J. Michael},
  booktitle = {From Animals to Animats 11},
  publisher = {Springer},
  year = {2010},
  editor = {Doncieux, St{\'e}phane and Girard, Beno{\^i}t and Guillot, Agn{\`e}s and Hallam, John and Meyer, Jean-Arcady and Mouret, Jean-Baptiste},
  pages = {50--61},
  series = {LNCS},
  volume = {6226},
  affiliation = {Bernstein Center for Computational Neuroscience Göttingen, Bunsenstraße 10, 37073 Göttingen, Germany},
  comment = {best paper award},
  doi = {10.1007/978-3-642-15193-4_5},
  file = {taming_the_beast_martius2010.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2010/taming_the_beast_martius2010.pdf:PDF},
  url = {http://dx.doi.org/10.1007/978-3-642-15193-4_5}
}

@article{martiusherrmann:variantsofgso12,
  title = {Variants of guided self-organization for robot control},
  author = {Martius, Georg and Herrmann, J.~Michael},
  journal = {Theory in Biosci.},
  year = {2012},
  number = {3},
  pages = {129--137},
  volume = {131},
  abstract = {Autonomous robots can generate exploratory behavior by self-organization of the sensorimotor loop. We show that the behavioral manifold that is covered in this way can be modified in a goal-dependent way without reducing the self-induced activity of the robot. We present three strategies for guided self-organization, namely by using external rewards, a problem-specific error function or assumptions about the symmetries of the desired behavior. The strategies are analyzed for two different robots in a physically realistic simulation.},
  affiliation = {Bernstein Center for Computational Neuroscience and Max Planck Institute for Dynamics and Self-Organization, Bunsenstr. 10, 37073 Göttingen, Germany},
  doi = {10.1007/s12064-011-0141-0},
  file = {martiusherrmann_variantsofgso_12_watermark.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2012/martiusherrmann_variantsofgso_12_watermark.pdf:PDF},
  issn = {1431-7613},
  pdf = {http://robot.informatik.uni-leipzig.de/research/publications/2012/martiusherrmann_variantsofgso_12_watermark.pdf},
  publisher = {Springer Berlin / Heidelberg},
  url = {http://dx.doi.org/10.1007/s12064-011-0141-0}
}

@incollection{martiusherrmann:tippingscales11,
  title = {Tipping the Scales: Guidance and Intrinsically Motivated Behavior},
  author = {Martius, Georg and Herrmann, J. M.},
  booktitle = {Advances in Artificial Life, ECAL 2011},
  publisher = {MIT Press},
  year = {2011},
  pages = {506--513},
  affiliation = {Max Planck Institute for Mathematics in the Sciences},
  editor = {Tom Lenaerts and Mario Giacobini and Hugues Bersini and Paul Bourgine and Marco Dorigo and Ren{\'e} Doursat},
  file = {martiusherrmann11_tippingscales.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2011/martiusherrmann11_tippingscales.pdf:PDF},
  pdf = {http://robot.informatik.uni-leipzig.de/research/publications/2011/martiusherrmann11_tippingscales.pdf},
  isbn = {978-0-262-29714-1},
  suppl = {http://robot.informatik.uni-leipzig.de/research/supplementary/ECAL2011/}
}

@inproceedings{martius:guidedselforg07,
  title = {Guided Self-organisation for Autonomous Robot Development},
  author = {Georg Martius and J. Michael Herrmann and Ralf Der},
  booktitle = {Advances in Artificial Life 9th European Conference, ECAL 2007},
  year = {2007},
  editor = {Almeida e Costa, Fernando and Rocha, Luis and Costa, Ernesto and Harvey, Inman and Coutinho, Ant{\'o}nio},
  pages = {766--775},
  publisher = {Springer},
  series = {LNCS},
  volume = {4648},
  abstract = {The paper presents a method to guide the self-organised development of behaviours of autonomous robots. In earlier publications we demonstrated how to use the homeokinesis principle and dynamical systems theory to obtain self-organised playful but goal-free behaviour. Now we extend this framework by reinforcement signals. We validate the mechanisms with two experiment with a spherical robot. The first experiment aims at fast motion, where the robot reaches on average about twice the speed of a not reinforcement robot. In the second experiment spinning motion is rewarded and we demonstrate that the robot successfully develops pirouettes and curved motion which only rarely occur among the natural behaviours of the robot.},
  file = {guidedselforg.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2007/guidedselforg.pdf:PDF},
  isbn = {978-3-540-74912-7}
}

@misc{lpzrobots10,
  title = {\textsc{LpzRobots}: A free and powerful robot simulator},
  author = {Martius, Georg and Hesse, Frank and G{\"u}ttler, Frank and Der, Ralf},
  howpublished = {\url{http://robot.informatik.uni-leipzig.de/software}},
  year = {2010}
}

@inproceedings{MartiusJahnHauserHafner2014:Stumpy,
  title = {Self-Exploration of the Stumpy Robot with Predictive Information Maximization},
  author = {Georg Martius and Luisa Jahn and Helmut Hauser and Verena V.~Hafner},
  booktitle = {Proc.\ From Animals to Animats, SAB 2014},
  year = {2014},
  publisher = {Springer},
  series = {LNCS},
  volume = {8575},
  pages = {32--42},
  editor = {del Pobil, Angel P. and Chinellato, Eris and Martinez-Martin, Ester and Hallam, John and Cervera, Enric and Morales, Antonio},
  keywords = {Self-exploration; intrinsic motivation; robot control; information theory; dynamical systems; learning},
  affiliation = {Max Planck Institute for Mathematics in the Sciences},
  file = {MartiusJahnHauserHafner2014:Stumpy.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2014/MartiusJahnHauserHafner2014:Stumpy.pdf:PDF},
  pdf = {http://robot.informatik.uni-leipzig.de/research/publications/2014/MartiusJahnHauserHafner2014:Stumpy.pdf},
  suppl = {http://robot.informatik.uni-leipzig.de/research/supplementary/SAB2014},
  comment = {best paper award}
}

@inproceedings{martius:interaction08,
  title = {Emergence of Interaction Among Adaptive Agents},
  author = {Georg Martius and Stefano Nolfi and J. Michael Herrmann},
  booktitle = {Proc.\ From Animals to Animats 10 (SAB 2008)},
  year = {2008},
  editor = {Minoru Asada and John C. T. Hallam and Jean-Arcady Meyer and Jun Tani},
  pages = {457--466},
  publisher = {Springer},
  series = {LNCS},
  volume = {5040},
  abstract = {Robotic agents can self-organize their interaction with the environment by an adaptive homeokinetic controller that simultaneously maximizes sensitivity of the behavior and predictability of sensory inputs. Based on previous work with single robots, we study the interaction of two homeokinetic agents. We show that this paradigm also produces quasi-social interactions among artificial agents. The results suggest that homeokinetic learning generates social behavior only in the context of an actual encounter of the interaction partner while this does not happen for an identical stimulus pattern that is only replayed. This is in agreement with earlier experiments with human subjects.},
  doi = {10.1007/978-3-540-69134-1_45},
  ee = {http://dx.doi.org/10.1007/978-3-540-69134-1_45},
  file = {Martius_Nolfi_Herrmann08.Interaction.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2008/Martius_Nolfi_Herrmann08.Interaction.pdf:PDF},
  isbn = {978-3-540-69133-4}
}

@article{ZahediMartiusAy2013,
  title = {Linear combination of one-step predictive information with an external reward in an episodic policy gradient setting: a critical analysis},
  author = {Zahedi, Keyan and Martius, Georg and Ay, Nihat},
  journal = {Frontiers in Psychology},
  year = {2013},
  pages = {801},
  volume = {4},
  abstract = {One of the main challenges in the field of embodied artificial intelligence is the open-ended autonomous learning of complex behaviours. Our approach is to use task-independent, information-driven intrinsic motivation(s) to support task-dependent learning. The work presented here is a preliminary step in which we investigate the predictive information (the mutual information of the past and future of the sensor stream) as an intrinsic drive, ideally supporting any kind of task acquisition. Previous experiments have shown that the predictive information (PI) is a good candidate to support autonomous, open-ended learning of complex behaviours, because a maximisation of the PI corresponds to an exploration of morphology- and environment-dependent behavioural regularities. The idea is that these regularities can then be exploited in order to solve any given task. Three different experiments are presented and their results lead to the conclusion that the linear combination of the one-step PI with an external reward function is not generally recommended in an episodic policy gradient setting. Only for hard tasks a great speed-up can be achieved at the cost of an asymptotic performance lost.},
  doi = {10.3389/fpsyg.2013.00801},
  issn = {1664-1078},
  url = {http://www.frontiersin.org/cognitive_science/10.3389/fpsyg.2013.00801/abstract}
}

@inproceedings{ZahediMartiusAy12:gso5,
  author    = {Zahedi, Keyan and Martius, Georg and Ay, Nihat},
  title     = {Predictive information in reinforcement learning of embodied agents},
  booktitle = {Int. Workshop on Guided Self-Organization 5},
  year      = {2012},
  note      = {Abstract},
  file      = {ZahediMartiusAy_PredInfRL_abstract.pdf:http\://robot.informatik.uni-leipzig.de/research/publications/2012/ZahediMartiusAy_PredInfRL_abstract.pdf:PDF}
}

@article{derhessemartius05,
  author = {Der, Ralf and Hesse, Frank and Martius, Georg},
  year = 2006,
  title = {Rocking Stamper and Jumping Snake from a Dynamical System Approach to Artificial Life},
  journal = {Adaptive Behavior},
  volume = 14,
  number = {2},
  pages = {105--115},
  doi = {10.1177/105971230601400202},
  pdf = {http://robot.informatik.uni-leipzig.de/research/publications/2005/rockstump_AdaptBeh.pdf},
  keywords = {autonomous robots, self-organization, homeostasis, homeokinesis, dynamical systems, learning},
  abstract = {Dynamical systems offer intriguing possibilities as a substrate for the generation of behavior because of their rich behavioral complexity. However this complexity   together with the largely covert relation between the parameters and the behavior of the agent is also the main hindrance in the goal-oriented design of a behavior  system. This paper presents a general approach to the self-regulation of dynamical systems so that the design problem is circumvented. We consider the controller (a neural net work) as the mediator for changes in the sensor values over time and   define a dynamics for the parameters of the controller by maximizing the dynamical complexity of the sensorimotor loop under the condition that the consequences of the   actions taken are still predictable. This very general principle is given a concrete mathematical formulation and is implemented in an extremely robust and versatile   algorithm for the parameter dynamics of the controller. We consider two different applications, a mechanical device called the rocking stamper and the ODE simulations   of a "snake" with five degrees of freedom. In these and many other examples studied we observed various behavior modes of high dynamical complexity. }
}