<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="editorial">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychol.</journal-id>
<journal-title>Frontiers in Psychology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychol.</abbrev-journal-title>
<issn pub-type="epub">1664-1078</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyg.2014.00985</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychology</subject>
<subj-group>
<subject>Editorial Article</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Intrinsic motivations and open-ended development in animals, humans, and robots: an overview</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Baldassarre</surname> <given-names>Gianluca</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/7331"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Stafford</surname> <given-names>Tom</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/33026"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Mirolli</surname> <given-names>Marco</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/1104"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Redgrave</surname> <given-names>Peter</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/11534"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Ryan</surname> <given-names>Richard M.</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/72297"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Barto</surname> <given-names>Andrew</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/54562"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Laboratory of Computational Embodied Neuroscience, Institute of Cognitive Sciences and Technologies, National Research Council</institution> <country>Rome, Italy</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Psychology, University of Sheffield</institution> <country>Sheffield, UK</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Clinical and Social Sciences in Psychology, University of Rochester</institution> <country>River, New York, USA</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Computer Science, University of Massachusetts Amherst</institution> <country>Massachusetts, USA</country></aff>
<author-notes>
<fn fn-type="corresp" id="fn001"><p>&#x0002A;Correspondence: <email>gianluca.baldassarre&#x00040;istc.cnr.it</email></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Cognitive Science, a section of the journal Frontiers in Psychology.</p></fn>
<fn fn-type="edited-by"><p>Edited and reviewed by: Eddy J. Davelaar, Birkbeck College, UK</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>09</day>
<month>09</month>
<year>2014</year>
</pub-date>
<pub-date pub-type="collection">
<year>2014</year>
</pub-date>
<volume>5</volume>
<elocation-id>985</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>07</month>
<year>2014</year>
</date>
<date date-type="accepted">
<day>19</day>
<month>08</month>
<year>2014</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2014 Baldassarre, Stafford, Mirolli, Redgrave, Ryan and Barto.</copyright-statement>
<copyright-year>2014</copyright-year>
<license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<kwd-group>
<kwd>intrinsic motivations</kwd>
<kwd>novelty and surprise</kwd>
<kwd>cumulative learning and development</kwd>
<kwd>computational models</kwd>
<kwd>autonomous robotics</kwd>
<kwd>reinforcement learning</kwd>
<kwd>brain and behavior</kwd>
<kwd>review</kwd>
</kwd-group>
<counts>
<fig-count count="0"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="61"/>
<page-count count="5"/>
<word-count count="4609"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="introduction" id="s1">
<title>1. Introduction</title>
<p>This editorial article introduces the Frontiers Research Topic and Electronic Book (eBook) on <italic>Intrinsic Motivations</italic> (IMs), which involved the publication of 24 articles with the journals <italic>Frontiers in Psychology &#x02013; Cognitive Science</italic> and <italic>Frontiers in Neurorobotics</italic>. The main objective of this Frontiers Research Topic is to present state-of-the-art research on IMs and open-ended development from an interdisciplinary perspective involving human and animal psychology, neuroscience, and computational perspectives. We first introduce in this section the main themes and concepts on IMs from different interdisciplinary perspectives. These themes and concepts have been reviewed more extensively in other works (e.g., see Barto et al., <xref ref-type="bibr" rid="B9">2004</xref>; Oudeyer and Kaplan, <xref ref-type="bibr" rid="B38">2007</xref>; Mirolli and Baldassarre, <xref ref-type="bibr" rid="B32">2013</xref>; Barto, <xref ref-type="bibr" rid="B7">2013</xref>), but they are briefly reported here both to meet the needs of the reader new to the field and to introduce the concepts and terms we use in the succeeding sections. In the next four sections, we give an overview of the Topic contributions grouped by four themes. A final section draws the conclusions.</p>
<p>Autonomous development and lifelong open-ended learning are hallmarks of intelligence. Higher mammals, and especially humans, engage in activities that do not appear to directly serve the goals of survival, reproduction, or material advantage. Rather, many activities seem to be carried out &#x0201C;for their own sake&#x0201D; (Berlyne, <xref ref-type="bibr" rid="B11">1966</xref>), play being a prime example, but including other activities driven by curiosity and interest in novel stimuli or surprising events. Autonomously setting goals and working to acquire new forms of competence are also examples of activities that often do not confer obvious evolutionary benefit. Activities like these are thus said to be driven by intrinsic motivations (Baldassarre and Mirolli, <xref ref-type="bibr" rid="B4">2013a</xref>). IMs facilitate the cumulative and virtually open-ended acquisition of knowledge and skills that can later be used to accomplish fitness-enhancing goals (Singh et al., <xref ref-type="bibr" rid="B57">2010</xref>; Baldassarre, <xref ref-type="bibr" rid="B3">2011</xref>). IMs continue during adulthood, and they underlie several important human phenomena such as artistic creativity, scientific discovery, and subjective well-being (Ryan and Deci, <xref ref-type="bibr" rid="B46">2000b</xref>; Schmidhuber, <xref ref-type="bibr" rid="B52">2010</xref>).</p>
<p>IMs were proposed within the animal literature to explain aspects of behavior that could not be explained by the dominant theory of motivation postulating that animals work to reduce physiological imbalances (Hull, <xref ref-type="bibr" rid="B20">1943</xref>). The term &#x0201C;intrinsic motivation&#x0201D; was first used to describe a &#x0201C;manipulation drive&#x0201D; hypothesized to explain why rhesus monkeys would engage with mechanical puzzles for long periods of time without receiving extrinsic rewards (Harlow et al., <xref ref-type="bibr" rid="B19">1950</xref>). Other studies showed how animal instrumental actions can be conditioned with the delivery of apparently neutral stimuli: for example, monkeys were trained to perform actions to gain access to a window from which they could observe conspecifics (Butler, <xref ref-type="bibr" rid="B14">1953</xref>), and mice were trained to perform actions that resulted in clicks or in moving the cage platform (Kish, <xref ref-type="bibr" rid="B23">1955</xref>). The psychological literature on IMs initially linked them to the perceptual properties of stimuli, such as their complexity, novel appearance, or surprising features (Berlyne, <xref ref-type="bibr" rid="B10">1950</xref>, <xref ref-type="bibr" rid="B11">1966</xref>). Later, IMs were also related to action, in particular to the competence (&#x0201C;effectance&#x0201D;) that an agent can acquire to willfully make changes in its environment (White, <xref ref-type="bibr" rid="B60">1959</xref>). This relation of IMs with action and their effects was later linked to the possibility of autonomously setting one&#x00027;s own goals (Ryan and Deci, <xref ref-type="bibr" rid="B45">2000a</xref>).</p>
<p>Computational approaches, in particular machine learning and autonomous robotics, are concerned with IMs and open-ended development as these are thought to have the potential to lead to the construction of truly intelligent artificial systems, in particular systems that are capable of improving their own skills and knowledge <italic>autonomously and indefinitely</italic>. The relation of these studies with those on IMs in psychology were first highlighted by Barto et al. (<xref ref-type="bibr" rid="B9">2004</xref>) and Singh et al. (<xref ref-type="bibr" rid="B56">2005</xref>). The investigation of IMs from a computational perspective can lead to theoretical clarifications, in particular with respect to the computational mechanisms and functions that might underlie IMs (Mirolli and Baldassarre, <xref ref-type="bibr" rid="B32">2013</xref>). IM mechanisms have been classified as being either <italic>knowledge-based</italic> or <italic>competence-based</italic> (Oudeyer and Kaplan, <xref ref-type="bibr" rid="B38">2007</xref>): the former based on measures related to the acquisition of information, and the latter on measures related to the learning of skills. More recently, knowledge-based IMs have been further divided into <italic>novelty-based IMs</italic> and <italic>prediction-based IMs</italic> (Baldassarre and Mirolli, <xref ref-type="bibr" rid="B5">2013b</xref>; Barto et al., <xref ref-type="bibr" rid="B8">2013</xref>). Novelty-based IMs are elicited by the experience of stimuli that are not in the agent&#x00027;s memory (e.g., novel objects, or novel object-object or object-context combinations); prediction-based IMs are related to events that surprise the agent by violating its explicit predictions.</p>
<p>These distinctions have been formalized in the computational models proposed in the literature. Seminal works in machine learning (Schmidhuber, <xref ref-type="bibr" rid="B51">1991</xref>), later developed to function in robots (Oudeyer et al., <xref ref-type="bibr" rid="B39">2007</xref>), have proposed algorithms rewarding actions that allow the agent to improve the quality of a &#x0201C;predictor&#x0201D; component with which it anticipates the effects that such actions produce on the environment. Other researchers have proposed robots capable of detecting and focussing on novel stimuli (e.g., Marsland et al., <xref ref-type="bibr" rid="B28">2005</xref>), or systems capable of detecting anomalies in datasets (Nehmzow et al., <xref ref-type="bibr" rid="B35">2013</xref>). Additional research threads have focussed on action and control, in particular on IMs guiding the autonomous acquisition of motor skills (Barto et al., <xref ref-type="bibr" rid="B9">2004</xref>), on the decision about which of several skills to practice at any time (Schembri et al., <xref ref-type="bibr" rid="B49">2007</xref>; Santucci et al., <xref ref-type="bibr" rid="B47">2013</xref>), and on the the autonomous formation of goals guiding skill acquisition (Baranes and Oudeyer, <xref ref-type="bibr" rid="B6">2013</xref>). Other computational mechanisms related to the idea of IMs are being proposed in the growing field of <italic>active learning</italic>, in particular in relation to supervised learning systems (Settles, <xref ref-type="bibr" rid="B54">2010</xref>).</p>
<p>Recent neuroscientific investigations are revealing brain mechanisms that possibly underlie the IM systems investigated in the behavioral and computational literature. However, unfortunately such investigations are carried out under agendas different from the one on IMs, e.g., in relation to dopamine, memory, motor learning, goal-directed behavior, and conflict monitoring, so comprehensive views are still missing. A large body of research shows how the hippocampus, a brain compound system playing pivotal functions for memory, has the capacity to detect the novelty of various aspects of experience, from the novelty of single items to the novelty of item-item and item-context associations (Ranganath and Rainer, <xref ref-type="bibr" rid="B42">2003</xref>; Kumaran and Maguire, <xref ref-type="bibr" rid="B24">2007</xref>). This detection is then capable of triggering the release of neuromodulators, such as dopamine, that modulate the functioning and learning processes of the hippocampus itself and other brain areas, e.g., of the frontal cortex involved in higher cognition, action planning, and action execution (Lisman and Grace, <xref ref-type="bibr" rid="B26">2005</xref>). Other studies have shown that unexpected stimuli can activate the superior colliculus, a midbrain structure that plays a key role in oculomotor control, which in turn causes phasic bursts of dopamine affecting trial-and-error learning processes happening in basal ganglia, a brain region known to be involved in learning to select actions and other cortex contents (Redgrave and Gurney, <xref ref-type="bibr" rid="B43">2006</xref>). Dopamine signals have also been shown to have an interesting direct relationship with information seeking (Bromberg-Martin and Hikosaka, <xref ref-type="bibr" rid="B13">2009</xref>). Noradrenaline, another neuromodulator targeting a large part of brain, has been shown to be involved in signaling violations of the agent&#x00027;s expectations (Sara, <xref ref-type="bibr" rid="B48">2009</xref>). The failure (Carter et al., <xref ref-type="bibr" rid="B15">1998</xref>) or success (Ribas-Fernandes et al., <xref ref-type="bibr" rid="B44">2011</xref>) in accomplishing goals and sub-goals, possibly themselves set by IMs, has been shown to have neural correlates that might affect succeeding motivation, engagement, and learning. Bio-inspired/bio-constrained computational modeling is linking some of these neuroscientific results to specific computational mechanisms, e.g., in relation to dopamine (e.g., see the pioneering work of Kakade and Dayan, <xref ref-type="bibr" rid="B22">2002</xref>, and Mirolli et al., <xref ref-type="bibr" rid="B33">2013</xref>) and goal-directed behavior (Baldassare et al., <xref ref-type="bibr" rid="B2">2013</xref>).</p>
<p>The 24 interdisciplinary contributions to the present Research Topic can be clustered into four groups. The first group of six contributions (<italic>IMs and brain and behavior</italic>) focuses on different types of IM mechanisms implemented in the brain. The second group of five contributions (<italic>IMs and attention</italic>) focuses on the role of IMs in attention. The third group of eight contributions (<italic>IMs and motor skills</italic>) focuses on IMs as drives for the acquisition of manipulation and navigation skills, often with an emphasis on their function in enabling cumulative, open-ended development. Finally, the fourth group of five contributions (<italic>IMs and social interaction</italic>) focuses on the relationship between IMs and social phenomena, a novel area of investigation of IMs that is increasingly attracting the attention of researchers.</p>
</sec>
<sec>
<title>2. Intrinsic motivations, brain and behavior</title>
<p>The theoretical contribution of Barto et al. (<xref ref-type="bibr" rid="B8">2013</xref>) argues for the importance of distinguishing between <italic>novelty</italic> and <italic>surprise</italic> on the basis of a comprehensive analysis of the computational literature related to the two. It then shows the utility of the distinction for improved understanding of brain and behavior phenomena where the two are often confused. Andringa et al. (<xref ref-type="bibr" rid="B1">2013</xref>) present a broad view of possible relationships between IMs and control, exploration, and agency, linking these processes to the specialization of the left and right hemispheres of the brain and showing how the interplay between these can lead to a progressive sophistication of cognition. Shah and Gurney (<xref ref-type="bibr" rid="B55">2014</xref>) propose a computational model that investigates how basal ganglia, modulated by IMs, can lead to a dynamical shift from noise-based exploration to repetition that can support the acquisition of both simple and more complex motor skills (in the present case, simulated reaching skills). Boedecker et al. (<xref ref-type="bibr" rid="B12">2013</xref>) propose a computational model based on the distinction between dorsal and ventro-medial basal ganglia regions (supporting respectively habitual and goal-directed behavior). Through the model, the authors analyze the relation between these brain regions and IMs concerning reasoning costs and the value of information. This analysis is used to account for some empirical phenomena concerning the relationship between extrinsic and IMs. Fiore et al. (<xref ref-type="bibr" rid="B17">2014</xref>) propose a biologically-constrained computational model that also focuses on different portions of basal ganglia. The model shows how these regions can be differentially regulated by a unique tonic dopaminergic signal, linked to both intrinsic and extrinsic motivations, on the basis of their different sensitivity to dopamine. The model, also tested with the simulated humanoid robot iCub, shows how these modulatory mechanisms can play important adaptive functions for the control of overt attention, manipulation, and goal-directed processes. Thirkettle et al. (<xref ref-type="bibr" rid="B58">2013</xref>) introduce the novel &#x0201C;Joystick experimental paradigm&#x0201D; developed to study intrinsically and extrinsically driven acquisition of actions. The authors demonstrate the function and effectiveness of this paradigm by presenting behavioral experiments grounded in the neuroscientific literature and concerning the acquisition of non-trivial motor actions.</p>
</sec>
<sec>
<title>3. Intrinsic motivations and attention</title>
<p>The computational work of Lonini et al. (<xref ref-type="bibr" rid="B27">2013</xref>) builds on a previous binocular system in which an IM learning signal is generated on the basis of the capacity of the system to reconstruct images encoded with sparse-coding features. This signal guides the acquisition of attention and vergence skills by reinforcement learning. The contribution here focuses on demonstrating the robustness of the system, in particular for recovering from disturbances and for self-recalibration. Di Nocera et al. (<xref ref-type="bibr" rid="B16">2014</xref>) present a behavior-based architecture that uses curiosity drives to improve the attentional capabilities of a reinforcement learning robot engaged in solving simulated survival &#x0201C;extrinsic&#x0201D; tasks. Overall, the work shows the utility of IMs to improve attention and, based on this, action selection. Mather (<xref ref-type="bibr" rid="B29">2013</xref>) briefly reviews research related to the familiarity-to-novelty attention shift observed in babies, and, on this basis, highlights the challenges that this phenomenon poses to theories on IMs. Perone and Spencer (<xref ref-type="bibr" rid="B40">2013</xref>) also deal with the familiarity-to-novelty shift. In particular, the authors propose a dynamical-field model that offers an explanation of the phenomenon as emerging from the autonomous accumulation of visual experience under the guidance of novelty-based IMs. Schlesinger and Amso (<xref ref-type="bibr" rid="B50">2013</xref>), referring to the results of tests of both human and computational agents engaged in solving a visual-exploration task, propose that free viewing of natural images in human infants can be understood as the effect of intrinsically motivated visual exploration driven by the goal of producing predictable gaze sequences. The authors highlight the implications of their approach for understanding visual development in infants.</p>
</sec>
<sec>
<title>4. Intrinsic motivations and open-ended development of motor skills</title>
<p>Santucci et al. (<xref ref-type="bibr" rid="B47">2013</xref>) focus on the problem of which IM signals are best suited to decide which skills to learn by reinforcement learning given a set of tasks. By comparing the results of systems receiving different IM signals, they show that the best IM signals are those based on mechanisms that measure the improvement of the skill competence rather than the errors, or error improvements, of predictors of the action effects on the environment. In a theoretical machine learning contribution, Schmidhuber (<xref ref-type="bibr" rid="B53">2013</xref>) proposes a system that automatically invents computational problems in order to train an increasingly-general problem solver. IM signals driving learning are generated when the system finds more efficient skills to solve all the problems generated thus far. In a similar vein, Ngo et al. (<xref ref-type="bibr" rid="B36">2013</xref>) propose an architecture for controlling a Katana simulated and real robot interacting with a blocks-world. The system is capable of self-generating goals based on its confidence in its predictions about how the environment will react to its actions. Zahedi et al. (<xref ref-type="bibr" rid="B61">2013</xref>) propose the use of task-independent IMs to support task-dependent learning on the basis of the mutual information of the past and future elements of sensor streams (predictive information). The authors conclude that a combination of predictive information with external rewards is recommended only for hard tasks to speed-up learning but at the cost of an asymptotic performance lost. Metzen and Kirchner (<xref ref-type="bibr" rid="B31">2013</xref>) propose a reinforcement learning model that self-generates tasks on the basis of graphs of states and selects the skills to learn on the basis of both novelty-based and prediction-based IMs. The system is tested with navigating and octopus-like simulated robots acting in continuous domains. Inspired by infant cognition, Pitti et al. (<xref ref-type="bibr" rid="B41">2013</xref>) present a reinforcement-learning bio-inspired gain-fields system for learning task-sets (areas of the sensorimotor space having a common underlying cause-effect structure). The system, tested in a cognitive task and with a Kinova robot arm, is capable of recognizing a given task-set as familiar and can create a new representation for it on the basis of its uncertainty and related prediction errors. Frank et al. (<xref ref-type="bibr" rid="B18">2014</xref>) propose a system for controlling the humanoid robot iCub that explores the state-action space on the basis of information gain maximization so as to improve the learning of the world model used for real-time motion planning. Law et al. (<xref ref-type="bibr" rid="B25">2014</xref>) present a schema-based memory system inspired by child early sensorimotor development for controlling the iCub robot. The system undergoes a staged learning process to acquire eye-arm reaching skills and basic manipulation skills under the guidance of novelty- and prediction-based IMs, and the progressive release of constraints focussing attention and learning on relevant experiences.</p>
</sec>
<sec>
<title>5. Intrinsic motivations and social phenomena</title>
<p>In a contribution based on game theory, Merrick and Shafi (<xref ref-type="bibr" rid="B30">2013</xref>) propose the concept of &#x0201C;optimally motivating incentive&#x0201D; for game players, and show how different instances of such an incentive (i.e., strong power, affiliation, and achievement motivation) can be used in both modeling human behavior and designing effective artificial agents. The theoretical contribution of Triesch (<xref ref-type="bibr" rid="B59">2013</xref>) starts from the idea of IMs serving the function of learning &#x0201C;efficient coding&#x0201D; of sensory data and proposes that imitation can emerge as the consequence of a general intrinsic drive to compress information that leads to matching one&#x00027;s own actions with those of the imitated tutor. Moulin-Frier et al. (<xref ref-type="bibr" rid="B34">2013</xref>) propose a model of the initial staged development of speech in infants. IMs initially drive the system to learn the control of phonation, then to produce unarticulated sounds, and finally to produce proto-syllables. The model is tested with a simulator of the vocal tract, the auditory system, the agent&#x00027;s motor control, and social interactions with peers. The contribution of Ogino et al. (<xref ref-type="bibr" rid="B37">2013</xref>) proposes a reinforcement learning model of parent-child engagement where learning signals, similar to phasic dopamine signals, are caused by both extrinsic and intrinsic information, in particular related to the presence and novelty of emotional facial expressions. Finally, Jauffret et al. (<xref ref-type="bibr" rid="B21">2013</xref>) propose a bio-inspired neural architecture that uses a prediction-based algorithm applied to sensorimotor contingencies to solve complex navigation tasks and is capable of asking for help in dead-lock situations.</p>
</sec>
<sec>
<title>6. Concluding remarks</title>
<p>The papers of the present Research Topic testify to the existence of ample interest on the Topic issues. At the same time, they show that the literature on IMs is still characterized by a heterogeneity of perspectives on their possible roles in cognition and behavior and on the possible mechanisms supporting them. On the one side, this heterogeneity is expected given the recency of the attempts to systematize the psychological, neuroscientific, and computational views on IMs within broad interdisciplinary frameworks. On the other side, the heterogeneity is also an indication of the richness of intrinsically motivated phenomena, of their importance for animals&#x00027; cognition and behavior, and of their utility for the design of autonomous robots and intelligent machines. The richness of this topic is expected to result in a further strengthening of the research in the field over the near future.</p>
<sec>
<title>Conflict of interest statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
</sec>
</body>
<back>
<ack>
<p>This research has received funds from the European Commission 7th Framework Programme (FP7/2007-2013), &#x0201C;Challenge 2&#x02014;Cognitive Systems, Interaction, Robotics,&#x0201D; Grant Agreement No. ICT-IP-231722, Project &#x0201C;IM-CLeVeR&#x02014;Intrinsically Motivated Cumulative Learning Versatile Robots.&#x0201D; This Frontiers Topic was accomplished as a deliverable of the IM-CLeVeR Project.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Andringa</surname> <given-names>T. C.</given-names></name> <name><surname>van den Bosch</surname> <given-names>K. A.</given-names></name> <name><surname>Vlaskamp</surname> <given-names>C.</given-names></name></person-group> (<year>2013</year>). <article-title>Learning autonomy in two or three steps: linking open-ended development, authority, and agency to motivation</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>766</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00766</pub-id><pub-id pub-id-type="pmid">24155734</pub-id></citation>
</ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baldassare</surname> <given-names>G.</given-names></name> <name><surname>Mannella</surname> <given-names>F.</given-names></name> <name><surname>Fiore</surname> <given-names>V. G.</given-names></name> <name><surname>Redgrave</surname> <given-names>P.</given-names></name> <name><surname>Gurney</surname> <given-names>K.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name></person-group> (<year>2013</year>). <article-title>Intrinsically motivated action-outcome learning and goal-based action recall: a system-level bio-constrained computational model</article-title>. <source>Neural Netw</source>. <volume>41</volume>, <fpage>168</fpage>&#x02013;<lpage>187</lpage>. <pub-id pub-id-type="doi">10.1016/j.neunet.2012.09.015</pub-id><pub-id pub-id-type="pmid">23098753</pub-id></citation>
</ref>
<ref id="B3">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Baldassarre</surname> <given-names>G.</given-names></name></person-group> (<year>2011</year>). <article-title>What are intrinsic motivations? a biological perspective</article-title>, in <source>Proceedings of the International Conference on Development and Learning and Epigenetic Robotics (ICDL-EpiRob-2011)</source>, eds <person-group person-group-type="editor"><name><surname>Cangelosi</surname> <given-names>A.</given-names></name> <name><surname>Triesch</surname> <given-names>J.</given-names></name> <name><surname>Fasel</surname> <given-names>I.</given-names></name> <name><surname>Rohlfing</surname> <given-names>K.</given-names></name> <name><surname>Nori</surname> <given-names>F.</given-names></name> <name><surname>Oudeyer</surname> <given-names>P.-Y.</given-names></name> <etal/></person-group>. (<publisher-loc>New York, NY</publisher-loc>:<publisher-name>IEEE</publisher-name>), <fpage>E1</fpage>&#x02013;<lpage>E8</lpage>.</citation>
</ref>
<ref id="B4">
<citation citation-type="book"><person-group person-group-type="editor"><name><surname>Baldassarre</surname> <given-names>G.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name></person-group> (Eds.). (<year>2013a</year>). <source>Intrinsically Motivated Learning in Natural and Artificial Systems</source>. <publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer</publisher-name>. <pub-id pub-id-type="doi">10.1007/978-3-642-32375-1</pub-id></citation>
</ref>
<ref id="B5">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Baldassarre</surname> <given-names>G.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name></person-group> (<year>2013b</year>). <article-title>Intrinsically motivated learning systems: an overview</article-title>, in <source>Intrinsically Motivated Learning in Natural and Artificial Systems</source>, eds <person-group person-group-type="editor"><name><surname>Baldassarre</surname> <given-names>G.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name></person-group> (<publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer-Verlag</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-642-32375-1_1</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baranes</surname> <given-names>A.</given-names></name> <name><surname>Oudeyer</surname> <given-names>P.</given-names></name></person-group> (<year>2013</year>). <article-title>Active learning of inverse models with intrinsically motivated goal exploration in robots</article-title>. <source>Robot. Auton. Syst</source>. <volume>61</volume>, <fpage>49</fpage>&#x02013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.1016/j.robot.2012.05.008</pub-id></citation>
</ref>
<ref id="B7">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Barto</surname> <given-names>A.</given-names></name></person-group> (<year>2013</year>). <article-title>Intrinsic motivation and reinforcement learning</article-title>, in <source>Intrinsically Motivated Learning in Natural and Artificial Systems</source>, eds <person-group person-group-type="editor"><name><surname>Baldassarre</surname> <given-names>G.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name></person-group> (<publisher-loc>Berlin</publisher-loc>:<publisher-name>Springer-Verlag</publisher-name>), <fpage>17</fpage>&#x02013;<lpage>47</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-642-32375-1_2</pub-id></citation>
</ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barto</surname> <given-names>A.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name> <name><surname>Baldassarre</surname> <given-names>G.</given-names></name></person-group> (<year>2013</year>). <article-title>Novelty or suprise?</article-title> <source>Front. Psychol</source>. <volume>4</volume>:<issue>907</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00907</pub-id><pub-id pub-id-type="pmid">24376428</pub-id></citation>
</ref>
<ref id="B9">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Barto</surname> <given-names>A. G.</given-names></name> <name><surname>Singh</surname> <given-names>S.</given-names></name> <name><surname>Chentanez</surname> <given-names>N.</given-names></name></person-group> (<year>2004</year>). <article-title>Intrinsically motivated learning of hierarchical collections of skills</article-title>, in <source>International Conference on Developmental Learning (ICDL2004)</source>, eds <person-group person-group-type="editor"><name><surname>Triesch</surname> <given-names>J.</given-names></name> <name><surname>Jebara</surname> <given-names>T.</given-names></name></person-group> (<publisher-loc>New York, NY</publisher-loc>:<publisher-name>IEEE</publisher-name>), <fpage>112</fpage>&#x02013;<lpage>119</lpage>.</citation>
</ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Berlyne</surname> <given-names>D. E.</given-names></name></person-group> (<year>1950</year>). <article-title>Novelty and curiosity as determinants of exploratory behaviour</article-title>. <source>Br. J. Psychol. Gen. Sec</source>. <volume>41</volume>, <fpage>68</fpage>&#x02013;<lpage>80</lpage>. <pub-id pub-id-type="doi">10.1111/j.2044-8295.1950.tb00262.x</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Berlyne</surname> <given-names>D. E.</given-names></name></person-group> (<year>1966</year>). <article-title>Curiosity and exploration</article-title>. <source>Science</source> <volume>143</volume>, <fpage>25</fpage>&#x02013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1126/science.153.3731.25</pub-id><pub-id pub-id-type="pmid">5328120</pub-id></citation>
</ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Boedecker</surname> <given-names>J.</given-names></name> <name><surname>Lampe</surname> <given-names>T.</given-names></name> <name><surname>Riedmiller</surname> <given-names>M.</given-names></name></person-group> (<year>2013</year>). <article-title>Modeling effects of intrinsic and extrinsic rewards on the competition between striatal learning systems</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>739</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00739</pub-id><pub-id pub-id-type="pmid">24137146</pub-id></citation>
</ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bromberg-Martin</surname> <given-names>E. S.</given-names></name> <name><surname>Hikosaka</surname> <given-names>O.</given-names></name></person-group> (<year>2009</year>). <article-title>Midbrain dopamine neurons signal preference for advance information about upcoming rewards</article-title>. <source>Neuron</source> <volume>63</volume>, <fpage>119</fpage>&#x02013;<lpage>126</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuron.2009.06.009</pub-id><pub-id pub-id-type="pmid">19607797</pub-id></citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Butler</surname> <given-names>R.</given-names></name></person-group> (<year>1953</year>). <article-title>Discrimination learning by rhesus monkeys to visual-exploration motivation</article-title>. <source>J. Comp. Physiol. Psychol</source>. <volume>46</volume>:<fpage>95</fpage>. <pub-id pub-id-type="doi">10.1037/h0061616</pub-id><pub-id pub-id-type="pmid">13044866</pub-id></citation>
</ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carter</surname> <given-names>C. S.</given-names></name> <name><surname>Braver</surname> <given-names>T. S.</given-names></name> <name><surname>Barch</surname> <given-names>D. M.</given-names></name> <name><surname>Botvinick</surname> <given-names>M. M.</given-names></name> <name><surname>Noll</surname> <given-names>D.</given-names></name> <name><surname>Cohen</surname> <given-names>J. D.</given-names></name></person-group> (<year>1998</year>). <article-title>Anterior cingulate cortex, error detection, and the online monitoring of performance</article-title>. <source>Science</source> <volume>280</volume>, <fpage>747</fpage>&#x02013;<lpage>749</lpage>. <pub-id pub-id-type="doi">10.1126/science.280.5364.747</pub-id><pub-id pub-id-type="pmid">9563953</pub-id></citation>
</ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Di Nocera</surname> <given-names>D.</given-names></name> <name><surname>Finzi</surname> <given-names>A.</given-names></name> <name><surname>Rossi</surname> <given-names>S.</given-names></name> <name><surname>Staffa</surname> <given-names>M.</given-names></name></person-group> (<year>2014</year>). <article-title>The role of intrinsic motivations in attention allocation and shifting</article-title>. <source>Front. Psychol</source>. <volume>5</volume>:<issue>273</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2014.00273</pub-id><pub-id pub-id-type="pmid">24744746</pub-id></citation>
</ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fiore</surname> <given-names>V. G.</given-names></name> <name><surname>Sperati</surname> <given-names>V.</given-names></name> <name><surname>Mannella</surname> <given-names>F.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name> <name><surname>Gurney</surname> <given-names>K.</given-names></name> <name><surname>Friston</surname> <given-names>K.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Keep focussing: striatal dopamine multiple functions resolved in a single mechanism tested in a simulated humanoid robot</article-title>. <source>Front. Psychol</source>. <volume>5</volume>:<issue>124</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2014.00124</pub-id><pub-id pub-id-type="pmid">24600422</pub-id></citation>
</ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Frank</surname> <given-names>M.</given-names></name> <name><surname>Leitner</surname> <given-names>J.</given-names></name> <name><surname>Stollenga</surname> <given-names>M.</given-names></name> <name><surname>Forster</surname> <given-names>A.</given-names></name> <name><surname>Schmidhuber</surname> <given-names>J.</given-names></name></person-group> (<year>2014</year>). <article-title>Curiosity driven reinforcement learning for motion planning on humanoids</article-title>. <source>Front. Neurorobot</source>. <volume>7</volume>:<issue>25</issue>. <pub-id pub-id-type="doi">10.3389/fnbot.2013.00025</pub-id><pub-id pub-id-type="pmid">24432001</pub-id></citation>
</ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Harlow</surname> <given-names>H.</given-names></name> <name><surname>Harlow</surname> <given-names>M.</given-names></name> <name><surname>Meyer</surname> <given-names>D.</given-names></name></person-group> (<year>1950</year>). <article-title>Learning motivated by a manipulation drive</article-title>. <source>J. Exp. Psychol</source>. <volume>40</volume>:<fpage>228</fpage>. <pub-id pub-id-type="doi">10.1037/h0056906</pub-id><pub-id pub-id-type="pmid">15415520</pub-id></citation>
</ref>
<ref id="B20">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Hull</surname> <given-names>C. L.</given-names></name></person-group> (<year>1943</year>). <source>Principles of Behavior</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Appleton-century-crofts</publisher-name>.</citation>
</ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jauffret</surname> <given-names>A.</given-names></name> <name><surname>Cuperlier</surname> <given-names>N.</given-names></name> <name><surname>Tarroux</surname> <given-names>P.</given-names></name> <name><surname>Gaussier</surname> <given-names>P.</given-names></name></person-group> (<year>2013</year>). <article-title>From self-assessment to frustration, a small step toward autonomy in robotic navigation</article-title>. <source>Front. Neurorobot</source>. <volume>7</volume>:<issue>16</issue>. <pub-id pub-id-type="doi">10.3389/fnbot.2013.00016</pub-id><pub-id pub-id-type="pmid">24115931</pub-id></citation>
</ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kakade</surname> <given-names>S.</given-names></name> <name><surname>Dayan</surname> <given-names>P.</given-names></name></person-group> (<year>2002</year>). <article-title>Dopamine: generalization and bonuses</article-title>. <source>Neural Netw</source>. <volume>15</volume>, <fpage>549</fpage>&#x02013;<lpage>559</lpage>. <pub-id pub-id-type="doi">10.1016/S0893-6080(02)00048-5</pub-id><pub-id pub-id-type="pmid">12371511</pub-id></citation>
</ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kish</surname> <given-names>G.</given-names></name></person-group> (<year>1955</year>). <article-title>Learning when the onset of illumination is used as the reinforcing stimulus</article-title>. <source>J. Comp. Physiol. Psychol</source>. <volume>48</volume>, <fpage>261</fpage>&#x02013;<lpage>264</lpage>. <pub-id pub-id-type="doi">10.1037/h0040782</pub-id><pub-id pub-id-type="pmid">13252153</pub-id></citation>
</ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumaran</surname> <given-names>D.</given-names></name> <name><surname>Maguire</surname> <given-names>E. A.</given-names></name></person-group> (<year>2007</year>). <article-title>Which computational mechanisms operate in the hippocampus during novelty detection?</article-title> <source>Hippocampus</source> <volume>17</volume>, <fpage>735</fpage>&#x02013;<lpage>748</lpage>. <pub-id pub-id-type="doi">10.1002/hipo.20326</pub-id><pub-id pub-id-type="pmid">17598148</pub-id></citation>
</ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Law</surname> <given-names>J.</given-names></name> <name><surname>Shaw</surname> <given-names>P.</given-names></name> <name><surname>Kevin</surname> <given-names>E.</given-names></name> <name><surname>Sheldon</surname> <given-names>M.</given-names></name> <name><surname>Lee</surname> <given-names>M.</given-names></name></person-group> (<year>2014</year>). <article-title>A psychology based approach for longitudinal development in cognitive robotics</article-title>. <source>Front. Neurorobot</source>. <volume>8</volume>:<issue>1</issue>. <pub-id pub-id-type="doi">10.3389/fnbot.2014.00001</pub-id><pub-id pub-id-type="pmid">24478693</pub-id></citation>
</ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lisman</surname> <given-names>J. E.</given-names></name> <name><surname>Grace</surname> <given-names>A. A.</given-names></name></person-group> (<year>2005</year>). <article-title>The hippocampal-VTA loop: controlling the entry of information into long-term memory</article-title>. <source>Neuron</source> <volume>46</volume>, <fpage>703</fpage>&#x02013;<lpage>713</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuron.2005.05.002</pub-id><pub-id pub-id-type="pmid">15924857</pub-id></citation>
</ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lonini</surname> <given-names>L.</given-names></name> <name><surname>Forestier</surname> <given-names>S.</given-names></name> <name><surname>Teuliere</surname> <given-names>C.</given-names></name> <name><surname>Zhao</surname> <given-names>Y.</given-names></name> <name><surname>Shi</surname> <given-names>B. E.</given-names></name> <name><surname>Triesch</surname> <given-names>J.</given-names></name></person-group> (<year>2013</year>). <article-title>Robust active binocular vision through intrinsically motivated learning</article-title>. <source>Front. Neurorobot</source>. <volume>7</volume>:<issue>20</issue>. <pub-id pub-id-type="doi">10.3389/fnbot.2013.00020</pub-id><pub-id pub-id-type="pmid">24223552</pub-id></citation>
</ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Marsland</surname> <given-names>S.</given-names></name> <name><surname>Nehmzow</surname> <given-names>U.</given-names></name> <name><surname>Shapiro</surname> <given-names>J.</given-names></name></person-group> (<year>2005</year>). <article-title>On-line novelty detection for autonomous mobile robots</article-title>. <source>Robot. Auton. Syst</source>. <volume>51</volume>, <fpage>191</fpage>&#x02013;<lpage>206</lpage>. <pub-id pub-id-type="doi">10.1016/j.robot.2004.10.006</pub-id></citation>
</ref>
<ref id="B29">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mather</surname> <given-names>E.</given-names></name></person-group> (<year>2013</year>). <article-title>Novelty, attention, and challenges for developmental psychology</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>491</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00491</pub-id><pub-id pub-id-type="pmid">23914182</pub-id></citation>
</ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Merrick</surname> <given-names>K. E.</given-names></name> <name><surname>Shafi</surname> <given-names>K.</given-names></name></person-group> (<year>2013</year>). <article-title>A game theoretic framework for incentive-based models of intrinsic motivation in artificial systems</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>791</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00791</pub-id><pub-id pub-id-type="pmid">24198797</pub-id></citation>
</ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Metzen</surname> <given-names>J. H.</given-names></name> <name><surname>Kirchner</surname> <given-names>F.</given-names></name></person-group> (<year>2013</year>). <article-title>Incremental learning of skill collections based on intrinsic motivation</article-title>. <source>Front. Neurorobot</source>. <volume>7</volume>:<issue>11</issue>. <pub-id pub-id-type="doi">10.3389/fnbot.2013.00011</pub-id><pub-id pub-id-type="pmid">23898265</pub-id></citation>
</ref>
<ref id="B32">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Mirolli</surname> <given-names>M.</given-names></name> <name><surname>Baldassarre</surname> <given-names>G.</given-names></name></person-group> (<year>2013</year>). <article-title>Functions and mechanisms of intrinsic motivations: the knowledge versus competence distinction</article-title>, in <source>Intrinsically Motivated Learning in Natural and Artificial Systems</source>, eds <person-group person-group-type="editor"><name><surname>Baldassarre</surname> <given-names>G.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name></person-group> (<publisher-loc>Berlin</publisher-loc>:<publisher-name>Springer-Verlag</publisher-name>), <fpage>49</fpage>&#x02013;<lpage>72</lpage>.</citation>
</ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mirolli</surname> <given-names>M.</given-names></name> <name><surname>Baldassarre</surname> <given-names>G.</given-names></name> <name><surname>Santucci</surname> <given-names>V. G.</given-names></name></person-group> (<year>2013</year>). <article-title>Phasic dopamine as a prediction error of intrinsic and extrinsic reinforcement driving both action acquisition and reward maximization: a simulated robotic study</article-title>. <source>Neural Netw</source>. <volume>39</volume>, <fpage>40</fpage>&#x02013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1016/j.neunet.2012.12.012</pub-id><pub-id pub-id-type="pmid">23353115</pub-id></citation>
</ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moulin-Frier</surname> <given-names>C.</given-names></name> <name><surname>Nguyen</surname> <given-names>S. M.</given-names></name> <name><surname>Oudeyer</surname> <given-names>P.-Y.</given-names></name></person-group> (<year>2013</year>). <article-title>Self-organization of early vocal development in infants and machines: the role of intrinsic motivation</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>1006</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.01006</pub-id><pub-id pub-id-type="pmid">24474941</pub-id></citation>
</ref>
<ref id="B35">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Nehmzow</surname> <given-names>U.</given-names></name> <name><surname>Gatsoulis</surname> <given-names>Y.</given-names></name> <name><surname>Kerr</surname> <given-names>E.</given-names></name> <name><surname>Condell</surname> <given-names>J.</given-names></name> <name><surname>Siddique</surname> <given-names>N.</given-names></name> <name><surname>McGinnity</surname> <given-names>M. T.</given-names></name></person-group> (<year>2013</year>). <article-title>Novelty detection as an intrinsic motivation for cumulative learning robots</article-title>, in <source>Intrinsically Motivated Learning in Natural and Artificial Systems</source>, eds <person-group person-group-type="editor"><name><surname>Baldassarre</surname> <given-names>G.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name></person-group> (<publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer-Verlag</publisher-name>), <fpage>185</fpage>&#x02013;<lpage>207</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-642-32375-1_8</pub-id></citation>
</ref>
<ref id="B36">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ngo</surname> <given-names>H.</given-names></name> <name><surname>Luciw</surname> <given-names>M.</given-names></name> <name><surname>Forster</surname> <given-names>A.</given-names></name> <name><surname>Schmidhuber</surname> <given-names>J.</given-names></name></person-group> (<year>2013</year>). <article-title>Confidence-based progress-driven self-generated goals for skill acquisition in developmental robots</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>833</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00833</pub-id><pub-id pub-id-type="pmid">24324448</pub-id></citation>
</ref>
<ref id="B37">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ogino</surname> <given-names>M.</given-names></name> <name><surname>Nishikawa</surname> <given-names>A.</given-names></name> <name><surname>Asada</surname> <given-names>M.</given-names></name></person-group> (<year>2013</year>). <article-title>A motivation model for interaction between parent and child based on the need for relatedness</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>618</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00618</pub-id><pub-id pub-id-type="pmid">24062710</pub-id></citation>
</ref>
<ref id="B38">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Oudeyer</surname> <given-names>P.</given-names></name> <name><surname>Kaplan</surname> <given-names>F.</given-names></name></person-group> (<year>2007</year>). <article-title>What is intrinsic motivation? A typology of computational approaches</article-title>. <source>Front. Neurorobot</source>. <volume>1</volume>:<issue>6</issue>. <pub-id pub-id-type="doi">10.3389/neuro.12.006.2007</pub-id><pub-id pub-id-type="pmid">18958277</pub-id></citation>
</ref>
<ref id="B39">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Oudeyer</surname> <given-names>P.</given-names></name> <name><surname>Kaplan</surname> <given-names>F.</given-names></name> <name><surname>Hafner</surname> <given-names>V.</given-names></name></person-group> (<year>2007</year>). <article-title>Intrinsic motivation systems for autonomous mental development</article-title>. <source>IEEE Trans. Evol. Comput</source>. <volume>11</volume>, <fpage>265</fpage>&#x02013;<lpage>286</lpage>. <pub-id pub-id-type="doi">10.1109/TEVC.2006.890271</pub-id></citation>
</ref>
<ref id="B40">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Perone</surname> <given-names>S.</given-names></name> <name><surname>Spencer</surname> <given-names>J. P.</given-names></name></person-group> (<year>2013</year>). <article-title>Autonomous visual exploration creates developmental change in familiarity and novelty seeking behaviors</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>648</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00648</pub-id><pub-id pub-id-type="pmid">24065948</pub-id></citation>
</ref>
<ref id="B41">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pitti</surname> <given-names>A.</given-names></name> <name><surname>Braud</surname> <given-names>R.</given-names></name> <name><surname>Mahe</surname> <given-names>S.</given-names></name> <name><surname>Quoy</surname> <given-names>M.</given-names></name> <name><surname>Gaussier</surname> <given-names>P.</given-names></name></person-group> (<year>2013</year>). <article-title>Neural model for learning-to-learn of novel task sets in the motor domain</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>771</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00771</pub-id><pub-id pub-id-type="pmid">24155736</pub-id></citation>
</ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ranganath</surname> <given-names>C.</given-names></name> <name><surname>Rainer</surname> <given-names>G.</given-names></name></person-group> (<year>2003</year>). <article-title>Neural mechanisms for detecting and remembering novel events</article-title>. <source>Nat. Rev. Neurosci</source>. <volume>4</volume>, <fpage>193</fpage>&#x02013;<lpage>202</lpage>. <pub-id pub-id-type="doi">10.1038/nrn1052</pub-id><pub-id pub-id-type="pmid">12612632</pub-id></citation>
</ref>
<ref id="B43">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Redgrave</surname> <given-names>P.</given-names></name> <name><surname>Gurney</surname> <given-names>K.</given-names></name></person-group> (<year>2006</year>). <article-title>The short-latency dopamine signal: a role in discovering novel actions?</article-title> <source>Nat. Rev. Neurosci</source>. <volume>7</volume>, <fpage>967</fpage>&#x02013;<lpage>975</lpage>. <pub-id pub-id-type="doi">10.1038/nrn2022</pub-id><pub-id pub-id-type="pmid">17115078</pub-id></citation>
</ref>
<ref id="B44">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ribas-Fernandes</surname> <given-names>J. J. F.</given-names></name> <name><surname>Solway</surname> <given-names>A.</given-names></name> <name><surname>Diuk</surname> <given-names>C.</given-names></name> <name><surname>McGuire</surname> <given-names>J. T.</given-names></name> <name><surname>Barto</surname> <given-names>A. G.</given-names></name> <name><surname>Niv</surname> <given-names>Y.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>A neural signature of hierarchical reinforcement learning</article-title>. <source>Neuron</source> <volume>71</volume>, <fpage>370</fpage>&#x02013;<lpage>379</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuron.2011.05.042</pub-id><pub-id pub-id-type="pmid">21791294</pub-id></citation>
</ref>
<ref id="B45">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ryan</surname> <given-names>R.</given-names></name> <name><surname>Deci</surname> <given-names>E.</given-names></name></person-group> (<year>2000a</year>). <article-title>Intrinsic and extrinsic motivations: Classic definitions and new directions</article-title>. <source>Contemp. Educ. Psychol</source>. <volume>25</volume>, <fpage>54</fpage>&#x02013;<lpage>67</lpage>. <pub-id pub-id-type="doi">10.1006/ceps.1999.1020</pub-id><pub-id pub-id-type="pmid">10620381</pub-id></citation>
</ref>
<ref id="B46">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ryan</surname> <given-names>R. M.</given-names></name> <name><surname>Deci</surname> <given-names>E. L.</given-names></name></person-group> (<year>2000b</year>). <article-title>Self-determination theory and the facilitation of intrinsic motivation, social development, and well-being</article-title>. <source>Am. Psychol</source>. <volume>55</volume>, <fpage>68</fpage>&#x02013;<lpage>78</lpage>. <pub-id pub-id-type="doi">10.1037/0003-066X.55.1.68</pub-id><pub-id pub-id-type="pmid">11392867</pub-id></citation>
</ref>
<ref id="B47">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Santucci</surname> <given-names>V. G.</given-names></name> <name><surname>Baldassarre</surname> <given-names>G.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name></person-group> (<year>2013</year>). <article-title>Which is the best intrinsic motivation signal for learning multiple skills?</article-title> <source>Front. Neurorobot</source>. <volume>7</volume>:<issue>22</issue>. <pub-id pub-id-type="doi">10.3389/fnbot.2013.00022</pub-id><pub-id pub-id-type="pmid">24273511</pub-id></citation>
</ref>
<ref id="B48">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sara</surname> <given-names>S. J.</given-names></name></person-group> (<year>2009</year>). <article-title>The locus coeruleus and noradrenergic modulation of cognition</article-title>. <source>Nat. Rev. Neurosci</source>. <volume>10</volume>, <fpage>211</fpage>&#x02013;<lpage>223</lpage>. <pub-id pub-id-type="doi">10.1038/nrn2573</pub-id><pub-id pub-id-type="pmid">19190638</pub-id></citation>
</ref>
<ref id="B49">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Schembri</surname> <given-names>M.</given-names></name> <name><surname>Mirolli</surname> <given-names>M.</given-names></name> <name><surname>Baldassarre</surname> <given-names>G.</given-names></name></person-group> (<year>2007</year>). <article-title>Evolving internal reinforcers for an intrinsically motivated reinforcement-learning robot</article-title>, in <source>Proceedings of the 6th International Conference on Development and Learning</source>, eds <person-group person-group-type="editor"><name><surname>Demiris</surname> <given-names>Y.</given-names></name> <name><surname>Mareschal</surname> <given-names>D.</given-names></name> <name><surname>Scassellati</surname> <given-names>B.</given-names></name> <name><surname>Weng</surname> <given-names>J.</given-names></name></person-group> (<publisher-loc>New York,NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>E1</fpage>&#x02013;<lpage>E6</lpage>.</citation>
</ref>
<ref id="B50">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schlesinger</surname> <given-names>M.</given-names></name> <name><surname>Amso</surname> <given-names>D.</given-names></name></person-group> (<year>2013</year>). <article-title>Image free-viewing as intrinsically-motivated exploration: estimating the learnability of center-of-gaze image samples in infants and adults</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>802</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00802</pub-id><pub-id pub-id-type="pmid">24198801</pub-id></citation>
</ref>
<ref id="B51">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Schmidhuber</surname> <given-names>J.</given-names></name></person-group> (<year>1991</year>). <article-title>A possibility for implementing curiosity and boredom in model-building neural controllers</article-title>, in <source>Proceedings of the International Conference on Simulation of Adaptive Behavior: From Animals to Animats</source>, eds <person-group person-group-type="editor"><name><surname>Meyer</surname> <given-names>J. A.</given-names></name> <name><surname>Wilson</surname> <given-names>S. W.</given-names></name></person-group> (<publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT Press/Bradford Books</publisher-name>), <fpage>222</fpage>&#x02013;<lpage>227</lpage>.</citation>
</ref>
<ref id="B52">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schmidhuber</surname> <given-names>J.</given-names></name></person-group> (<year>2010</year>). <article-title>Formal theory of creativity, fun, and intrinsic motivation (1990&#x02013;2010)</article-title>. <source>IEEE Trans. Auton. Mental Dev</source>. <volume>2</volume>, <fpage>230</fpage>&#x02013;<lpage>247</lpage>. <pub-id pub-id-type="doi">10.1109/TAMD.2010.2056368</pub-id></citation>
</ref>
<ref id="B53">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schmidhuber</surname> <given-names>J.</given-names></name></person-group> (<year>2013</year>). <article-title>Powerplay: training an increasingly general problem solver by continually searching for the simplest still unsolvable problem</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>313</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00313</pub-id><pub-id pub-id-type="pmid">23761771</pub-id></citation>
</ref>
<ref id="B54">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Settles</surname> <given-names>B.</given-names></name></person-group> (<year>2010</year>). <source>Active Learning Literature Survey</source>. Computer Sciences Technical Report 1648, <publisher-name>University of WisconsinMadison</publisher-name>.</citation>
</ref>
<ref id="B55">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shah</surname> <given-names>A.</given-names></name> <name><surname>Gurney</surname> <given-names>K. N.</given-names></name></person-group> (<year>2014</year>). <article-title>Emergent structured transition from variation to repetition in a biologically-plausible model of learning in basal ganglia</article-title>. <source>Front. Psychol</source>. <volume>5</volume>:<issue>91</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2014.00091</pub-id><pub-id pub-id-type="pmid">24575067</pub-id></citation>
</ref>
<ref id="B56">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Singh</surname> <given-names>S.</given-names></name> <name><surname>Barto</surname> <given-names>A.</given-names></name> <name><surname>Chentanez</surname> <given-names>N.</given-names></name></person-group> (<year>2005</year>). <article-title>Intrinsically motivated reinforcement learning</article-title>, in <source>Advances in Neural Information Processing Systems 17: Proceedings of the 2004 Conference</source>, eds <person-group person-group-type="editor"><name><surname>Saul</surname> <given-names>L. K.</given-names></name> <name><surname>Weiss</surname> <given-names>Y.</given-names></name> <name><surname>Bottou</surname> <given-names>L.</given-names></name></person-group> (<publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>The MIT Press</publisher-name>).</citation>
</ref>
<ref id="B57">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singh</surname> <given-names>S.</given-names></name> <name><surname>Lewis</surname> <given-names>R.</given-names></name> <name><surname>Barto</surname> <given-names>A.</given-names></name> <name><surname>Sorg</surname> <given-names>J.</given-names></name></person-group> (<year>2010</year>). <article-title>Intrinsically motivated reinforcement learning: An evolutionary perspective</article-title>. <source>IEEE Trans. Auton. Mental Dev</source>. <volume>2</volume>, <fpage>70</fpage>&#x02013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1109/TAMD.2010.2051031</pub-id></citation>
</ref>
<ref id="B58">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thirkettle</surname> <given-names>M.</given-names></name> <name><surname>Walton</surname> <given-names>T.</given-names></name> <name><surname>Redgrave</surname> <given-names>P.</given-names></name> <name><surname>Gurney</surname> <given-names>K.</given-names></name> <name><surname>Stafford</surname> <given-names>T.</given-names></name></person-group> (<year>2013</year>). <article-title>No learning where to go without first knowing where you&#x00027;re coming from: action discovery is trajectory, not endpoint based</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>638</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00638</pub-id><pub-id pub-id-type="pmid">24065941</pub-id></citation>
</ref>
<ref id="B59">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Triesch</surname> <given-names>J.</given-names></name></person-group> (<year>2013</year>). <article-title>Imitation learning based on an intrinsic motivation mechanism for efficient coding</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>800</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00800</pub-id><pub-id pub-id-type="pmid">24204350</pub-id></citation>
</ref>
<ref id="B60">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>White</surname> <given-names>R. W.</given-names></name></person-group> (<year>1959</year>). <article-title>Motivation reconsidered: The concept of competence</article-title>. <source>Psychol. Rev</source>. <volume>66</volume>, <fpage>297</fpage>&#x02013;<lpage>333</lpage>. <pub-id pub-id-type="doi">10.1037/h0040934</pub-id><pub-id pub-id-type="pmid">13844397</pub-id></citation>
</ref>
<ref id="B61">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zahedi</surname> <given-names>K.</given-names></name> <name><surname>Martius</surname> <given-names>G.</given-names></name> <name><surname>Ay</surname> <given-names>N.</given-names></name></person-group> (<year>2013</year>). <article-title>Linear combination of one-step predictive information with an external reward in an episodic policy gradient setting: a critical analysis</article-title>. <source>Front. Psychol</source>. <volume>4</volume>:<issue>801</issue>. <pub-id pub-id-type="doi">10.3389/fpsyg.2013.00801</pub-id><pub-id pub-id-type="pmid">24204351</pub-id></citation>
</ref>
</ref-list>
</back>
</article>