<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="methods-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Behav. Neurosci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Behavioral Neuroscience</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Behav. Neurosci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1662-5153</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fnbeh.2026.1751553</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Methods</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Goal-directed actions and habits in head-fixed mice</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Manusky</surname>
<given-names>Logan M.</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3336953"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Green</surname>
<given-names>Lisa M.</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1441916"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Boquiren</surname>
<given-names>Joshua A.</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3389424"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Baek</surname>
<given-names>Jade</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3388791"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bell</surname>
<given-names>Marcus S.</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2336507"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wassum</surname>
<given-names>Kate M.</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/74991"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Otis</surname>
<given-names>James M.</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/537562"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Department of Neuroscience, Medical University of South Carolina</institution>, <city>Charleston</city>, <state>SC</state>, <country country="us">United States</country></aff>
<aff id="aff2"><label>2</label><institution>Department of Psychology and Brain Research Institute, UCLA</institution>, <city>Los Angeles</city>, <state>CA</state>, <country country="us">United States</country></aff>
<aff id="aff3"><label>3</label><institution>Ralph H. Johnson VA Medical Center</institution>, <city>Charleston</city>, <state>SC</state>, <country country="us">United States</country></aff>
<aff id="aff4"><label>4</label><institution>Hollings Cancer Center, Medical University of South Carolina</institution>, <city>Charleston</city>, <state>SC</state>, <country country="us">United States</country></aff>
<author-notes>
<corresp id="c001"><label>&#x002A;</label>Correspondence: James M. Otis, <email xlink:href="mailto:otis@musc.edu">otis@musc.edu</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-25">
<day>25</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>20</volume>
<elocation-id>1751553</elocation-id>
<history>
<date date-type="received">
<day>21</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>02</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Manusky, Green, Boquiren, Baek, Bell, Wassum and Otis.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Manusky, Green, Boquiren, Baek, Bell, Wassum and Otis</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-25">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Behavioral control is fundamentally governed by a dynamic balance between flexible, goal-directed actions and efficient but highly automated habits. While the transition to habitual control can be adaptive, an imbalance favoring rigid habits over flexible control is thought to contribute significantly to the core pathology of many neuropsychiatric disorders. Despite their pervasiveness, the precise neural circuits that govern this critical balance remain poorly characterized. A major barrier to progress lies in the technical challenge of tracking single neurons in relevant circuits as goal-directed behavior becomes habitual.</p>
</sec>
<sec>
<title>Methods</title>
<p>Here, we introduce and validate a novel head-fixed instrumental learning paradigm in mice that enables the differentiation of goal-directed and habitual behavioral control. This model provides an unprecedented platform for high-resolution, longitudinal <italic>in vivo</italic> neural interrogation. To functionally validate the behavioral paradigm, we employed chemogenetic inhibition of the dorsolateral striatum (DLS) in limited-trained and overtrained mice.</p>
</sec>
<sec>
<title>Results</title>
<p>Our findings demonstrate that mice rapidly acquire lever pressing, exhibiting robust active/inactive lever discrimination, and comparable initial learning between limited and overtrained cohorts. Crucially, while mice with limited training readily reduced their lever-press behavior when the resulting outcome was devalued or omitted, overtrained mice displayed characteristic insensitivity to outcome devaluation and omission. Furthermore, chemogenetic inhibition of the DLS in overtrained mice restored sensitivity to both devaluation and contingency reversal, blocking habit expression and preserving goal-directed control.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>These results establish a paradigm for studying both goal-directed actions and habits in head-fixed mice and validate the DLS as a key neuronal substrate as previously demonstrated in freely moving models. This paradigm represents a vital methodological advancement that overcomes the technical barriers to longitudinal, cellular-level interrogation. By providing the optical stability necessary to track the same neuronal ensembles across acquisition and expression of habits, this platform enables investigations into the computational neural dynamics underlying goal-directed and habitual behaviors.</p>
</sec>
</abstract>
<kwd-group>
<kwd>behavioral neuroscience</kwd>
<kwd>calcium imaging</kwd>
<kwd>chemogenetics</kwd>
<kwd>dorsolateral striatum</kwd>
<kwd>goal-directed behavior</kwd>
<kwd>habitual behavior</kwd>
<kwd>striatum</kwd>
<kwd>two-photon</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. Funding was provided by NIH NIDA grants to JO and LM (R01-DA051650, R01-DA054271, R01-DA062041, T32-DA007288) and a VA Merit award (I01-BX006179) to JO.</funding-statement>
</funding-group>
<counts>
<fig-count count="3"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="52"/>
<page-count count="12"/>
<word-count count="9778"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Motivation and Reward</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<title>Introduction</title>
<p>Behavior is fundamentally governed by a dynamic interplay between two distinct modes of control: goal-directed actions and habits. Goal-directed actions are initially guided by action-outcome (A-O) associations, in which the value of an expected outcome drives behavior (<xref ref-type="bibr" rid="ref2">Adams and Dickinson, 1981</xref>; <xref ref-type="bibr" rid="ref5">Balleine and Dickinson, 1998</xref>; <xref ref-type="bibr" rid="ref11">Dickinson and Balleine, 1999</xref>; <xref ref-type="bibr" rid="ref37">Peak et al., 2019</xref>; <xref ref-type="bibr" rid="ref42">Vandaele et al., 2019</xref>; <xref ref-type="bibr" rid="ref49">Yin and Knowlton, 2006</xref>; <xref ref-type="bibr" rid="ref51">Yin et al., 2005a</xref>; <xref ref-type="bibr" rid="ref53">Yin et al., 2005b</xref>). This system allows for flexible behavior that can be readily adapted when circumstances change. With repeated training and reinforcement, however, this cognitively taxing approach shifts to less demanding, more automatic habitual behaviors. Here, behavior is automatically triggered by environmental cues, regardless of the outcome&#x2019;s current value (<xref ref-type="bibr" rid="ref5">Balleine and Dickinson, 1998</xref>; <xref ref-type="bibr" rid="ref49">Yin and Knowlton, 2006</xref>; <xref ref-type="bibr" rid="ref51">Yin et al., 2005a</xref>; <xref ref-type="bibr" rid="ref1">Adams, 1982</xref>; <xref ref-type="bibr" rid="ref7">Belin et al., 2009</xref>; <xref ref-type="bibr" rid="ref17">Graybiel, 2008</xref>; <xref ref-type="bibr" rid="ref40">Tricomi et al., 2009</xref>; <xref ref-type="bibr" rid="ref50">Yin et al., 2004</xref>). The transition between these behavioral states is essential for efficient and adaptive behavior; however, when this balance is disrupted, and the automatic habit system becomes dominant over the flexible goal system, it can lead to maladaptive behaviors (<xref ref-type="bibr" rid="ref6">Belin et al., 2013</xref>; <xref ref-type="bibr" rid="ref12">Everitt and Robbins, 2016</xref>; <xref ref-type="bibr" rid="ref13">Gillan et al., 2016</xref>; <xref ref-type="bibr" rid="ref21">Hogarth et al., 2013</xref>; <xref ref-type="bibr" rid="ref23">Jonkman et al., 2012</xref>; <xref ref-type="bibr" rid="ref31">Murray et al., 2014</xref>; <xref ref-type="bibr" rid="ref41">Vandaele and Janak, 2018</xref>; <xref ref-type="bibr" rid="ref43">Vanderschuren et al., 2005</xref>). Understanding the neural mechanisms that govern this transition is crucial, as an imbalance favoring habitual responses is a core pathological feature across many neuropsychiatric disorders, including substance use disorder (SUD). A major challenge in this field lies in elucidating how the brain transitions from flexible, goal-directed actions to rigid habits. This lack of clarity is a major obstacle to developing effective treatments for conditions characterized by persistent, compulsive actions.</p>
<p>Historically, freely moving operant conditioning models have been instrumental in studying habitual behaviors (<xref ref-type="bibr" rid="ref51">Yin et al., 2005a</xref>; <xref ref-type="bibr" rid="ref50">Yin et al., 2004</xref>; <xref ref-type="bibr" rid="ref27">Malvaez et al., 2018</xref>; <xref ref-type="bibr" rid="ref30">Martiros et al., 2018</xref>; <xref ref-type="bibr" rid="ref33">O&#x2019;Hare et al., 2017</xref>; <xref ref-type="bibr" rid="ref39">Thorn et al., 2010</xref>; <xref ref-type="bibr" rid="ref48">Yin and Knowlton, 2004</xref>; <xref ref-type="bibr" rid="ref52">Yin et al., 2006</xref>). However, these paradigms have limitations for the kind of longitudinal, high-resolution spatiotemporal investigation of neural circuits needed to fully capture the behavioral transition over time. To overcome this issue, researchers are increasingly combining operant conditioning paradigms with head-fixed setups and advanced neural recording technologies, such as two-photon (2P) microscopy (<xref ref-type="bibr" rid="ref8">Clarke et al., 2024</xref>; <xref ref-type="bibr" rid="ref36">Paniccia et al., 2024</xref>; <xref ref-type="bibr" rid="ref44">Vollmer et al., 2021</xref>; <xref ref-type="bibr" rid="ref45">Vollmer et al., 2022</xref>; <xref ref-type="bibr" rid="ref47">Ward et al., 2025</xref>). While head-fixed models provide advantages for detailed, long-term neural monitoring, an experimentally validated head-fixed paradigm for operant habitual reward-seeking has yet to be developed. Establishing such a model would significantly advance our ability to observe the neural dynamics underlying goal-directed actions, habits, and the transition between the two across time.</p>
<p>Here, we present a novel head-fixed operant paradigm in mice that reliably produces goal-directed behavioral control with limited training and habits with overtraining. In this context, we specifically operationalize habitual control as outcome-insensitive instrumental responding, defined by the persistence of behavior despite changes in the value or the contingency of the reinforcer. By adapting well-validated tasks from freely moving models of goal-directed and habitual behavioral control (<xref ref-type="bibr" rid="ref27">Malvaez et al., 2018</xref>), we demonstrate that mice exhibit either goal-directed or habitual responding, depending on their training duration [limited vs. extended variable-interval 30-s (VI30s) schedules]. To assess the behavioral strategy, mice were tested using the two gold-standard tests for goal-directed behavioral control, outcome devaluation and omission tasks (<xref ref-type="bibr" rid="ref4">Balleine, 2019</xref>; <xref ref-type="bibr" rid="ref10">Dickinson and Balleine, 1993</xref>; <xref ref-type="bibr" rid="ref29">Malvaez and Wassum, 2018</xref>). To validate that our head-fixed paradigm engages the canonical neural substrates of habit as found in freely moving mice, we chemogenetically inhibited the dorsolateral striatum (DLS)&#x2014;a region well-established as critical for habitual behavior in both rodent and human studies (<xref ref-type="bibr" rid="ref49">Yin and Knowlton, 2006</xref>; <xref ref-type="bibr" rid="ref40">Tricomi et al., 2009</xref>; <xref ref-type="bibr" rid="ref50">Yin et al., 2004</xref>; <xref ref-type="bibr" rid="ref39">Thorn et al., 2010</xref>; <xref ref-type="bibr" rid="ref52">Yin et al., 2006</xref>; <xref ref-type="bibr" rid="ref29">Malvaez and Wassum, 2018</xref>; <xref ref-type="bibr" rid="ref3">Alloway et al., 2017</xref>; <xref ref-type="bibr" rid="ref18">Graybiel and Grafton, 2015</xref>; <xref ref-type="bibr" rid="ref24">Lipton et al., 2019</xref>; <xref ref-type="bibr" rid="ref26">Malvaez, 2020</xref>; <xref ref-type="bibr" rid="ref32">O&#x2019;Hare et al., 2016</xref>). Together, these findings establish our head-fixed operant model as a robust and translationally relevant platform for studying goal-directed actions and habits. This model can be easily coupled with high-resolution <italic>in vivo</italic> imaging strategies and will provide unprecedented access to the spatiotemporal dynamics underlying the transition to, and persistence of, habitual behaviors.</p>
</sec>
<sec sec-type="materials|methods" id="sec2">
<title>Materials and methods</title>
<sec id="sec3">
<title>Animals</title>
<p>All experiments were approved by the Institutional Animal Care and Use Committee (IACUC) at the Medical University of South Carolina in accordance with the NIH-adopted Guide for the Care and Use of Laboratory Animals (Protocol 2021-01325-1). Adult (8&#x2013;24&#x202F;weeks) male and female C57BL/6J wild-type (WT) background mice (8&#x202F;weeks old/20&#x202F;g minimum at study onset; Jackson Labs or MUSC DLAR Breeding Colony) were group-housed pre-operatively and single-housed post-operatively under a reversed 12:12-h light cycle (lights off at 8:00&#x202F;a.m.; all experiments were performed during the dark phase) with access to standard rodent chow and water <italic>ad libitum</italic>. To facilitate instrumental learning and maintain robust responding for a caloric reward (10% Ensure), mice were placed on a regulated water restriction schedule 3&#x202F;days prior to the start of acquisition. This is a standard requirement for operant paradigms using liquid reinforcers to ensure that reward-seeking behavior is not prematurely extinguished by satiation (<xref ref-type="bibr" rid="ref15">Goltstein et al., 2018</xref>; <xref ref-type="bibr" rid="ref16">Grant et al., 2021</xref>; <xref ref-type="bibr" rid="ref20">Guo et al., 2014</xref>; <xref ref-type="bibr" rid="ref34">Otis et al., 2017</xref>; <xref ref-type="bibr" rid="ref35">Otis et al., 2019</xref>). We employed a tiered supplemental water system to maintain each animal between 85 and 90% of its initial free-feeding body weight. Unlike fixed-volume restriction paradigms, our approach adjusted daily water access based on a combination of the animal&#x2019;s current weight and its instrumental performance (lever presses) during the session. This method provides a more refined balance between behavioral motivation and animal welfare compared to traditional 24-h restriction protocols. To maintain mice at 85%&#x2013;90% of their free-feeding body weight, we regulated their daily water intake based on their behavioral performance: 50&#x2013;100 active presses: 0&#x202F;mL water, 30&#x2013;50 active presses: 0.25&#x202F;mL water, 20&#x2013;30 active presses: 0.5&#x202F;mL water, 0&#x2013;20 active presses: 1.0&#x202F;mL water. Water was provided at least 2.5&#x202F;h after the final behavioral session of the day. Mice were weighed daily before each session. If a mouse&#x2019;s weight exceeded the target, its water allowance was reduced by one category to encourage weight loss. Conversely, if a mouse&#x2019;s weight fell below the target, a separate set of criteria was applied to ensure adequate hydration: 50&#x2013;100 active presses: 0.5&#x202F;mL water, 30&#x2013;50 active presses: 1.0&#x202F;mL water, 20&#x2013;30 active presses: 1.5&#x202F;mL water, 0&#x2013;20 active presses: 2.0&#x202F;mL water. Mice were transitioned to a Teklad Diet (2,918, Inotiv) 1&#x202F;week prior to training. This fixed-formula diet was maintained throughout the study to minimize batch-to-batch nutrient fluctuations and metabolic variability. This ensured that fluctuations in body weight were a result of the water restriction protocol rather than dietary inconsistency, providing a reliable metric for adjusting water intake.</p>
</sec>
<sec id="sec4">
<title>Surgeries</title>
<p>For intracranial surgeries, all mice were anesthetized with isoflurane (0.8%&#x2013;1.5% in oxygen; 1&#x202F;L/min) and placed within a stereotaxic frame (Kopf Instruments). Ophthalmic ointment (Akron), topical anesthetic (2% Lidocaine; Akron), analgesic (Carprofen &#x0026; Ketorolac, 2&#x202F;mg/kg, i.p.), and subcutaneous sterile saline (0.9% NaCl in water) were given pre- and intra-operatively for health and pain management. An antibiotic (Cefazolin, 200&#x202F;mg/kg, s.c.) was given post-operatively to reduce the possibility of infection, and mice were allowed to recover for at least 2&#x2013;3&#x202F;weeks prior to behavioral training. All mice received head-ring implantation. A custom-made head-ring (stainless steel; 5&#x202F;mm ID, 11&#x202F;mm OD) was implanted onto the animal skull, along with 2&#x2013;3 screws and dental cement to allow for head fixation.</p>
<sec id="sec5">
<title>Behavioral chemogenetics surgeries</title>
<p>Chemogenetic manipulations were conducted to selectively inhibit DLS neurons. During surgery, bilateral injections of a virus encoding an inhibitory DREADD (AAV2-hSyn-hM4Di-mCherry) or control (AAV2-hSyn-mCherry) were administered into the DLS (AP: +1.20, ML: +/&#x2212; 1.95, DV: &#x2212;3.65; 500&#x202F;nL). A stainless-steel head-ring was cemented onto the skull using dental cement and skull screws. Viral placements were confirmed post-mortem via histology.</p>
</sec>
</sec>
<sec id="sec6">
<title>Head-fixed operant conditioning</title>
<sec id="sec7">
<title>Apparatus</title>
<p>Training took place in a set of 6 operant chambers that were custom-made (<xref ref-type="fig" rid="fig1">Figure 1D</xref>), as previously described (<xref ref-type="bibr" rid="ref44">Vollmer et al., 2021</xref>). Behavioral systems interfaced with an Arduino and custom Python-based software (<xref ref-type="bibr" rid="ref3">Alloway et al., 2017</xref>; <xref ref-type="bibr" rid="ref8">Clarke et al., 2024</xref>; <xref ref-type="bibr" rid="ref36">Paniccia et al., 2024</xref>; <xref ref-type="bibr" rid="ref44">Vollmer et al., 2021</xref>; <xref ref-type="bibr" rid="ref45">Vollmer et al., 2022</xref>; <xref ref-type="bibr" rid="ref47">Ward et al., 2025</xref>) to deliver liquid reinforcers (2&#x202F;s), play a tone cue (8&#x202F;kHz, 1&#x202F;s), record lever presses (active/inactive), and collect lick contacts. During behavioral acquisition, levers were placed in front of the mice. Pressing the active lever resulted in immediate cue presentation, followed by reward delivery (12.5&#x202F;&#x03BC;L; 10% Ensure mixed in tap water) delivered at the spout. Pressing the inactive lever produced no cue or reward. Each instrumental training session lasted 60&#x202F;min, during which mice were allowed to freely acquire Ensure for the entirety of the session.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Timeline and head-fixed setup for goal-directed and habitual behavior paradigm. <bold>(A)</bold> Experimental timeline of head-fixed operant behavior paradigm for habitual and goal-directed behaviors. After habituation and preexposure, mice were assigned to either the overtrained or limited-trained group. Both groups received FR1, VI15s, and VI30s training; however, the overtrained group had an extended 7-day VI30s paradigm, while the limited-trained group had a short 2-day VI30s paradigm. After training, mice were tested under devaluation and omission procedures; all mice received 1&#x202F;day off and VI30s retraining in between tests. <bold>(B)</bold> Devaluation procedure involved two test days (devalued and valued) where mice were pre-fed one flavor for 45&#x202F;min in their home cage before going into the behavioral box and being tested with a 10-min probe session (no cues, no rewards). <bold>(C)</bold> Omission procedure consisted of two separate days. The first test day was a 60-min session where the reward was automatically delivered every 20&#x202F;s. A lever press resulted in a reset of the 20-s counter. Twenty-four hours after this test, mice were tested on a 10-min probe test (no cues, no rewards) to investigate memory consolidation from the day prior. <bold>(D)</bold> Diagram of operant chamber and head-fixation station. Mice were fixed into the head station and placed in a restraint tube. They had access to both an active and inactive lever as well as a lick spout. Created in part with <ext-link xlink:href="https://www.biorender.com/" ext-link-type="uri">BioRender.com</ext-link>. Manusky, L. (2026) <ext-link xlink:href="https://BioRender.com/4zmyix7" ext-link-type="uri">https://BioRender.com/4zmyix7</ext-link>, <ext-link xlink:href="https://BioRender.com/wdokkzd" ext-link-type="uri">https://BioRender.com/wdokkzd</ext-link>.</p>
</caption>
<graphic xlink:href="fnbeh-20-1751553-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel A shows a timeline and group assignment for a rodent behavioral experiment involving surgeries, habituation, reward training with either chocolate or vanilla, devaluation, omission, and probe tests, distinguishing overtrained and limited-trained groups. Panel B details the devaluation procedure, including prefeeding and probe testing with valued or devalued rewards, illustrated with images of rodents given chocolate or vanilla. Panel C summarizes the omission test and probe, explaining reversed reward contingencies and test durations. Panel D presents a labeled illustration of the head-fixed, self-administration apparatus, showing a rodent with a head ring in a chamber with levers and tubing.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec8">
<title>Natural reward</title>
<p>All operant conditioning experiments involved reward delivery of 10% Chocolate or Vanilla Ensure Original (Abbott Nutrition, Columbus, OH). Mice were randomly assigned and equally counterbalanced to earn one of the Ensure flavors throughout training (i.e., training flavor). At least 1&#x202F;day prior to the start of instrumental studies, mice received Ensure preexposure (60-min home-cage <italic>ad libitum</italic> access of chocolate and vanilla Ensure). By offering mice unrestricted access to both flavors of Ensure in their home cages for at least 1&#x202F;day before instrumental studies, we aimed to diminish any behavioral responses driven by novelty, ensuring subsequent observations more accurately reflected the behavioral preferences. In addition, all mice were given equated exposure (i.e., non-contingent access to the alternative Ensure flavor) in a different room for a week prior to the start of training to diminish novelty of the alternative Ensure flavor.</p>
<p>A separate cohort of mice (<italic>n</italic>&#x202F;=&#x202F;8) was tested to confirm discriminability between 10% chocolate and vanilla Ensure and to rule out baseline flavor preference. Mice were given 2&#x202F;h of <italic>ad libitum</italic> access to both flavors in the home cage, and consumption did not differ (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figures S1A,B</xref>). To assess discrimination, mice underwent two sensory-specific devaluation tests. Following a 90-min pre-feeding session with one flavor (devalued) (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S1C</xref>), they received 10&#x202F;min of <italic>ad libitum</italic> access to both flavors. Mice consumed significantly more of the valued flavor, confirming the ability to discriminate between flavors (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figures S1D,E</xref>).</p>
</sec>
<sec id="sec9">
<title>Acquisition</title>
<p>To reduce possible stress induced by head-fixation, mice underwent 3&#x202F;days of habituation during which they were head-restrained in custom-built operant chambers (<xref ref-type="bibr" rid="ref44">Vollmer et al., 2021</xref>) for 30&#x202F;min with no access to the levers, tone cue, or reward. Following habituation, mice were separated into the (1) limited-trained group or the (2) overtrained group and trained on a fixed-ratio 1 (FR1) schedule of reinforcement until they pressed a total of 50 times on the active lever, 2&#x202F;days in a row (60-min sessions) for delivery of their training flavor (chocolate or vanilla). Each session began with guiding the mouse into the head-fixation station and placing their body into a restraint tube, to decrease bodily movement. Both the active and inactive levers, along with a lick spout, were then positioned in front of the mouse, requiring the mouse to extend their forelimbs in order to press either lever (<xref ref-type="bibr" rid="ref44">Vollmer et al., 2021</xref>). Mice received one training session per day, with sessions conducted on consecutive days, including weekends, to ensure continuous training without rest periods. Mice required an average of 5.2&#x202F;&#x00B1;&#x202F;0.4&#x202F;days (mean &#x00B1; SEM) to meet the FR1 acquisition criteria (range: 3&#x2013;12&#x202F;days). After mice achieved performance criteria (50 presses/60&#x202F;min, 2&#x202F;days in a row), they progressed to the next stage of the paradigm.</p>
</sec>
<sec id="sec10">
<title>Variable-interval training</title>
<p>After completing FR1 training, all mice were shifted to a variable-interval 15-s (VI15s) reinforcement schedule for 1&#x202F;day. Mice designated for limited training were then trained on a VI30s schedule for 2&#x202F;days, while mice designated for overtraining remained on VI30s for 7&#x202F;days (<xref ref-type="fig" rid="fig1">Figure 1A</xref>). Although some paradigms use longer durations, this 7-day &#x201C;overtraining&#x201D; protocol aligns with established mouse models (<xref ref-type="bibr" rid="ref29">Malvaez and Wassum, 2018</xref>; <xref ref-type="bibr" rid="ref14">Giovanniello et al., 2025</xref>; <xref ref-type="bibr" rid="ref28">Malvaez et al., 2025</xref>) and contemporary studies demonstrating that extended interval-based reinforcement schedules are sufficient to induce outcome-insensitivity (<xref ref-type="bibr" rid="ref19">Gremel and Costa, 2013</xref>; <xref ref-type="bibr" rid="ref38">Rossi and Yin, 2012</xref>). We utilized a consistent VI30s schedule for both groups to isolate training duration as the primary variable, establishing a standardized platform for future longitudinal imaging without the confounding rule shifts associated with RR-to-VI transitions. All sessions lasted 60&#x202F;min. Following training, mice were tested for goal-directed or habitual behavioral strategies via devaluation and omission tests.</p>
</sec>
<sec id="sec11">
<title>Devaluation test</title>
<p>To assess sensory-specific satiety using the devaluation test, mice received two test days (devalued and valued), with the order counterbalanced across groups. On each test day, mice were first given a 45-min prefeed period of unlimited access to either the flavor earned during training (devalued) or the alternative, pre-exposed flavor (valued), with the latter controlling for general satiety. Consumption during this prefeed period did not differ between control and experimental groups (<xref ref-type="supplementary-material" rid="SM2">Supplementary Figure S2B</xref>). Immediately following this prefeed, lever pressing was measured during a 10-min, non-reinforced probe test (<xref ref-type="fig" rid="fig1">Figure 1B</xref>). Between test days, mice received an off day followed by retraining on VI30s, until mice reached at least 80% of their baseline lever press rate before proceeding to the subsequent test. Baseline was determined from the last day or the average of the last two VI30s training sessions. If one of the last 2&#x202F;days exceeded two standard deviations from the overall mean, baseline was instead calculated using the last 3&#x202F;days. The order of test days was counterbalanced across mice. In addition to raw press rates, a devaluation index was calculated for each subject: <inline-formula>
<mml:math id="M1">
<mml:mtext mathvariant="italic">Devaluation Index</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:mo>#</mml:mo>
<mml:mtext mathvariant="italic">of devalued lever presses</mml:mtext>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:mo>#</mml:mo>
<mml:mtext mathvariant="italic">of devalued</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext mathvariant="italic">valued lever presses</mml:mtext>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:math>
</inline-formula>. This index was used to account for variability in press rates between subjects.</p>
</sec>
<sec id="sec12">
<title>Omission test</title>
<p>After devaluation testing, mice were given a day off and retrained as described above. Once retraining criteria were met, mice underwent an omission test and a subsequent omission probe test (<xref ref-type="fig" rid="fig1">Figure 1C</xref>). The omission test was a 60-min session in which the lever-outcome contingency was reversed: Ensure was delivered non-contingently every 20&#x202F;s, and any active lever press reset the timer, delaying reward delivery (<xref ref-type="bibr" rid="ref38">Rossi and Yin, 2012</xref>). Twenty-four hours later, lever pressing was measured during a 10-min, non-reinforced omission probe test to assess the persistence of the learned behavioral change.</p>
</sec>
</sec>
<sec id="sec13">
<title>Data collection and statistical analyses</title>
<p>Lever press and lick data during acquisition and test sessions were collected using a custom Python interface, REACHER, connected to Arduino (<xref ref-type="bibr" rid="ref44">Vollmer et al., 2021</xref>). Statistical analyses were performed using GraphPad PRISM (Dotmatics, version 10). Behavioral data were analyzed using either analysis of variance (ANOVA; two-way or three-way) or t-tests (paired or unpaired), as appropriate. The independent variables analyzed included: lever type (active or inactive), sex (male or female), virus (mCherry vs. DREADD), training duration (limited vs. overtrained), and day (acquisition, devaluation test, omission test). Sidak&#x2019;s and Tukey <italic>post hoc</italic> tests were used following significant main effects and interactions with the ANOVA analyses. The two-stage linear step-up procedure of Benjamini, Krieger, and Yekutieli (BKY) was also used, as appropriate, for controlling the False Discovery Rate in multiple comparisons. Prior to analysis, all datasets were checked for normality and homogeneity of variance.</p>
<p>To ensure findings were robust against between-subject variability and missing values, key longitudinal datasets (e.g., acquisition) were cross-validated using linear mixed-effects models (REML), which yielded results consistent with our reported ANOVA findings. For analyses in <xref ref-type="fig" rid="fig2">Figure 2</xref>, mCherry control mice from chemogenetic cohorts were pooled with the original acquisition cohorts, as behavioral protocols were identical. Sample sizes were determined based on established standards in the field for chemogenetic behavioral studies. The adequacy of these sample sizes is supported by the robust effect sizes (partial eta squared) observed across all primary behavioral interactions. Mouse exclusion criteria were defined <italic>a priori</italic>. Specifically, (1) failing FR1 acquisition within 14&#x202F;days; (2) loss of head-cap stability (3); retraining exceeding 7&#x202F;days; or (4) viral expression outside the DLS. Altogether, one mouse was excluded during FR1 training, and another was excluded from omission testing, both due to head-cap instability.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Head-fixed mice reliably acquire instrumental lever pressing and display both goal-directed and habitual behaviors. <bold>(A)</bold> Zoomed in schematic of head-fixed operant behavior setup. <bold>(B)</bold> Behavioral design, where an active lever press triggers a 1&#x202F;s tone cue followed by a 2&#x202F;s delivery of 10% Ensure and an inactive lever press results in no cue/Ensure. <bold>(C)</bold> Grouped data of active (filled circles) and inactive (open circles) lever presses across acquisition days. The FR1 data point represents the last FR1 training session for each mouse. Mice reliably discriminate between levers, pressing significantly more on the active lever (<italic>n</italic>&#x202F;=&#x202F;27: 14M, 13F; 3-way ANOVA, lever effect: F<sub>1,25</sub>&#x202F;=&#x202F;58.25, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, day x lever interaction: F<sub>1.81,45.16</sub>&#x202F;=&#x202F;3.723, <italic>p</italic>&#x202F;=&#x202F;0.0359; OT&#x202F;=&#x202F;overtrained, LT&#x202F;=&#x202F;limited-trained). <bold>(D)</bold> Devaluation tests showed LT mice pressed significantly more on the valued day than the devalued day, whereas OT mice showed no difference between days (<italic>n</italic>&#x202F;=&#x202F;27: 14M&#x202F;=&#x202F;filled dots, 13F&#x202F;=&#x202F;unfilled dots; two-way ANOVA, training x test day interaction: F<sub>1,25</sub>&#x202F;=&#x202F;29.57, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, Sidak&#x2019;s <italic>post hoc</italic> test, LT: <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, OT: <italic>p</italic>&#x202F;=&#x202F;0.6323). <bold>(E)</bold> Devaluation index significantly differed between groups; scores closer to 0.5 (red dashed line) indicate insensitivity to devaluation. LT mice were more sensitive to outcome devaluation than OT mice (<italic>n</italic>&#x202F;=&#x202F;27: 14M, 13F; t(25)&#x202F;=&#x202F;4.98, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001). <bold>(F,G)</bold> Omission test wherein <bold>(F)</bold> active lever pressing was increased (<italic>n</italic>&#x202F;=&#x202F;26; 13M, 13F; t(24)&#x202F;=&#x202F;3.48, <italic>p</italic>&#x202F;=&#x202F;0.0019) and <bold>(G)</bold> reward deliveries were reduced in the OT group (t(24)&#x202F;=&#x202F;4.40, <italic>p</italic>&#x202F;=&#x202F;0.0002). <bold>(H)</bold> Omission probe test showed a significant increase in lever pressing in the OT group (<italic>n</italic>&#x202F;=&#x202F;26; 13M, 13F; t(24)&#x202F;=&#x202F;3.55, <italic>p</italic>&#x202F;=&#x202F;0.0016). See <xref ref-type="supplementary-material" rid="SM4">Supplementary Table S1</xref> for complete analyses. All data are presented as mean &#x00B1; SEM. &#x002A;&#x002A;<italic>p</italic> &#x003C; 0.01, &#x002A;&#x002A;&#x002A;p &#x003C; 0.001, &#x002A;&#x002A;&#x002A;&#x002A;p &#x003C; 0.0001. Created in BioRender. Manusky, L. (2026) <ext-link xlink:href="https://BioRender.com/3xqnb2m" ext-link-type="uri">https://BioRender.com/3xqnb2m</ext-link>.</p>
</caption>
<graphic xlink:href="fnbeh-20-1751553-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Scientific figure showing a head-fixed mouse behavioral experiment. Panel A depicts a mouse receiving a liquid reward through a spout with levers and tone cues. Panel B illustrates the experimental design with lever presses triggering cues and rewards. Panel C presents a line graph comparing lever press acquisition over days between LT and OT groups. Panels D&#x2013;H show bar graphs with individual data points comparing lever presses, devaluation indices, and reward deliveries between experimental groups under devaluation and omission tasks. Statistical significance is annotated on the graphs.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec14">
<title>Behavioral chemogenetics</title>
<p>To investigate the role of the DLS in regulating goal-directed and habitual reward-seeking behaviors, we used a site-specific chemogenetic approach. Mice were first trained on the limited 2-day or extended 7-day head-fixed instrumental paradigm, as described above. Upon successful completion of this training, mice received a systemic pretreatment of clozapine <italic>N</italic>-oxide [CNO, 10&#x202F;mg/kg; i.p.; (<xref ref-type="bibr" rid="ref25">Mahler et al., 2019</xref>)] 30&#x202F;min before each test session, which included devaluation, valuation, omission, and omission probe. During devaluation test days, CNO was administered 15&#x202F;min after the onset of the pre-feeding period. This timing was selected to ensure that peak DREADD-mediated inhibition coincided with the instrumental devaluation test. Importantly, DLS inhibition did not affect the pre-feeding process itself; no differences in the amount of Ensure consumed were observed between DREADD-expressing mice and controls [t(76)&#x202F;=&#x202F;1.579, <italic>p</italic>&#x202F;=&#x202F;0.1184], nor between the experimental groups and prior pilot cohorts [t(54)&#x202F;=&#x202F;0.006, <italic>p</italic>&#x202F;=&#x202F;0.9949].</p>
<p>After behavioral testing, mice were transcardially perfused, and brains were collected and post-fixed in 4% paraformaldehyde (PFA). For cryoprotection, brains were subsequently immersed in successive 15 and 30% sucrose solutions. Coronal sections (40&#x202F;&#x03BC;m) were cut using a cryostat, mounted on slides, and imaged on a Leica THUNDER Imager Tissue.</p>
</sec>
</sec>
<sec sec-type="results" id="sec15">
<title>Results</title>
<sec id="sec16">
<title>Acquisition of head-fixed goal-directed and habitual reward-seeking</title>
<p>Previous freely moving instrumental models have successfully produced both goal-directed and habitual behavioral control (<xref ref-type="bibr" rid="ref2">Adams and Dickinson, 1981</xref>; <xref ref-type="bibr" rid="ref52">Yin et al., 2006</xref>; <xref ref-type="bibr" rid="ref19">Gremel and Costa, 2013</xref>; <xref ref-type="bibr" rid="ref9">Corbit et al., 2012</xref>; <xref ref-type="bibr" rid="ref22">Jones et al., 2022</xref>). However, a head-fixed model capable of capturing each behavioral strategy in isolation has not yet been developed. To this end, here head-fixed mice were trained to press an active lever to receive a 1&#x202F;s tone cue paired with delivery of 10% (v/v) Ensure (<xref ref-type="fig" rid="fig2">Figures 2A</xref>,<xref ref-type="fig" rid="fig2">B</xref>). A second inactive lever was present but did not result in a cue or reward. To establish the desired goal-directed or habitual strategies using a paradigm adapted from well-validated models (<xref ref-type="bibr" rid="ref27">Malvaez et al., 2018</xref>), training progressed across three different schedules of reinforcement: FR1, VI15s, and VI30s. VI schedules were included to promote habitual control, as the unpredictability of reinforcement reduces reliance on immediate A-O associations and promotes the development of stable, outcome-insensitive behavior. To assess initial learning trajectory before the divergence in training protocols, we compared the performance of limited and overtrained groups across their shared acquisition phase. Mice in both groups pressed the active lever significantly more than the inactive, revealing comparable initial lever discrimination and overall lever press rates that reflected the progressive development of robust discrimination between the active and inactive levers (<xref ref-type="fig" rid="fig2">Figure 2C</xref>). This acquisition pattern was further validated by a linear mixed-effects model, which confirmed the primary effects of Lever (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001) and Day (<italic>p</italic>&#x202F;=&#x202F;0.028) while accounting for individual subject variability. Assessment of sex differences revealed no significant main effect of sex on active lever press rates (<xref ref-type="supplementary-material" rid="SM2">Supplementary Figure S2A</xref>). Overall, these data confirm successful and comparable initial acquisition of instrumental behavior across all animals prior to the manipulation of training duration.</p>
</sec>
<sec id="sec17">
<title>Devaluation tests differentiate goal-directed and habitual behavior</title>
<p>After completing acquisition on their respective schedules, mice received a set of devaluation tests to assess their underlying behavioral strategy. In these tests, non-reinforced lever pressing was measured after a 45-min prefeed period with the Ensure flavor earned during training (devalued condition) and compared to pressing after pre-feeding with the alternative Ensure flavor provided outside the training context (valued condition). The order of the devalued and valued conditions was counterbalanced across subjects and each mouse experienced both conditions, allowing direct within-subject comparison of responding during the valued versus devalued state. Goal-directed actions are based on knowledge of the A-O relationship and are therefore flexible, resulting in a reduction of responding when the outcome is devalued. In contrast, habits are marked by a lack of consideration of action consequences, leading to inflexibility, and persistent responding regardless of outcome&#x2019;s current value. To ensure devaluation wasn&#x2019;t simply due to varying Ensure intake during prefeed, we measured prefeed consumption and found no difference across conditions or groups (<xref ref-type="supplementary-material" rid="SM2">Supplementary Figure S2B</xref>).</p>
<p>During devaluation tests, limited-trained mice demonstrated sensitivity to the changing value of the outcome, exhibiting a significantly lower lever-press rate on the devalued test day compared to the valued test day. In contrast, overtrained mice showed no change in lever press rate across the valued and devalued test days, demonstrating insensitivity to outcome devaluation (<xref ref-type="fig" rid="fig2">Figure 2D</xref>). To further quantify this behavioral distinction, a devaluation index was calculated (# of devalued lever presses) / (# of devalued + valued lever presses). This index provides a normalized measure of goal-directed versus habitual control, where 0.5 indicates insensitivity to devaluation (habitual control) and 0.0 indicates sensitivity to devaluation (goal-directed control). Consistent with the overall press rates, the devaluation index in limited-trained mice was reduced as compared with overtrained mice, confirming that limited-trained mice were selectively sensitive to reward devaluation (<xref ref-type="fig" rid="fig2">Figure 2E</xref>). The number of licks for the valued and devalued test days did not differ (<xref ref-type="supplementary-material" rid="SM2">Supplementary Figure S2C</xref>), suggesting consumption did not change and that the observed differences were specific to the instrumental response.</p>
</sec>
<sec id="sec18">
<title>Omission tests reveal group differences in contingency sensitivity</title>
<p>Following devaluation testing and subsequent retraining, mice received an omission test designed to test their behavioral flexibility by changing the A-O relationship. In this procedure, rewards were delivered automatically every 20&#x202F;s, any lever press reset the timer, thereby delaying reward delivery. This test differentiates goal-directed actions from habits: limited-trained mice, relying on their knowledge of the A-O contingency, should rapidly reduce pressing to maximize the automatic rewards. In contrast, overtrained mice&#x2014;whose actions are independent of the A-O contingency&#x2014;are expected to maintain high press rates, demonstrating inflexibility. During the 60-min test, limited-trained mice showed behavioral flexibility by significantly reducing lever pressing in response to the reversed contingency. In contrast, overtrained mice were inflexible, continuing to press at high rates and failing to adjust their behavior despite the absence of reward (<xref ref-type="fig" rid="fig2">Figure 2F</xref>). Consistent with their persistent responding, overtrained mice received significantly fewer reward deliveries than limited-trained mice (<xref ref-type="fig" rid="fig2">Figure 2G</xref>). The number of licks for the omission test did not differ between the groups (<xref ref-type="supplementary-material" rid="SM2">Supplementary Figure S2D</xref>), suggesting consumption was not a contributing factor to the difference in lever pressing.</p>
<p>Twenty-four hours after the initial omission test, all mice completed a 10-min, non-reinforced omission probe test to assess memory consolidation of the new, reversed A-O contingency. Mice with limited training maintained low lever pressing rates, consistent with retention of the altered A-O contingency from the previous day. Conversely, overtrained mice continued to press at high rates, indicating persistent insensitivity to the prior omission contingency and a failure to adapt their behavior despite prior experience (<xref ref-type="fig" rid="fig2">Figure 2H</xref>). The number of licks during this non-reinforced omission probe test did not differ between the groups (<xref ref-type="supplementary-material" rid="SM2">Supplementary Figure S2E</xref>). In summary, these results demonstrate that our novel head-fixed instrumental learning paradigm successfully recapitulates the two distinct modes of behavioral control seen in freely moving models. The use of both devaluation and omission tests confirmed a clear divergence in behavioral strategy, with the limited-trained group exhibiting flexible, goal-directed actions and the overtrained group displaying inflexible habits.</p>
</sec>
<sec id="sec19">
<title>DLS neuronal activity is necessary for the expression of habitual behavior</title>
<p>To further verify the utility of this head-fixed approach, we assessed whether the habitual behavior would rely on the same canonical neuronal systems that have been described in freely moving studies. Thus, using chemogenetics we inhibited neuronal activity in the DLS during devaluation and omission tests in both limited-trained and overtrained mice. WT mice received bilateral DLS microinjections of either a Gi-coupled (Gi) DREADD (AAV2-hSyn-hM4Di-mCherry) or a control (CTL) virus (AAV2-hSyn-mCherry) (<xref ref-type="fig" rid="fig3">Figures 3A</xref>&#x2013;<xref ref-type="fig" rid="fig3">C</xref>). Prior to each testing session (30&#x202F;min), systemic administration of CNO (10&#x202F;mg/kg, i.p.) was performed to activate the DREADD. Prefeed consumption was again measured and did not differ across groups or test day (<xref ref-type="supplementary-material" rid="SM3">Supplementary Figure S3A</xref>).</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Chemogenetic inhibition of DLS suppresses habitual responding and restores goal-directed responding. <bold>(A)</bold> Schematic of surgical strategy enabling bilateral Gi-DREADD expression in DLS neurons. Experimental groups included control (CTL; mCherry) and inhibitory DREADD (Gi; hM4Di-mCherry) mice with either limited training (LT) or overtraining (OT). All mice received 10&#x202F;mg/kg CNO via intraperitoneal (i.p.) injection 30&#x202F;min before each test session. <bold>(B)</bold> Representative image of viral placement in DLS (left), including zoomed image of injector tract (right, DAPI&#x202F;=&#x202F;blue; mCherry&#x202F;=&#x202F;red). <bold>(C)</bold> Placement map of all DREADD and control viruses. <bold>(D)</bold> Devaluation tests showed CTL-OT mice exhibited no difference between valued and devalued days, confirming insensitivity to devaluation. In contrast, CTL-LT, Gi-LT, and Gi-OT mice all had significantly greater responding on the valued versus devalued day (<italic>n</italic>&#x202F;=&#x202F;39: 19M&#x202F;=&#x202F;filled dots, 20F&#x202F;=&#x202F;unfilled dots; three-way ANOVA, test day x training interaction: F<sub>1,35</sub>&#x202F;=&#x202F;9.756, <italic>p</italic>&#x202F;=&#x202F;0.0036, two-stage BKY post hoc test, Gi-LT: <italic>p</italic>&#x202F;=&#x202F;0.0004, CTL-LT: <italic>p</italic>&#x202F;=&#x202F;0.0006, CTL-OT: <italic>p</italic>&#x202F;=&#x202F;0.2550, Gi-OT: <italic>p</italic>&#x202F;=&#x202F;0.0145). The CTL-OT mice pressed significantly more than the Gi-OT mice on the devalued day (<italic>p</italic>&#x202F;=&#x202F;0.0004), statistical result not shown. <bold>(E)</bold> Devaluation index significantly differed between CTL-OT mice and all other groups (<italic>n</italic>&#x202F;=&#x202F;39: 19M, 20F; two-way ANOVA, interaction effect: F<sub>1,35</sub>&#x202F;=&#x202F;4.196, <italic>p</italic>&#x202F;=&#x202F;0.0481, Tukey <italic>post hoc</italic> tests, Gi-LT: <italic>p</italic>&#x202F;=&#x202F;0.0052, CTL-LT: <italic>p</italic>&#x202F;=&#x202F;0.0378, Gi-OT: <italic>p</italic>&#x202F;=&#x202F;0.0047). <bold>(F)</bold> Omission test showed Gi-LT, CTL-LT, and Gi-OT mice significantly reduced active lever pressing compared to CTL-OT mice. (<italic>n</italic>&#x202F;=&#x202F;38: 19M, 19F; two-way ANOVA, interaction effect: F<sub>1,34</sub>&#x202F;=&#x202F;12.16, <italic>p</italic>&#x202F;=&#x202F;0.0014, Tukey <italic>post hoc</italic> tests, Gi-LT: <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, CTL-LT: <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, Gi-OT: <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001). <bold>(G)</bold> Similarly, for the number of reward deliveries received, the CTL-OT group received significantly fewer rewards than the Gi-OT, Gi-LT, and CTL-LT groups, consistent with their persistent, unrewarded pressing (<italic>n</italic>&#x202F;=&#x202F;38: 19M, 19F; two-way ANOVA, interaction effect: F<sub>1,34</sub>&#x202F;=&#x202F;16.71, <italic>p</italic>&#x202F;=&#x202F;0.0003, Tukey post hoc tests, Gi-LT: <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, CTL-LT: <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, Gi-OT: <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001). <bold>(H)</bold> Omission probe test wherein Gi-LT, CTL-LT, and Gi-OT mice significantly reduced active lever pressing relative to CTL-OT mice (<italic>n</italic>&#x202F;=&#x202F;38: 19M, 19F; two-way ANOVA, interaction effect: F<sub>1,34</sub>&#x202F;=&#x202F;9.961, <italic>p</italic>&#x202F;=&#x202F;0.0033, Tukey <italic>post hoc</italic> tests, Gi-LT: <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, CTL-LT: <italic>p</italic>&#x202F;=&#x202F;0.0004, Gi-OT: <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001). See <xref ref-type="supplementary-material" rid="SM4">Supplementary Table S1</xref> for complete analyses. All data are presented as mean &#x00B1; SEM. &#x002A;<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05, &#x002A;&#x002A;<italic>p</italic>&#x202F;&#x003C;&#x202F;0.01, &#x002A;&#x002A;&#x002A;<italic>p</italic>&#x202F;&#x003C;&#x202F;0.001, &#x002A;&#x002A;&#x002A;&#x002A;<italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001.</p>
</caption>
<graphic xlink:href="fnbeh-20-1751553-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel A shows a schematic of chemogenetic inhibition in DLS of wild-type mice via viral injection and CNO administration. Panel B presents fluorescent microscopy images of DLS with mCherry expression and injector track. Panel C displays brain atlas schematics marking DLS injection sites in red at four anterior-posterior levels. Panels D&#x2013;H show bar graphs with individual data points comparing lever presses, devaluation indices, and reward deliveries between experimental groups under devaluation and omission tasks. Statistical significance is annotated on the graphs.</alt-text>
</graphic>
</fig>
<p>During devaluation testing, Gi-limited, CTL-limited, and notably, Gi-overtrained mice all demonstrated sensitivity to devaluation by significantly reducing lever presses on the devalued day compared to the valued day. Conversely, CTL-overtrained mice showed no reduction (<xref ref-type="fig" rid="fig3">Figure 3D</xref>). An effect of the DLS neuronal inhibition was further seen in Gi-overtrained mice pressing significantly less than CTL-overtrained mice on the devalued day, indicating that chemogenetic inhibition of the DLS prevented habit expression and restored goal-directed control in overtrained animals (<xref ref-type="fig" rid="fig3">Figure 3D</xref>, statistical result not shown). To account for individual differences in lever press rates, a devaluation index was calculated. CTL-overtrained mice displayed a higher index&#x2014;indicating insensitivity to devaluation&#x2014;compared to Gi-overtrained, Gi-limited, and CTL-limited mice (<xref ref-type="fig" rid="fig3">Figure 3E</xref>). Thus, Gi-overtrained mice exhibited sensitivity to devaluation, confirming that chemogenetic inhibition of the DLS restored goal-directed control in overtrained mice. Analysis of lick data showed that only the Gi-limited group displayed a significant difference in the number of licks between the valued and devalued test days, while all other groups showed no difference (<xref ref-type="supplementary-material" rid="SM3">Supplementary Figure S3B</xref>).</p>
<p>Next, we examined how chemogenetic DLS inhibition affected responding in omission and omission probe tests. In the omission test, we found that Gi-limited, CTL-limited, and notably, Gi-overtrained mice significantly reduced lever pressing and received more reward deliveries than the CTL-overtrained mice (<xref ref-type="fig" rid="fig3">Figures 3F</xref>,<xref ref-type="fig" rid="fig3">G</xref>). This pattern of responding demonstrates that Gi-overtrained mice, but not CTL-overtrained controls, regained sensitivity to changes in the instrumental contingency following chemogenetic inhibition of the DLS. This distinction persisted into the omission probe test a day later, where Gi-limited, CTL-limited, and Gi-overtrained mice maintained low press rates, while CTL-overtrained mice continued pressing at high rates despite the absence of the cue tone or reward (<xref ref-type="fig" rid="fig3">Figure 3H</xref>). In both omission and omission probe tests, lick data showed no change between any of the groups (<xref ref-type="supplementary-material" rid="SM3">Supplementary Figures S3C,D</xref>), confirming that the observed differences in pressing rates were due to behavioral adaptations and not consumption differences. These results demonstrate that DLS activity is required for the expression of outcome-insensitive responding in overtrained mice, as silencing this region reinstated goal-directed flexibility during both devaluation and omission tests.</p>
<p>Collectively, these results demonstrate that while CTL-overtrained mice continued to exhibit inflexible, habitual responding, the Gi-limited, CTL-limited, and, critically, the DLS-inhibited Gi-overtrained mice all displayed behavioral flexibility, significantly reducing their lever pressing when it no longer resulted in a valued reward. These findings provide strong evidence that chemogenetic inhibition of the DLS suppresses habitual behavior and restores goal-directed control, further validating our paradigm for modeling goal-directed and habitual actions.</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec20">
<title>Discussion</title>
<p>This study introduces and validates a novel head-fixed operant paradigm in mice that reliably produces flexible, goal-directed behavioral control with limited training and inflexible habitual behavior with overtraining. Mice in this paradigm acquired instrumental responses consistently and effectively discriminated between active and inactive levers across different reinforcement schedules. The training regimen determined the behavioral strategy: overtrained mice continued lever pressing despite outcome devaluation and did not reduce pressing when rewards were omitted, whereas mice with limited training adapted their behavior when outcome value or A-O contingencies changed. Importantly, chemogenetic inhibition of the DLS in overtrained mice prevented the expression of habits, restoring sensitivity to devaluation and contingency reversal. This demonstrates that DLS activity is essential for maintaining habits and that these mice regained the ability to flexibly adjust behavior based on changes in expected outcome. These results validate our head-fixed operant paradigm as an effective model for studying both goal-directed and habitual behavior and demonstrate its utility for integration with advanced technologies that require head-fixation, such as <italic>in vivo</italic> imaging and precise circuit manipulations.</p>
<sec id="sec21">
<title>Advancing habit research with head-fixed models</title>
<p>Traditionally, studies of habitual behavior have relied on freely moving operant conditioning, which, while valuable, limits the spatiotemporal resolution and longitudinal tracking of individual neurons necessary for fully capturing the habit formation process. Recently, head-fixed setups have been adapted for various drug and reward self-administration tasks, allowing detailed neural monitoring during goal-directed learning (<xref ref-type="bibr" rid="ref8">Clarke et al., 2024</xref>; <xref ref-type="bibr" rid="ref36">Paniccia et al., 2024</xref>; <xref ref-type="bibr" rid="ref44">Vollmer et al., 2021</xref>; <xref ref-type="bibr" rid="ref45">Vollmer et al., 2022</xref>; <xref ref-type="bibr" rid="ref47">Ward et al., 2025</xref>). Our work builds on this progress by showing that mice in a head-fixed setup not only learn goal-directed actions but can also transition to and sustain habitual behavior. Behavioral outcomes in our paradigm recapitulate key features of habitual control observed in freely moving animals, including insensitivity to outcome devaluation and persistent responding under altered contingencies. Crucially, this paradigm provides a methodological framework for addressing scientific questions that have remained inaccessible in freely moving models. The mechanical stability afforded by head-fixation allows for the longitudinal tracking of neural ensembles across the multi-day transition from goal-directed to habitual states. This level of access facilitates cell-level interrogation of the specific circuit dynamics and population shifts that occur as behaviors consolidate into outcome-insensitive habits. This establishes our system as a powerful, analogous platform for dissecting the neural circuit adaptations underlying habits.</p>
</sec>
<sec id="sec22">
<title>Benefits of 2P microscopy for neural dynamics of habitual behavior</title>
<p>Our head-fixed paradigm&#x2019;s compatibility with high-resolution, 2P microscopy provides an opportunity to observe the precise neural adaptations that drive the transition to habitual behavior. 2P microscopy offers superior resolution, deeper tissue penetration, and reduced phototoxicity, enabling prolonged <italic>in vivo</italic> imaging sessions. This setup provides stable, longitudinal optical access to specific neural populations, allowing us to track cellular and synaptic changes as behaviors consolidate into habits. Crucially, this combined approach enables the direct correlation of single-neuron activity and population dynamics with the moment-to-moment emergence and expression of goal-directed actions and habits. Such detailed, time-resolved tracking of circuit activity during habit formation&#x2014;including the mapping of dynamic neural codes across learning stages and the identification of specific cells recruited during the transition&#x2014;has been largely inaccessible with previous methodologies. This level of interrogation will be essential for fully elucidating the underlying circuit mechanisms of behavioral inflexibility and rigidity.</p>
</sec>
<sec id="sec23">
<title>Causal role of the DLS in habit persistence</title>
<p>Our functional manipulations provide strong support for the established role of the DLS in habitual behavior and, crucially, validate the fidelity of our head-fixed paradigm. The DLS is widely recognized as a critical hub for habit expression. We found that chemogenetic inhibition of the DLS in overtrained mice disrupted the expression of inflexible habits, restoring sensitivity to outcome devaluation and contingency reversal. While these results&#x2014;that DLS activity is necessary for maintaining habits and that its modulation can reinstate goal-directed, flexible control&#x2014;are consistent with findings from freely moving models (<xref ref-type="bibr" rid="ref4">Balleine, 2019</xref>; <xref ref-type="bibr" rid="ref10">Dickinson and Balleine, 1993</xref>; <xref ref-type="bibr" rid="ref29">Malvaez and Wassum, 2018</xref>), our study extends this work by demonstrating that DLS activity is acutely necessary for the real-time expression of habits. Unlike foundational studies that utilized permanent lesions&#x2014;thereby affecting both the acquisition and maintenance of habits&#x2014;our results show that DLS activity is required to maintain the outcome-insensitive state even after a habit has been fully established. By showing that DLS modulation can reinstate behavioral flexibility, our work highlights the DLS as a potent therapeutic target for restoring goal-directed control.</p>
</sec>
<sec id="sec24">
<title>Methodological considerations of reinforcement logic</title>
<p>A unique feature of this paradigm is the use of a consistent VI30s schedule for both limited-trained and overtrained cohorts, rather than the canonical random ratio (RR) to VI dissociation often employed in freely moving studies (<xref ref-type="bibr" rid="ref51">Yin et al., 2005a</xref>; <xref ref-type="bibr" rid="ref27">Malvaez et al., 2018</xref>). This VI&#x202F;&#x2192;&#x202F;VI design was a deliberate methodological choice to isolate training duration as the sole independent variable. By maintaining a single reinforcement logic, we establish a standardized platform for future longitudinal imaging that avoids the confounding neural and behavioral shifts associated with rule transitions. This approach allows for the direct comparison of early-stage versus late-stage VI performance, facilitating the identification of circuit-level shifts that occur as behaviors consolidate into habits. While VI schedules are traditionally associated with accelerated habit formation, our limited-trained mice remained robustly sensitive to both sensory-specific devaluation and contingency omission. This empirical validation confirms that the limited-trained group maintains an A-O associative structure, making them a true goal-directed comparison for the overtrained habit phenotype. Furthermore, modeling the transition within a single VI schedule may more closely recapitulate the graded erosion of behavioral flexibility observed in naturalistic and pathological states, where habits often emerge from consistent, time-based reinforcement rather than shifts in work-to-reward ratios.</p>
</sec>
<sec id="sec25">
<title>Limitations and future directions</title>
<p>While the head-fixed instrumental learning paradigm presented here offers opportunities for investigating the computational neural dynamics of habitual behavior, it is important to acknowledge certain inherent limitations common to such <italic>in vivo</italic> models. While head restraint can potentially induce stress, the successful acquisition of flexible, goal-directed actions, comparable to freely moving studies, strongly suggests adequate acclimation and low confounding stress levels (<xref ref-type="bibr" rid="ref14">Giovanniello et al., 2025</xref>). Future integration of air-lifted platforms could further enhance validity and physiological monitoring. Additionally, while we utilized a consistent VI schedule to isolate the temporal transition from flexible action to habit, we acknowledge that RR schedules classically sustain goal-directed behavior for longer durations. Comparing the neural signatures of our goal-directed VI cohorts to RR-trained animals remains an important future direction to determine how reinforcement logic interacts with the rate of habit consolidation. The simplified motor requirements of head-fixation may also reduce motivational demands relative to freely moving models; future work could introduce high response requirements or more complex task structures to better engage motivated behavior. Furthermore, because the motor requirements of head-fixation are simplified and constrained, this model does not directly assess sensorimotor dimensions of habit related to motor topography, such as the development of automated motor sequences or action chunking. Future iterations of this head-fixed preparation will allow for the integration of high-resolution tracking to investigate how these complex motor features emerge alongside outcome-insensitivity. Despite these considerations, this paradigm provides a robust framework for examining the transition to, and maintenance of, habitual behavior with unparalleled temporal and spatial resolution. Collectively, these identified limitations offer valuable avenues for future model refinement and expansion.</p>
</sec>
</sec>
<sec sec-type="conclusions" id="sec26">
<title>Conclusion</title>
<p>Our results introduce and validate a novel head-fixed operant paradigm that reliably models both goal-directed and habitual behavior in mice. This paradigm demonstrates the transition to and maintenance of habitual control and shows that DLS activity is critically required for sustaining the expression of habits. Importantly, inhibition of the DLS restores behavioral flexibility, allowing animals to adjust actions based on outcome value and contingency changes. Our model provides access to high-resolution neural dynamics, paving the way for deeper insights into habit formation and maintenance, and informing targeted therapeutic strategies for maladaptive habitual actions.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec27">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="ethics-statement" id="sec28">
<title>Ethics statement</title>
<p>The animal study was approved by MUSC Institutional Animal Care and Use Committee. The study was conducted in accordance with the local legislation and institutional requirements.</p>
</sec>
<sec sec-type="author-contributions" id="sec29">
<title>Author contributions</title>
<p>LM: Investigation, Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft, Conceptualization, Formal analysis. LG: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing, Investigation. JBo: Writing &#x2013; review &#x0026; editing, Software, Writing &#x2013; original draft, Methodology. JBa: Writing &#x2013; original draft, Investigation, Writing &#x2013; review &#x0026; editing. MB: Writing &#x2013; review &#x0026; editing, Investigation, Writing &#x2013; original draft. KW: Writing &#x2013; review &#x0026; editing, Supervision, Conceptualization, Writing &#x2013; original draft. JO: Writing &#x2013; review &#x0026; editing, Supervision, Writing &#x2013; original draft, Conceptualization.</p>
</sec>
<sec sec-type="COI-statement" id="sec30">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
<p>The author JO declared that they were an editorial board member of Frontiers, at the time of submission. This had no impact on the peer review process and the final decision.</p>
</sec>
<sec sec-type="ai-statement" id="sec31">
<title>Generative AI statement</title>
<p>The author(s) declared that Generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec32">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec33">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fnbeh.2026.1751553/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fnbeh.2026.1751553/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image_1.jpeg" id="SM1" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>SUPPLEMENTARY FIGURE S1</label>
<caption>
<p>Initial 10% chocolate and vanilla Ensure preference and discrimination. <bold>(A)</bold> Consumption of vanilla (light yellow bar) and chocolate (dark brown bar) during the initial preference test. No difference in consumption for each flavor [<italic>t</italic>(7)=0.35, <italic>p</italic> =&#x202F;0.7398]. <bold>(B)</bold> Percentage preference for vanilla and chocolate, calculated based on the consumption shown in <bold>(A)</bold>. No difference in preference for each flavor [<italic>t</italic>(7)=0.38, <italic>p</italic> =&#x202F;0.7122]. <bold>(C)</bold> Consumption of vanilla and chocolate during the 90-minute prefeed phase, used to selectively devalue one of the flavors. Over the course of both tests there was no difference in prefeed consumption [<italic>t</italic>(7)=0.27, <italic>p</italic> =&#x202F;0.7939]. (<bold>D</bold>) Consumption of the valued flavor and the devalued during a 10-minute probe test following the prefeed. Consumption of the devalued flavor was significantly lower than the valued flavor [<italic>t</italic>(15)=4.48, <italic>p</italic> =&#x202F;0.0004], indicating successful devaluation. <bold>(E)</bold> The calculated devaluation index for each subject. Devaluation index (devalued consumption) / (devalued consumption + valued consumption), scores closer to 0.5 (red dashed line) indicate insensitivity to devaluation and scores closer to 0.0 indicated sensitivity to devaluation. See <xref ref-type="supplementary-material" rid="SM4">Supplementary Table S1</xref> for complete analyses. All data are presented as mean &#x00B1; SEM.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_2.jpeg" id="SM2" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>SUPPLEMENTARY FIGURE S2</label>
<caption>
<p>Sex comparison, prefeed consumption, and lick data across tests. <bold>(A)</bold> Number of lever presses over training paradigms, comparing males (blue) and females (pink), as well as active (filled dot) and inactive (unfilled dot) lever presses. Lever pressing significantly increased across days, with a robust difference observed between the active and inactive lever. Males and females exhibited no significant difference in overall press rate (<italic>n</italic>&#x202F;=&#x202F;27: 14M, 13F; mixed effects, three-way ANOVA, lever effect: F<sub>1,25</sub> =&#x202F;153.9, <italic>p</italic> &#x003C;&#x202F;0.0001, sex effect: F<sub>1,60</sub>&#x202F;=&#x202F;1.974, <italic>p&#x202F;=</italic>&#x202F;0.1652, day x lever interaction: F<sub>1.26,9.44</sub>&#x202F;=&#x202F;5.274, <italic>p</italic> =&#x202F;0.0401). <bold>(B)</bold> Consumption of the valued (filled bar) and the devalued (unfilled bar) flavor during the pre-feeding period did not differ between groups. <bold>(C)</bold> Number of licks during the valued and devalued test days did not differ between groups. <bold>(D)</bold> Total number of licks during the omission test in the limited-trained and overtrained groups did not differ. <bold>(E)</bold> Total number of licks during brief 10-minute omission probe test did not differ between groups. See <xref ref-type="supplementary-material" rid="SM4">Supplementary Table S1</xref> for complete analyses. All data are presented as mean &#x00B1; SEM.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_3.jpeg" id="SM3" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>SUPPLEMENTARY FIGURE S3</label>
<caption>
<p>DREADD prefeed and lick data. <bold>(A)</bold> Consumption of the valued (filled bar) and devalued (unfilled bar) flavor during the prefeed period, across all groups. Limited-trained animals and overtrained animals show similar consumption patterns. <bold>(B)</bold> The total number of licks for the valued and devalued test, Gi-LT mice licked significantly less on the devalued day compared to the valued day, with no difference found for any of the other groups (<italic>n</italic>&#x202F;=&#x202F;39: 19M, 20F; three-way ANOVA, test day effect: F<sub>1,35</sub>&#x202F;=&#x202F;9.110, <italic>p</italic> =&#x202F;0.0047, Two-stage BKY <italic>post hoc</italic> test, Gi-LT: <italic>p</italic> =&#x202F;0.0342). <bold>(C)</bold> Total number of licks during the omission test, no difference between groups. <bold>(D)</bold> Total number of licks during omission probe test, no difference between groups. See <xref ref-type="supplementary-material" rid="SM4">Supplementary Table S1</xref> for complete analyses. All data are presented as mean &#x00B1; SEM.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.pdf" id="SM4" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>SUPPLEMENTARY TABLE S1</label>
<caption>
<p>Supplementary statistical table.</p>
</caption>
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Adams</surname><given-names>C. D.</given-names></name></person-group> (<year>1982</year>). <article-title>Variations in the sensitivity of instrumental responding to reinforcer devaluation</article-title>. <source>Q. J. Exp. Psychol. Sect. B.</source> <volume>34</volume>, <fpage>77</fpage>&#x2013;<lpage>98</lpage>. doi: <pub-id pub-id-type="doi">10.1080/14640748208400878</pub-id></mixed-citation></ref>
<ref id="ref2"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Adams</surname><given-names>C. D.</given-names></name> <name><surname>Dickinson</surname><given-names>A.</given-names></name></person-group> (<year>1981</year>). <article-title>Instrumental responding following reinforcer devaluation</article-title>. <source>Q. J. Exp. Psychol. Sect. B.</source> <volume>33</volume>, <fpage>109</fpage>&#x2013;<lpage>121</lpage>. doi: <pub-id pub-id-type="doi">10.1080/14640748108400816</pub-id></mixed-citation></ref>
<ref id="ref3"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Alloway</surname><given-names>K. D.</given-names></name> <name><surname>Smith</surname><given-names>J. B.</given-names></name> <name><surname>Mowery</surname><given-names>T. M.</given-names></name> <name><surname>Watson</surname><given-names>G. D. R.</given-names></name></person-group> (<year>2017</year>). <article-title>Sensory processing in the dorsolateral striatum: the contribution of thalamostriatal pathways</article-title>. <source>Front. Syst. Neurosci.</source> <volume>11</volume>:<fpage>53</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fnsys.2017.00053</pub-id></mixed-citation></ref>
<ref id="ref4"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Balleine</surname><given-names>B. W.</given-names></name></person-group> (<year>2019</year>). <article-title>The meaning of behavior: discriminating reflex and volition in the brain</article-title>. <source>Neuron</source> <volume>104</volume>, <fpage>47</fpage>&#x2013;<lpage>62</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neuron.2019.09.024</pub-id>, <pub-id pub-id-type="pmid">31600515</pub-id></mixed-citation></ref>
<ref id="ref5"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Balleine</surname><given-names>B. W.</given-names></name> <name><surname>Dickinson</surname><given-names>A.</given-names></name></person-group> (<year>1998</year>). <article-title>Goal-directed instrumental action: contingency and incentive learning and their cortical substrates</article-title>. <source>Neuropharmacology</source> <volume>37</volume>, <fpage>407</fpage>&#x2013;<lpage>419</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0028-3908(98)00033-1</pub-id>, <pub-id pub-id-type="pmid">9704982</pub-id></mixed-citation></ref>
<ref id="ref6"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Belin</surname><given-names>D.</given-names></name> <name><surname>Belin-Rauscent</surname><given-names>A.</given-names></name> <name><surname>Murray</surname><given-names>J. E.</given-names></name> <name><surname>Everitt</surname><given-names>B. J.</given-names></name></person-group> (<year>2013</year>). <article-title>Addiction: failure of control over maladaptive incentive habits</article-title>. <source>Curr. Opin. Neurobiol.</source> <volume>23</volume>, <fpage>564</fpage>&#x2013;<lpage>572</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.conb.2013.01.025</pub-id>, <pub-id pub-id-type="pmid">23452942</pub-id></mixed-citation></ref>
<ref id="ref7"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Belin</surname><given-names>D.</given-names></name> <name><surname>Jonkman</surname><given-names>S.</given-names></name> <name><surname>Dickinson</surname><given-names>A.</given-names></name> <name><surname>Robbins</surname><given-names>T. W.</given-names></name> <name><surname>Everitt</surname><given-names>B. J.</given-names></name></person-group> (<year>2009</year>). <article-title>Parallel and interactive learning processes within the basal ganglia: relevance for the understanding of addiction</article-title>. <source>Behav. Brain Res.</source> <volume>199</volume>, <fpage>89</fpage>&#x2013;<lpage>102</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.bbr.2008.09.027</pub-id>, <pub-id pub-id-type="pmid">18950658</pub-id></mixed-citation></ref>
<ref id="ref8"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Clarke</surname><given-names>R. E.</given-names></name> <name><surname>Grant</surname><given-names>R. I.</given-names></name> <name><surname>Woods</surname><given-names>S. N.</given-names></name> <name><surname>Pagoota</surname><given-names>B. E.</given-names></name> <name><surname>Buchmaier</surname><given-names>S.</given-names></name> <name><surname>Bordieanu</surname><given-names>B.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Corticostriatal ensemble dynamics across heroin self-administration to reinstatement</article-title>. <source>bioRxiv.</source></mixed-citation></ref>
<ref id="ref9"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Corbit</surname><given-names>L. H.</given-names></name> <name><surname>Nie</surname><given-names>H.</given-names></name> <name><surname>Janak</surname><given-names>P. H.</given-names></name></person-group> (<year>2012</year>). <article-title>Habitual alcohol seeking: time course and the contribution of subregions of the dorsal striatum</article-title>. <source>Biol. Psychiatry</source> <volume>72</volume>, <fpage>389</fpage>&#x2013;<lpage>395</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biopsych.2012.02.024</pub-id>, <pub-id pub-id-type="pmid">22440617</pub-id></mixed-citation></ref>
<ref id="ref10"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Dickinson</surname><given-names>A.</given-names></name> <name><surname>Balleine</surname><given-names>B.</given-names></name></person-group> (<year>1993</year>). &#x201C;<chapter-title>Actions and responses: the dual psychology of behaviour</chapter-title>&#x201D; in <source>Spatial representation: problems in philosophy and psychology</source> (<publisher-loc>Malden</publisher-loc>: <publisher-name>Blackwell Publishing</publisher-name>), <fpage>277</fpage>&#x2013;<lpage>293</lpage>.</mixed-citation></ref>
<ref id="ref11"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Dickinson</surname><given-names>A.</given-names></name> <name><surname>Balleine</surname><given-names>B.</given-names></name></person-group> (<year>1999</year>). &#x201C;<chapter-title>Actions and responses: the dual psychology of behaviour</chapter-title>&#x201D; in <source>Spatial representation: problems in philosophy and psychology</source>. eds. <person-group person-group-type="editor"><name><surname>Eilan</surname><given-names>N.</given-names></name> <name><surname>McCarthy</surname><given-names>R.</given-names></name> <name><surname>Brewer</surname><given-names>B.</given-names></name></person-group> (<publisher-loc>Oxford</publisher-loc>: <publisher-name>Oxford University Press</publisher-name>).</mixed-citation></ref>
<ref id="ref12"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Everitt</surname><given-names>B. J.</given-names></name> <name><surname>Robbins</surname><given-names>T. W.</given-names></name></person-group> (<year>2016</year>). <article-title>Drug addiction: updating actions to habits to compulsions ten years on</article-title>. <source>Annu. Rev. Psychol.</source> <volume>67</volume>, <fpage>23</fpage>&#x2013;<lpage>50</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev-psych-122414-033457</pub-id>, <pub-id pub-id-type="pmid">26253543</pub-id></mixed-citation></ref>
<ref id="ref13"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gillan</surname><given-names>C. M.</given-names></name> <name><surname>Kosinski</surname><given-names>M.</given-names></name> <name><surname>Whelan</surname><given-names>R.</given-names></name> <name><surname>Phelps</surname><given-names>E. A.</given-names></name> <name><surname>Daw</surname><given-names>N. D.</given-names></name></person-group> (<year>2016</year>). <article-title>Characterizing a psychiatric symptom dimension related to deficits in goal-directed control</article-title>. <source>Elife</source> <volume>5</volume>:<fpage>e11305</fpage>. doi: <pub-id pub-id-type="doi">10.7554/eLife.11305</pub-id>, <pub-id pub-id-type="pmid">26928075</pub-id></mixed-citation></ref>
<ref id="ref14"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Giovanniello</surname><given-names>J. R.</given-names></name> <name><surname>Paredes</surname><given-names>N.</given-names></name> <name><surname>Wiener</surname><given-names>A.</given-names></name> <name><surname>Ram&#x00ED;rez-Armenta</surname><given-names>K.</given-names></name> <name><surname>Oragwam</surname><given-names>C.</given-names></name> <name><surname>Uwadia</surname><given-names>H. O.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>A dual-pathway architecture for stress to disrupt agency and promote habit</article-title>. <source>Nature</source> <volume>640</volume>, <fpage>722</fpage>&#x2013;<lpage>731</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41586-024-08580-w</pub-id>, <pub-id pub-id-type="pmid">39972126</pub-id></mixed-citation></ref>
<ref id="ref15"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Goltstein</surname><given-names>P. M.</given-names></name> <name><surname>Reinert</surname><given-names>S.</given-names></name> <name><surname>Glas</surname><given-names>A.</given-names></name> <name><surname>Bonhoeffer</surname><given-names>T.</given-names></name> <name><surname>H&#x00FC;bener</surname><given-names>M.</given-names></name></person-group> (<year>2018</year>). <article-title>Food and water restriction lead to differential learning behaviors in a head-fixed two-choice visual discrimination task for mice</article-title>. <source>PLoS One</source> <volume>13</volume>:<fpage>e0204066</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0204066</pub-id></mixed-citation></ref>
<ref id="ref16"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Grant</surname><given-names>R. I.</given-names></name> <name><surname>Doncheck</surname><given-names>E. M.</given-names></name> <name><surname>Vollmer</surname><given-names>K. M.</given-names></name> <name><surname>Winston</surname><given-names>K. T.</given-names></name> <name><surname>Romanova</surname><given-names>E. V.</given-names></name> <name><surname>Siegler</surname><given-names>P. N.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Specialized coding patterns among dorsomedial prefrontal neuronal ensembles predict conditioned reward seeking</article-title>. <source>eLife</source> <volume>10</volume>:<fpage>e65764</fpage>. doi: <pub-id pub-id-type="doi">10.7554/eLife.65764</pub-id></mixed-citation></ref>
<ref id="ref17"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Graybiel</surname><given-names>A. M.</given-names></name></person-group> (<year>2008</year>). <article-title>Habits, rituals, and the evaluative brain</article-title>. <source>Annu. Rev. Neurosci.</source> <volume>31</volume>, <fpage>359</fpage>&#x2013;<lpage>387</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev.neuro.29.051605.112851</pub-id>, <pub-id pub-id-type="pmid">18558860</pub-id></mixed-citation></ref>
<ref id="ref18"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Graybiel</surname><given-names>A. M.</given-names></name> <name><surname>Grafton</surname><given-names>S. T.</given-names></name></person-group> (<year>2015</year>). <article-title>The striatum: where skills and habits meet</article-title>. <source>Cold Spring Harb. Perspect. Biol.</source> <volume>7</volume>:<fpage>a021691</fpage>. doi: <pub-id pub-id-type="doi">10.1101/cshperspect.a021691</pub-id>, <pub-id pub-id-type="pmid">26238359</pub-id></mixed-citation></ref>
<ref id="ref19"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gremel</surname><given-names>C. M.</given-names></name> <name><surname>Costa</surname><given-names>R. M.</given-names></name></person-group> (<year>2013</year>). <article-title>Orbitofrontal and striatal circuits dynamically encode the shift between goal-directed and habitual actions</article-title>. <source>Nat. Commun.</source> <volume>4</volume>:<fpage>2264</fpage>. doi: <pub-id pub-id-type="doi">10.1038/ncomms3264</pub-id>, <pub-id pub-id-type="pmid">23921250</pub-id></mixed-citation></ref>
<ref id="ref20"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Guo</surname><given-names>Z. V.</given-names></name> <name><surname>Hires</surname><given-names>S. A.</given-names></name> <name><surname>Li</surname><given-names>N.</given-names></name> <name><surname>O'Connor</surname><given-names>D. H.</given-names></name> <name><surname>Komiyama</surname><given-names>T.</given-names></name> <name><surname>Ophir</surname><given-names>E.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Procedures for behavioral experiments in head-fixed mice</article-title>. <source>PLoS One</source> <volume>9</volume>:<fpage>e88678</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0088678</pub-id>, <pub-id pub-id-type="pmid">24520413</pub-id></mixed-citation></ref>
<ref id="ref21"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hogarth</surname><given-names>L.</given-names></name> <name><surname>Balleine</surname><given-names>B. W.</given-names></name> <name><surname>Corbit</surname><given-names>L. H.</given-names></name> <name><surname>Killcross</surname><given-names>S.</given-names></name></person-group> (<year>2013</year>). <article-title>Associative learning mechanisms underpinning the transition from recreational drug use to addiction</article-title>. <source>Ann. N. Y. Acad. Sci.</source> <volume>1282</volume>, <fpage>12</fpage>&#x2013;<lpage>24</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1749-6632.2012.06768.x</pub-id>, <pub-id pub-id-type="pmid">23126270</pub-id></mixed-citation></ref>
<ref id="ref22"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname><given-names>B. O.</given-names></name> <name><surname>Cruz</surname><given-names>A. M.</given-names></name> <name><surname>Kim</surname><given-names>T. H.</given-names></name> <name><surname>Spencer</surname><given-names>H. F.</given-names></name> <name><surname>Smith</surname><given-names>R. J.</given-names></name></person-group> (<year>2022</year>). <article-title>Discriminating goal-directed and habitual cocaine seeking in rats using a novel outcome devaluation procedure</article-title>. <source>Learn. Mem.</source> <volume>29</volume>, <fpage>447</fpage>&#x2013;<lpage>457</lpage>. doi: <pub-id pub-id-type="doi">10.1101/lm.053621.122</pub-id>, <pub-id pub-id-type="pmid">36621907</pub-id></mixed-citation></ref>
<ref id="ref23"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jonkman</surname><given-names>S.</given-names></name> <name><surname>Pelloux</surname><given-names>Y.</given-names></name> <name><surname>Everitt</surname><given-names>B. J.</given-names></name></person-group> (<year>2012</year>). <article-title>Differential roles of the dorsolateral and midlateral striatum in punished cocaine seeking</article-title>. <source>J. Neurosci.</source> <volume>32</volume>, <fpage>4645</fpage>&#x2013;<lpage>4650</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.0348-12.2012</pub-id>, <pub-id pub-id-type="pmid">22457510</pub-id></mixed-citation></ref>
<ref id="ref24"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lipton</surname><given-names>D. M.</given-names></name> <name><surname>Gonzales</surname><given-names>B. J.</given-names></name> <name><surname>Citri</surname><given-names>A.</given-names></name></person-group> (<year>2019</year>). <article-title>Dorsal striatal circuits for habits, compulsions and addictions</article-title>. <source>Front. Syst. Neurosci.</source> <volume>13</volume>:<fpage>28</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fnsys.2019.00028</pub-id>, <pub-id pub-id-type="pmid">31379523</pub-id></mixed-citation></ref>
<ref id="ref25"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mahler</surname><given-names>S. V.</given-names></name> <name><surname>Brodnik</surname><given-names>Z. D.</given-names></name> <name><surname>Cox</surname><given-names>B. M.</given-names></name> <name><surname>Buchta</surname><given-names>W. C.</given-names></name> <name><surname>Bentzley</surname><given-names>B. S.</given-names></name> <name><surname>Quintanilla</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Chemogenetic manipulations of ventral tegmental area dopamine neurons reveal multifaceted roles in cocaine abuse</article-title>. <source>J. Neurosci.</source> <volume>39</volume>, <fpage>503</fpage>&#x2013;<lpage>518</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.0537-18.2018</pub-id></mixed-citation></ref>
<ref id="ref26"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Malvaez</surname><given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>Neural substrates of habit</article-title>. <source>J. Neurosci. Res.</source> <volume>98</volume>, <fpage>986</fpage>&#x2013;<lpage>997</lpage>. doi: <pub-id pub-id-type="doi">10.1002/jnr.24552</pub-id>, <pub-id pub-id-type="pmid">31693205</pub-id></mixed-citation></ref>
<ref id="ref27"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Malvaez</surname><given-names>M.</given-names></name> <name><surname>Greenfield</surname><given-names>V. Y.</given-names></name> <name><surname>Matheos</surname><given-names>D. P.</given-names></name> <name><surname>Angelillis</surname><given-names>N. A.</given-names></name> <name><surname>Murphy</surname><given-names>M. D.</given-names></name> <name><surname>Kennedy</surname><given-names>P. J.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Habits are negatively regulated by histone deacetylase 3 in the dorsal striatum</article-title>. <source>Biol. Psychiatry</source> <volume>84</volume>, <fpage>383</fpage>&#x2013;<lpage>392</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biopsych.2018.01.025</pub-id>, <pub-id pub-id-type="pmid">29571524</pub-id></mixed-citation></ref>
<ref id="ref28"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Malvaez</surname><given-names>M.</given-names></name> <name><surname>Liang</surname><given-names>A.</given-names></name> <name><surname>Hall</surname><given-names>B. S.</given-names></name> <name><surname>Giovanniello</surname><given-names>J. R.</given-names></name> <name><surname>Paredes</surname><given-names>N.</given-names></name> <name><surname>Gonzalez</surname><given-names>J. Y.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Striatal cell-type specific encoding stability and reorganization for agency and habit</article-title>. <source>bioRxiv.</source></mixed-citation></ref>
<ref id="ref29"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Malvaez</surname><given-names>M.</given-names></name> <name><surname>Wassum</surname><given-names>K. M.</given-names></name></person-group> (<year>2018</year>). <article-title>Regulation of habit formation in the dorsal striatum</article-title>. <source>Curr. Opin. Behav. Sci.</source> <volume>20</volume>, <fpage>67</fpage>&#x2013;<lpage>74</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cobeha.2017.11.005</pub-id>, <pub-id pub-id-type="pmid">29713658</pub-id></mixed-citation></ref>
<ref id="ref30"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Martiros</surname><given-names>N.</given-names></name> <name><surname>Burgess</surname><given-names>A. A.</given-names></name> <name><surname>Graybiel</surname><given-names>A. M.</given-names></name></person-group> (<year>2018</year>). <article-title>Inversely active striatal projection neurons and interneurons selectively delimit useful behavioral sequences</article-title>. <source>Curr. Biol.</source> <volume>28</volume>, <fpage>560</fpage>&#x2013;<lpage>73.e5</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cub.2018.01.031</pub-id>, <pub-id pub-id-type="pmid">29429614</pub-id></mixed-citation></ref>
<ref id="ref31"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Murray</surname><given-names>J. E.</given-names></name> <name><surname>Dilleen</surname><given-names>R.</given-names></name> <name><surname>Pelloux</surname><given-names>Y.</given-names></name> <name><surname>Economidou</surname><given-names>D.</given-names></name> <name><surname>Dalley</surname><given-names>J. W.</given-names></name> <name><surname>Belin</surname><given-names>D.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Increased impulsivity retards the transition to dorsolateral striatal dopamine control of cocaine seeking</article-title>. <source>Biol. Psychiatry</source> <volume>76</volume>, <fpage>15</fpage>&#x2013;<lpage>22</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biopsych.2013.09.011</pub-id>, <pub-id pub-id-type="pmid">24157338</pub-id></mixed-citation></ref>
<ref id="ref32"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>O&#x2019;Hare</surname><given-names>J. K.</given-names></name> <name><surname>Ade</surname><given-names>K. K.</given-names></name> <name><surname>Sukharnikova</surname><given-names>T.</given-names></name> <name><surname>Van Hooser</surname><given-names>S. D.</given-names></name> <name><surname>Palmeri</surname><given-names>M. L.</given-names></name> <name><surname>Yin</surname><given-names>H. H.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Pathway-specific striatal substrates for habitual behavior</article-title>. <source>Neuron</source> <volume>89</volume>, <fpage>472</fpage>&#x2013;<lpage>479</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neuron.2015.12.032</pub-id></mixed-citation></ref>
<ref id="ref33"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>O&#x2019;Hare</surname><given-names>J. K.</given-names></name> <name><surname>Li</surname><given-names>H.</given-names></name> <name><surname>Kim</surname><given-names>N.</given-names></name> <name><surname>Gaidis</surname><given-names>E.</given-names></name> <name><surname>Ade</surname><given-names>K.</given-names></name> <name><surname>Beck</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>Striatal fast-spiking interneurons selectively modulate circuit output and are required for habitual behavior</article-title>. <source>Elife</source> <volume>6</volume>:<fpage>e26231</fpage>. doi: <pub-id pub-id-type="doi">10.7554/eLife.26231</pub-id>, <pub-id pub-id-type="pmid">28871960</pub-id></mixed-citation></ref>
<ref id="ref34"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Otis</surname><given-names>J. M.</given-names></name> <name><surname>Namboodiri</surname><given-names>V. M.</given-names></name> <name><surname>Matan</surname><given-names>A. M.</given-names></name> <name><surname>Voets</surname><given-names>E. S.</given-names></name> <name><surname>Mohorn</surname><given-names>E. P.</given-names></name> <name><surname>Kosyk</surname><given-names>O.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>Prefrontal cortex output circuits guide reward seeking through divergent cue encoding</article-title>. <source>Nature</source> <volume>543</volume>, <fpage>103</fpage>&#x2013;<lpage>107</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nature21376</pub-id>, <pub-id pub-id-type="pmid">28225752</pub-id></mixed-citation></ref>
<ref id="ref35"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Otis</surname><given-names>J. M.</given-names></name> <name><surname>Zhu</surname><given-names>M.</given-names></name> <name><surname>Namboodiri</surname><given-names>V. M. K.</given-names></name> <name><surname>Cook</surname><given-names>C. A.</given-names></name> <name><surname>Kosyk</surname><given-names>O.</given-names></name> <name><surname>Matan</surname><given-names>A. M.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Paraventricular thalamus projection neurons integrate cortical and hypothalamic signals for cue-reward processing</article-title>. <source>Neuron</source> <volume>103</volume>, <fpage>423</fpage>&#x2013;<lpage>31.e4</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neuron.2019.05.018</pub-id></mixed-citation></ref>
<ref id="ref36"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Paniccia</surname><given-names>J. E.</given-names></name> <name><surname>Vollmer</surname><given-names>K. M.</given-names></name> <name><surname>Green</surname><given-names>L. M.</given-names></name> <name><surname>Grant</surname><given-names>R. I.</given-names></name> <name><surname>Winston</surname><given-names>K. T.</given-names></name> <name><surname>Buchmaier</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Restoration of a paraventricular thalamo-accumbal behavioral suppression circuit prevents reinstatement of heroin seeking</article-title>. <source>Neuron</source> <volume>112</volume>, <fpage>772</fpage>&#x2013;<lpage>85.e9</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neuron.2023.11.024</pub-id>, <pub-id pub-id-type="pmid">38141605</pub-id></mixed-citation></ref>
<ref id="ref37"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Peak</surname><given-names>J.</given-names></name> <name><surname>Hart</surname><given-names>G.</given-names></name> <name><surname>Balleine</surname><given-names>B. W.</given-names></name></person-group> (<year>2019</year>). <article-title>From learning to action: the integration of dorsal striatal input and output pathways in instrumental conditioning</article-title>. <source>Eur. J. Neurosci.</source> <volume>49</volume>, <fpage>658</fpage>&#x2013;<lpage>671</lpage>. doi: <pub-id pub-id-type="doi">10.1111/ejn.13964</pub-id>, <pub-id pub-id-type="pmid">29791051</pub-id></mixed-citation></ref>
<ref id="ref38"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rossi</surname><given-names>M. A.</given-names></name> <name><surname>Yin</surname><given-names>H. H.</given-names></name></person-group> (<year>2012</year>). <article-title>Methods for studying habitual behavior in mice</article-title>. <source>Curr. Protoc. Neurosci.</source> <volume>8</volume>:<fpage>8.29</fpage>. doi: <pub-id pub-id-type="doi">10.1002/0471142301.ns0829s60</pub-id></mixed-citation></ref>
<ref id="ref39"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Thorn</surname><given-names>C. A.</given-names></name> <name><surname>Atallah</surname><given-names>H.</given-names></name> <name><surname>Howe</surname><given-names>M.</given-names></name> <name><surname>Graybiel</surname><given-names>A. M.</given-names></name></person-group> (<year>2010</year>). <article-title>Differential dynamics of activity changes in dorsolateral and dorsomedial striatal loops during learning</article-title>. <source>Neuron</source> <volume>66</volume>, <fpage>781</fpage>&#x2013;<lpage>795</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neuron.2010.04.036</pub-id>, <pub-id pub-id-type="pmid">20547134</pub-id></mixed-citation></ref>
<ref id="ref40"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tricomi</surname><given-names>E.</given-names></name> <name><surname>Balleine</surname><given-names>B. W.</given-names></name> <name><surname>O'Doherty</surname><given-names>J. P.</given-names></name></person-group> (<year>2009</year>). <article-title>A specific role for posterior dorsolateral striatum in human habit learning</article-title>. <source>Eur. J. Neurosci.</source> <volume>29</volume>, <fpage>2225</fpage>&#x2013;<lpage>2232</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1460-9568.2009.06796.x</pub-id>, <pub-id pub-id-type="pmid">19490086</pub-id></mixed-citation></ref>
<ref id="ref41"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vandaele</surname><given-names>Y.</given-names></name> <name><surname>Janak</surname><given-names>P. H.</given-names></name></person-group> (<year>2018</year>). <article-title>Defining the place of habit in substance use disorders</article-title>. <source>Prog. Neuro-Psychopharmacol. Biol. Psychiatry</source> <volume>87</volume>, <fpage>22</fpage>&#x2013;<lpage>32</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.pnpbp.2017.06.029</pub-id>, <pub-id pub-id-type="pmid">28663112</pub-id></mixed-citation></ref>
<ref id="ref42"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vandaele</surname><given-names>Y.</given-names></name> <name><surname>Mahajan</surname><given-names>N. R.</given-names></name> <name><surname>Ottenheimer</surname><given-names>D. J.</given-names></name> <name><surname>Richard</surname><given-names>J. M.</given-names></name> <name><surname>Mysore</surname><given-names>S. P.</given-names></name> <name><surname>Janak</surname><given-names>P. H.</given-names></name></person-group> (<year>2019</year>). <article-title>Distinct recruitment of dorsomedial and dorsolateral striatum erodes with extended training</article-title>. <source>Elife</source> <volume>8</volume>:<fpage>e49536</fpage>. doi: <pub-id pub-id-type="doi">10.7554/eLife.49536</pub-id></mixed-citation></ref>
<ref id="ref43"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vanderschuren</surname><given-names>L. J.</given-names></name> <name><surname>Di Ciano</surname><given-names>P.</given-names></name> <name><surname>Everitt</surname><given-names>B. J.</given-names></name></person-group> (<year>2005</year>). <article-title>Involvement of the dorsal striatum in cue-controlled cocaine seeking</article-title>. <source>J. Neurosci.</source> <volume>25</volume>, <fpage>8665</fpage>&#x2013;<lpage>8670</lpage>. doi: <pub-id pub-id-type="doi">10.1523/jneurosci.0925-05.2005</pub-id>, <pub-id pub-id-type="pmid">16177034</pub-id></mixed-citation></ref>
<ref id="ref44"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vollmer</surname><given-names>K. M.</given-names></name> <name><surname>Doncheck</surname><given-names>E. M.</given-names></name> <name><surname>Grant</surname><given-names>R. I.</given-names></name> <name><surname>Winston</surname><given-names>K. T.</given-names></name> <name><surname>Romanova</surname><given-names>E. V.</given-names></name> <name><surname>Bowen</surname><given-names>C. W.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>A novel assay allowing drug self-administration, extinction, and reinstatement testing in head-restrained mice</article-title>. <source>Front. Behav. Neurosci.</source> <volume>15</volume>:<fpage>744715</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fnbeh.2021.744715</pub-id>, <pub-id pub-id-type="pmid">34776891</pub-id></mixed-citation></ref>
<ref id="ref45"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vollmer</surname><given-names>K. M.</given-names></name> <name><surname>Green</surname><given-names>L. M.</given-names></name> <name><surname>Grant</surname><given-names>R. I.</given-names></name> <name><surname>Winston</surname><given-names>K. T.</given-names></name> <name><surname>Doncheck</surname><given-names>E. M.</given-names></name> <name><surname>Bowen</surname><given-names>C. W.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>An opioid-gated thalamoaccumbal circuit for the suppression of reward seeking in mice</article-title>. <source>Nat. Commun.</source> <volume>13</volume>:<fpage>6865</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-022-34517-w</pub-id></mixed-citation></ref>
<ref id="ref47"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ward</surname><given-names>A. L.</given-names></name> <name><surname>Winston</surname><given-names>K. T.</given-names></name> <name><surname>Buchmaier</surname><given-names>S.</given-names></name> <name><surname>Cooper</surname><given-names>C. J.</given-names></name> <name><surname>Clarke</surname><given-names>R. E.</given-names></name> <name><surname>Martino</surname><given-names>M. R.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>A model of ethanol self-administration in head-fixed mice</article-title>. <source>Alcohol. Clin. Exp. Res.</source> <volume>49</volume>, <fpage>2103</fpage>&#x2013;<lpage>2112</lpage>. doi: <pub-id pub-id-type="doi">10.1111/acer.70132</pub-id>, <pub-id pub-id-type="pmid">40776452</pub-id></mixed-citation></ref>
<ref id="ref48"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yin</surname><given-names>H. H.</given-names></name> <name><surname>Knowlton</surname><given-names>B. J.</given-names></name></person-group> (<year>2004</year>). <article-title>Contributions of striatal subregions to place and response learning</article-title>. <source>Learn. Mem.</source> <volume>11</volume>, <fpage>459</fpage>&#x2013;<lpage>463</lpage>. doi: <pub-id pub-id-type="doi">10.1101/lm.81004</pub-id>, <pub-id pub-id-type="pmid">15286184</pub-id></mixed-citation></ref>
<ref id="ref49"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yin</surname><given-names>H. H.</given-names></name> <name><surname>Knowlton</surname><given-names>B. J.</given-names></name></person-group> (<year>2006</year>). <article-title>The role of the basal ganglia in habit formation</article-title>. <source>Nat. Rev. Neurosci.</source> <volume>7</volume>, <fpage>464</fpage>&#x2013;<lpage>476</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nrn1919</pub-id>, <pub-id pub-id-type="pmid">16715055</pub-id></mixed-citation></ref>
<ref id="ref50"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yin</surname><given-names>H. H.</given-names></name> <name><surname>Knowlton</surname><given-names>B. J.</given-names></name> <name><surname>Balleine</surname><given-names>B. W.</given-names></name></person-group> (<year>2004</year>). <article-title>Lesions of dorsolateral striatum preserve outcome expectancy but disrupt habit formation in instrumental learning</article-title>. <source>Eur. J. Neurosci.</source> <volume>19</volume>, <fpage>181</fpage>&#x2013;<lpage>189</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1460-9568.2004.03095.x</pub-id>, <pub-id pub-id-type="pmid">14750976</pub-id></mixed-citation></ref>
<ref id="ref51"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yin</surname><given-names>H. H.</given-names></name> <name><surname>Knowlton</surname><given-names>B. J.</given-names></name> <name><surname>Balleine</surname><given-names>B. W.</given-names></name></person-group> (<year>2005a</year>). <article-title>Blockade of NMDA receptors in the dorsomedial striatum prevents action-outcome learning in instrumental conditioning</article-title>. <source>Eur. J. Neurosci.</source> <volume>22</volume>, <fpage>505</fpage>&#x2013;<lpage>512</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1460-9568.2005.04219.x</pub-id>, <pub-id pub-id-type="pmid">16045503</pub-id></mixed-citation></ref>
<ref id="ref52"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yin</surname><given-names>H. H.</given-names></name> <name><surname>Knowlton</surname><given-names>B. J.</given-names></name> <name><surname>Balleine</surname><given-names>B. W.</given-names></name></person-group> (<year>2006</year>). <article-title>Inactivation of dorsolateral striatum enhances sensitivity to changes in the action-outcome contingency in instrumental conditioning</article-title>. <source>Behav. Brain Res.</source> <volume>166</volume>, <fpage>189</fpage>&#x2013;<lpage>196</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.bbr.2005.07.012</pub-id></mixed-citation></ref>
<ref id="ref53"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yin</surname><given-names>H. H.</given-names></name> <name><surname>Ostlund</surname><given-names>S. B.</given-names></name> <name><surname>Knowlton</surname><given-names>B. J.</given-names></name> <name><surname>Balleine</surname><given-names>B. W.</given-names></name></person-group> (<year>2005b</year>). <article-title>The role of the dorsomedial striatum in instrumental conditioning</article-title>. <source>Eur. J. Neurosci.</source> <volume>22</volume>, <fpage>513</fpage>&#x2013;<lpage>523</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1460-9568.2005.04218.x</pub-id>, <pub-id pub-id-type="pmid">16045504</pub-id></mixed-citation></ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/750709/overview">Jasper Heinsbroek</ext-link>, University of Alabama at Birmingham, United States</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3291830/overview">Linda Simmler</ext-link>, University of Basel, Switzerland</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3298108/overview">Adam C. G. Crego</ext-link>, Brown University, United States</p>
</fn>
</fn-group>
</back>
</article>