<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD with MathML3 v1.3 20210610//EN"  "JATS-archivearticle1-3-mathml3.dtd"><article xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="1.3"><front><journal-meta><journal-id journal-id-type="nlm-ta">elife</journal-id><journal-id journal-id-type="publisher-id">eLife</journal-id><journal-title-group><journal-title>eLife</journal-title></journal-title-group><issn publication-format="electronic" pub-type="epub">2050-084X</issn><publisher><publisher-name>eLife Sciences Publications, Ltd</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">93191</article-id><article-id pub-id-type="doi">10.7554/eLife.93191</article-id><article-id pub-id-type="doi" specific-use="version">10.7554/eLife.93191.4</article-id><article-version article-version-type="publication-state">version of record</article-version><article-categories><subj-group subj-group-type="display-channel"><subject>Research Article</subject></subj-group><subj-group subj-group-type="heading"><subject>Computational and Systems Biology</subject></subj-group><subj-group subj-group-type="heading"><subject>Neuroscience</subject></subj-group></article-categories><title-group><article-title>Evidence from pupillometry, fMRI, and RNN modelling shows that gain neuromodulation mediates task-relevant perceptual switches</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name><surname>Wainstein</surname><given-names>Gabriel</given-names></name><contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-8106-6647</contrib-id><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">†</xref><xref ref-type="fn" rid="con1"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author" equal-contrib="yes"><name><surname>Whyte</surname><given-names>Christopher J</given-names></name><contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-4627-0503</contrib-id><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">†</xref><xref ref-type="fn" rid="con2"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author"><name><surname>Ehgoetz Martens</surname><given-names>Kaylena A</given-names></name><contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-8488-2295</contrib-id><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="con3"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author"><name><surname>Müller</surname><given-names>Eli J</given-names></name><contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0003-2497-0194</contrib-id><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="con4"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author"><name><surname>Medel</surname><given-names>Vicente</given-names></name><contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0003-2443-8683</contrib-id><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="fn" rid="con5"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author"><name><surname>Anderson</surname><given-names>Britt</given-names></name><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="con6"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author"><name><surname>Stöttinger</surname><given-names>Elisabeth</given-names></name><contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0003-4544-8944</contrib-id><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="fn" rid="con7"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author"><name><surname>Danckert</surname><given-names>James</given-names></name><contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0001-8093-066X</contrib-id><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="con8"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author" equal-contrib="yes"><name><surname>Munn</surname><given-names>Brandon R</given-names></name><contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-3638-1605</contrib-id><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">†</xref><xref ref-type="fn" rid="con9"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name><surname>Shine</surname><given-names>James M</given-names></name><contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0003-1762-5499</contrib-id><email>mac.shine@sydney.edu.au</email><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">†</xref><xref ref-type="other" rid="fund1"/><xref ref-type="other" rid="fund2"/><xref ref-type="fn" rid="con10"/><xref ref-type="fn" rid="conf1"/></contrib><aff id="aff1"><label>1</label><institution-wrap><institution-id institution-id-type="ror">https://ror.org/0384j8v12</institution-id><institution>Brain and Mind Center, The University of Sydney</institution></institution-wrap><addr-line><named-content content-type="city">Sydney</named-content></addr-line><country>Australia</country></aff><aff id="aff2"><label>2</label><institution-wrap><institution-id institution-id-type="ror">https://ror.org/0384j8v12</institution-id><institution>Center for Complex Systems, The University of Sydney</institution></institution-wrap><addr-line><named-content content-type="city">Sydney</named-content></addr-line><country>Australia</country></aff><aff id="aff3"><label>3</label><institution-wrap><institution-id institution-id-type="ror">https://ror.org/01aff2v68</institution-id><institution>The University of Waterloo</institution></institution-wrap><addr-line><named-content content-type="city">Waterloo</named-content></addr-line><country>Canada</country></aff><aff id="aff4"><label>4</label><institution-wrap><institution-id institution-id-type="ror">https://ror.org/0326knt82</institution-id><institution>Latin American Brain Health (BrainLat), Universidad Adolfo Ibáñez</institution></institution-wrap><addr-line><named-content content-type="city">Santiago</named-content></addr-line><country>Chile</country></aff><aff id="aff5"><label>5</label><institution-wrap><institution-id institution-id-type="ror">https://ror.org/03hj50651</institution-id><institution>Hochschule Fresenius</institution></institution-wrap><addr-line><named-content content-type="city">Köln</named-content></addr-line><country>Germany</country></aff></contrib-group><contrib-group content-type="section"><contrib contrib-type="editor"><name><surname>Donner</surname><given-names>Tobias H</given-names></name><role>Reviewing Editor</role><aff><institution-wrap><institution-id institution-id-type="ror">https://ror.org/01zgy1s35</institution-id><institution>University Medical Center Hamburg-Eppendorf</institution></institution-wrap><country>Germany</country></aff></contrib><contrib contrib-type="senior_editor"><name><surname>Gold</surname><given-names>Joshua I</given-names></name><role>Senior Editor</role><aff><institution-wrap><institution-id institution-id-type="ror">https://ror.org/00b30xv10</institution-id><institution>University of Pennsylvania</institution></institution-wrap><country>United States</country></aff></contrib></contrib-group><author-notes><fn fn-type="con" id="equal-contrib1"><label>†</label><p>These authors contributed equally to this work</p></fn></author-notes><pub-date publication-format="electronic" date-type="publication"><day>20</day><month>06</month><year>2025</year></pub-date><volume>13</volume><elocation-id>RP93191</elocation-id><history><date date-type="sent-for-review" iso-8601-date="2023-10-19"><day>19</day><month>10</month><year>2023</year></date></history><pub-history><event><event-desc>This manuscript was published as a preprint.</event-desc><date date-type="preprint" iso-8601-date="2023-09-27"><day>27</day><month>09</month><year>2023</year></date><self-uri content-type="preprint" xlink:href="https://doi.org/10.21203/rs.3.rs-2356429/v3"/></event><event><event-desc>This manuscript was published as a reviewed preprint.</event-desc><date date-type="reviewed-preprint" iso-8601-date="2024-01-25"><day>25</day><month>01</month><year>2024</year></date><self-uri content-type="reviewed-preprint" xlink:href="https://doi.org/10.7554/eLife.93191.1"/></event><event><event-desc>The reviewed preprint was revised.</event-desc><date date-type="reviewed-preprint" iso-8601-date="2025-02-27"><day>27</day><month>02</month><year>2025</year></date><self-uri content-type="reviewed-preprint" xlink:href="https://doi.org/10.7554/eLife.93191.2"/></event><event><event-desc>The reviewed preprint was revised.</event-desc><date date-type="reviewed-preprint" iso-8601-date="2025-05-15"><day>15</day><month>05</month><year>2025</year></date><self-uri content-type="reviewed-preprint" xlink:href="https://doi.org/10.7554/eLife.93191.3"/></event></pub-history><permissions><copyright-statement>© 2024, Wainstein, Whyte et al</copyright-statement><copyright-year>2024</copyright-year><copyright-holder>Wainstein, Whyte et al</copyright-holder><ali:free_to_read/><license xlink:href="http://creativecommons.org/licenses/by/4.0/"><ali:license_ref>http://creativecommons.org/licenses/by/4.0/</ali:license_ref><license-p>This article is distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License</ext-link>, which permits unrestricted use and redistribution provided that the original author and source are credited.</license-p></license></permissions><self-uri content-type="pdf" xlink:href="elife-93191-v1.pdf"/><self-uri content-type="figures-pdf" xlink:href="elife-93191-figures-v1.pdf"/><abstract><p>Perceptual updating has been hypothesised to rely on a network reset modulated by bursts of ascending neuromodulatory neurotransmitters, such as noradrenaline, abruptly altering the brain’s susceptibility to changing sensory activity. To test this hypothesis at a large-scale, we analysed an ambiguous figures task using pupillometry and functional magnetic resonance imaging (fMRI). Behaviourally, qualitative shifts in the perceptual interpretation of an ambiguous image were associated with peaks in pupil diameter, an indirect readout of phasic bursts in neuromodulatory tone. We further hypothesised that stimulus ambiguity drives neuromodulatory tone, leading to heightened neural gain, hastening perceptual switches. To explore this hypothesis computationally, we trained a recurrent neural network (RNN) on an analogous perceptual categorisation task, allowing gain to change dynamically with classification uncertainty. As predicted, higher gain accelerated perceptual switching by transiently destabilising the network’s dynamical regime in periods of maximal uncertainty. We leveraged a low-dimensional readout of the RNN dynamics to develop two novel macroscale predictions: perceptual switches should occur with peaks in low-dimensional brain state velocity and with a flattened egocentric energy landscape. Using fMRI, we confirmed these predictions, highlighting the role of the neuromodulatory system in the large-scale network reconfigurations mediating adaptive perceptual updates.</p></abstract><kwd-group kwd-group-type="author-keywords"><kwd>fMRI</kwd><kwd>pupillometry</kwd><kwd>neural network</kwd><kwd>switching</kwd><kwd>perception</kwd><kwd>neuromodulation</kwd></kwd-group><kwd-group kwd-group-type="research-organism"><title>Research organism</title><kwd>Human</kwd></kwd-group><funding-group><award-group id="fund1"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/501100000925</institution-id><institution>National Health and Medical Research Council</institution></institution-wrap></funding-source><principal-award-recipient><name><surname>Shine</surname><given-names>James M</given-names></name></principal-award-recipient></award-group><award-group id="fund2"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/501100000923</institution-id><institution>Australian Research Council</institution></institution-wrap></funding-source><principal-award-recipient><name><surname>Shine</surname><given-names>James M</given-names></name></principal-award-recipient></award-group><funding-statement>The funders had no role in study design, data collection and interpretation, or the decision to submit the work for publication.</funding-statement></funding-group><custom-meta-group><custom-meta specific-use="meta-only"><meta-name>Author impact statement</meta-name><meta-value>Phasic neuromodulatory bursts actively drive adaptive perceptual updating by triggering large-scale brain network reconfigurations, as demonstrated through integrated pupillometry, fMRI, and computational modelling.</meta-value></custom-meta><custom-meta specific-use="meta-only"><meta-name>publishing-route</meta-name><meta-value>prc</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>The overwhelming majority of neurons in our brains have only indirect interactions with the external world. This means that the identity of sensory inputs is inherently ambiguous (<xref ref-type="bibr" rid="bib9">Bogacz, 2017</xref>; <xref ref-type="bibr" rid="bib27">Flounders et al., 2019</xref>; <xref ref-type="bibr" rid="bib28">Friston, 2005</xref>; <xref ref-type="bibr" rid="bib36">Hohwy, 2013</xref>; <xref ref-type="bibr" rid="bib16">Clark, 2013</xref>). The equivocal nature of perceptual input is overcome by incorporating prior information about the causal structure of the world into sensory inferences. This is clearly evidenced in laboratory experiments that present participants with sensory inputs that offer two equally valid yet mutually exclusive perceptual interpretations (e.g. the Necker cube illusion and binocular rivalry): in these ambiguous scenarios, observers periodically switch between mutually exclusive percepts (<xref ref-type="bibr" rid="bib34">Hohwy et al., 2008</xref>; <xref ref-type="bibr" rid="bib1">Alais and Blake, 2005</xref>; <xref ref-type="bibr" rid="bib89">van Ee, 2005</xref>).</p><p>Outside of conditions of extreme perceptual ambiguity, perceptual awareness is remarkably stable, suggesting that the nervous system can rapidly (and flexibly) identify the best ‘match’ between visual data and a stable (likely known) stimulus category (<xref ref-type="bibr" rid="bib34">Hohwy et al., 2008</xref>; <xref ref-type="bibr" rid="bib35">Hohwy, 2012</xref>). Importantly, this process of combining ambiguous sensory input with prior information must be dynamic: adaptive behaviour requires that the relative reliability of prior information and current sensory input are made suitably contextually dependent (<xref ref-type="bibr" rid="bib51">Moran et al., 2013</xref>; <xref ref-type="bibr" rid="bib77">Shine et al., 2021</xref>; <xref ref-type="bibr" rid="bib59">Parr and Friston, 2018</xref>; <xref ref-type="bibr" rid="bib58">Parr and Friston, 2017</xref>). In ecological settings, the problem is even more pronounced: not only does the reliability of the sensory input vary, the urgency of perceptual decision-making also changes between context (<xref ref-type="bibr" rid="bib85">Thura et al., 2020</xref>; <xref ref-type="bibr" rid="bib8">Bogacz et al., 2006</xref>; <xref ref-type="bibr" rid="bib56">Murphy et al., 2016</xref>).</p><p>Neuroimaging studies investigating perceptual updating and switches have typically identified a distributed set of regions within the cerebral cortex (<xref ref-type="bibr" rid="bib79">Stöttinger et al., 2015</xref>; <xref ref-type="bibr" rid="bib96">Weilnhammer et al., 2017</xref>). These cortical regions are presumed to play a role in attentional shifts driving switches in perceptual contents by selectively boosting activity within the relevant circuits (<xref ref-type="bibr" rid="bib96">Weilnhammer et al., 2017</xref>; <xref ref-type="bibr" rid="bib65">Reynolds and Heeger, 2009</xref>; <xref ref-type="bibr" rid="bib20">Desimone and Duncan, 1995</xref>). This interpretation is complemented by behavioural evidence showing that attention plays a prominent role in determining the contents of perception in bistable perception tasks where competition is not resolved at low-levels of the visual hierarchy (<xref ref-type="bibr" rid="bib49">Meng and Tong, 2004</xref>; <xref ref-type="bibr" rid="bib22">Dieter and Tadin, 2011</xref>). Similarly, computational models of perceptual decision-making typically consist of winner-take-all competition between cortical populations (<xref ref-type="bibr" rid="bib99">Wong and Wang, 2006</xref>; <xref ref-type="bibr" rid="bib24">Eckhoff et al., 2011</xref>; <xref ref-type="bibr" rid="bib95">Wang, 2002</xref>). Yet, the ability to flexibly respond to ambiguous visual inputs according to changing task demands is a feature that is present across phylogeny (<xref ref-type="bibr" rid="bib15">Cisek, 2019</xref>) and hence is present in a wide variety of animals that have poorly developed cerebral cortices (<xref ref-type="bibr" rid="bib13">Carter et al., 2020</xref>). Indeed, phasic change in the highly conserved ascending arousal system have been linked to moment-by-moment adaptive updates in the relative weighting of prior information, sensory input, and the urgency of the perceptual decision process through neuromodulatory-mediated alterations in neural gain (<xref ref-type="bibr" rid="bib68">Sales et al., 2019</xref>; <xref ref-type="bibr" rid="bib90">Vincent et al., 2019</xref>; <xref ref-type="bibr" rid="bib42">Jordan and Keller, 2023</xref>; <xref ref-type="bibr" rid="bib55">Murphy et al., 2014</xref>).</p><p>The ascending neuromodulatory system, and specifically the noradrenergic locus coeruleus (LC), is well-suited to modulate the large-scale, brain state switches required to flexibly alter perceptual contents (<xref ref-type="bibr" rid="bib83">Szabadi, 2018</xref>; <xref ref-type="bibr" rid="bib11">Briand et al., 2007</xref>). While the cell body of the LC is located in the brainstem, the nucleus sends projections throughout the central nervous system, wherein its axons release noradrenaline, which in turn modulate the excitability of targeted regions (<xref ref-type="bibr" rid="bib77">Shine et al., 2021</xref>). In previous work, it has been argued that the phasic release of noradrenaline from the LC acts as a ‘network reset’ signal, which effectively disrupts ongoing processing, and hence allows animals to reconfigure their ongoing neural dynamics towards more salient (and hopefully, behaviourally relevant) processes (<xref ref-type="bibr" rid="bib70">Sara, 2009</xref>; <xref ref-type="bibr" rid="bib38">Jacob and Nienborg, 2018</xref>; <xref ref-type="bibr" rid="bib10">Bouret and Sara, 2005</xref>). This mechanism is of critical importance in ecological contexts in which an animal needs to be able to both focus on the current task in an exploitative mode (such as foraging), while being able to rapidly modify its internal, attentional, and behavioural state when required (e.g. if resources are depleted, or in the presence of a predator).</p><p>Preliminary evidence in the context of bistable perception has shown that when a stimulus is task-relevant, pupil diameter (a non-specific and indirect readout of phasic LC activity [<xref ref-type="bibr" rid="bib44">Joshi and Gold, 2020</xref>; <xref ref-type="bibr" rid="bib69">Samuels and Szabadi, 2008</xref>; <xref ref-type="bibr" rid="bib61">Pfeffer et al., 2022</xref>; <xref ref-type="bibr" rid="bib19">de Gee et al., 2020</xref>] and neuromodulatory tone) is tightly linked to switches in the content of perception (<xref ref-type="bibr" rid="bib55">Murphy et al., 2014</xref>; <xref ref-type="bibr" rid="bib25">Einhäuser et al., 2008</xref>; <xref ref-type="bibr" rid="bib64">Reimer et al., 2016</xref>). In line with this, recent modelling has shown that linking perceptual updates to fluctuations in neuromodulatory tone recapitulates the phasic-tonic firing rate pattern known to characterise LC spiking dynamics and improves performance in reinforcement learning tasks (<xref ref-type="bibr" rid="bib68">Sales et al., 2019</xref>). Thus, whilst the LC could plausibly mediate perceptual switches in a task-relevant setting, we still need a more robust test of this hypothesis.</p><p>Based on previous work (<xref ref-type="bibr" rid="bib70">Sara, 2009</xref>; <xref ref-type="bibr" rid="bib38">Jacob and Nienborg, 2018</xref>; <xref ref-type="bibr" rid="bib10">Bouret and Sara, 2005</xref>; <xref ref-type="bibr" rid="bib75">Shine, 2019</xref>; <xref ref-type="bibr" rid="bib93">Wainstein et al., 2021</xref>), and the projections of the LC to many of the regions implicated in whole-brain imaging studies of perceptual uncertainty (<xref ref-type="bibr" rid="bib69">Samuels and Szabadi, 2008</xref>; <xref ref-type="bibr" rid="bib17">de Gee et al., 2014</xref>; <xref ref-type="bibr" rid="bib18">de Gee et al., 2017</xref>), we hypothesised that task-related perceptual switches can be modulated by phasic bursts of LC activity, which act as a ‘network reset’ (<xref ref-type="bibr" rid="bib10">Bouret and Sara, 2005</xref>), flattening the whole-brain energy landscape (<xref ref-type="bibr" rid="bib54">Munn et al., 2021</xref>) and thus allowing cortical dynamics to evolve into a new state thereby changing the contents of perception.</p><p>To test this hypothesis, we leveraged a cognitive task designed to investigate switches in perceptual categorisation (<xref ref-type="bibr" rid="bib80">Stöttinger et al., 2016</xref>). We observed that pupil diameter peaked at the point of the perceptual switch and predicted their timing. We then trained a recurrent neural network (RNN) to perform an analogous change detection task. Based on previous modelling and theory, we allowed the gain of the activation function (an established mechanism for the action of noradrenaline on the cerebral cortex; <xref ref-type="bibr" rid="bib77">Shine et al., 2021</xref>; <xref ref-type="bibr" rid="bib74">Shine et al., 2018</xref>; <xref ref-type="bibr" rid="bib72">Servan-schreiber, 2016</xref>) to vary as a function of the uncertainty in the pretrained network’s perceptual categorisation. This revealed that heightened gain facilitated earlier perceptual switches by transiently destabilising the network’s dynamics under conditions of maximal uncertainty. Further analyses translated these neural dynamics into two predictions that could be tested in fMRI data (<xref ref-type="bibr" rid="bib79">Stöttinger et al., 2015</xref>; <xref ref-type="bibr" rid="bib80">Stöttinger et al., 2016</xref>): (1) heightened gain increases the velocity of low-dimensional neural trajectories around perceptual switches, and (2) it flattens the energy landscape of the neural state space (<xref ref-type="bibr" rid="bib54">Munn et al., 2021</xref>). Overall, our results support the hypothesis that phasic bursts of neuromodulatory activity act as a ‘network reset’ (<xref ref-type="bibr" rid="bib70">Sara, 2009</xref>; <xref ref-type="bibr" rid="bib10">Bouret and Sara, 2005</xref>), dynamically disrupting stable network states and facilitating switches in perceptual categorisation. This reset mechanism highlights the role of neuromodulatory systems in transiently reorganising network dynamics to enhance flexibility and adaptability in response to uncertainty.</p></sec><sec id="s2" sec-type="results"><title>Results</title><sec id="s2-1"><title>Evoked pupil dilations coincide with the resolution of perceptual ambiguity</title><p>To assess the role of the ascending arousal activity during task performance, we analysed a dataset of 35 participants who performed an ambiguous figures task whilst simultaneously recording pupil diameter with an eye tracker device (SR Research, 1000 Hz). Briefly, the task consisted of a set of continuously transforming images that transition from an initial object (e.g. a shark) into a second object (e.g. a plane), while preserving basic psychophysical attributes (<xref ref-type="fig" rid="fig1">Figure 1A</xref>). Crucially, even though the task stimuli change incrementally and linearly, with maximal ambiguity at the mid-point of each trial (the peak of the dotted line curve in <xref ref-type="fig" rid="fig1">Figure 1A</xref>), awareness of a change in the stimulus is known to ‘pop out’, often at different times on each trial (<xref ref-type="bibr" rid="bib80">Stöttinger et al., 2016</xref>). When these perceptual switches occurred, subjects were instructed to change the button they were pressing, thus indicating a change in perceptual interpretation across stimuli. Participants viewed 20 unique sets of images, each of which morphed from a starting image into a second image through 15 equally spaced intermittent stages (<xref ref-type="fig" rid="fig1">Figure 1A</xref>). For each participant, we identified the first and last time they viewed a sequence of images, as well as the three images leading up to and following an identified perceptual switch, irrespective of the categories associated with each specific object switch. The rest of the analyses in this article are organised around this perceptual transition.</p><fig id="fig1" position="float"><label>Figure 1.</label><caption><title>Pupil diameter tracks perceptual change.</title><p>(<bold>A</bold>) Example trial showing the continuous change from a stable image (plane) into a shark; Lower: the probability of detecting a switch (<italic>Δ</italic>) as a function of Image – most switches occur around the mid-point, but not exclusively so, leading to our prediction of heightened locus coeruleus activity at the switch point. (<bold>B</bold>) Representation of the locus coeruleus (red), its diffuse projections to the whole-brain network and its link to pupil dilation. (<bold>C</bold>) Pupil diameter group average evoked response time locked to the perceptual change (dark line, <italic>t=</italic>0). We observed an increase of the pupillary response that peaked at the perceptual change. (<bold>D</bold>) Group average of evoked pupillary responses to image switches – red represents the faster response when the switch occurs at image 6; green indicates a medium response with the switch at image 8; and blue denotes the slowest response with the switch at image 10.</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig1-v1.tif"/></fig><p>Given the known (admittedly non-specific) relationship between LC activity and the dynamics of pupil diameter (<xref ref-type="bibr" rid="bib43">Joshi et al., 2016</xref>; <xref ref-type="fig" rid="fig1">Figure 1B</xref>), we were able to test the hypothesis that neuromodulatory tone is associated with perceptual switching. The linear nature of the morphing procedure meant that luminance levels (which could otherwise bias pupil diameter; <xref ref-type="bibr" rid="bib83">Szabadi, 2018</xref>; <xref ref-type="bibr" rid="bib44">Joshi and Gold, 2020</xref>; <xref ref-type="bibr" rid="bib69">Samuels and Szabadi, 2008</xref>) were kept constant across all trials. Additionally, motor preparation was controlled by requiring subjects to press a button on each image (indicating the content of their perception). Mapping all blink-corrected, filtered, and normalised trials over time.</p><p>We observed a clear increase in the phasic pupillary response approximately three trials before participants switched to a new perceptual category, potentially reflecting the onset of increased ambiguity towards a new object (<xref ref-type="fig" rid="fig1">Figure 1C</xref>). This response peaked at the point of the perceptual switch, corresponding to the maximum pupil diameter (<xref ref-type="fig" rid="fig1">Figure 1C</xref>). Further analysis revealed a significant increase in the mean pupil response starting three images before the change point (mean <italic>β</italic>=0.22; <italic>t</italic><sub>(32)</sub> = 8.02, p=2.3 × 10<sup>−19</sup>), before returning to baseline levels.</p><p>Next, we sought to elucidate the relationship between ascending arousal, quantified by pupil diameter, and the temporal dynamics of perceptual shifts on a trial-by-trial basis. Given the pivotal role of the LC in modulating sensory processing and perceptual switches (<xref ref-type="fig" rid="fig1">Figure 1B</xref>), we hypothesised that the speed of a perceptual switch would correlate with neuromodulatory tone. Specifically, we predicted that trials with faster perceptual switches would be associated with an increase in pupil diameter, while slower switches would correspond to a decrease.</p><p>To test this prediction, we performed a two-level linear model analysis. The peak pupil diameter observed during the perceptual switch was designated as the independent variable, and the trial on which the perceptual shift was reported served as the regressor for each subject. To control for potential confounds, such as impulsive premature responses, and address reduced statistical power in extreme response epochs (both early and late), we limited our analysis to responses within two images from the median switch point (9±2; 84.1% of total trials). At the group level, we conducted a one-tailed <italic>t</italic>-test on the regressors from the linear model. As expected, we observed an inverse relationship between evoked pupil diameter and the trial marking the perceptual switch (mean <italic>β</italic>=–0.19, <italic>t</italic><sub>(27)</sub>=–2.6452, p=6.7 × 10⁻³, SD=0.3880). Earlier responses showed a positive relationship with higher evoked pupil diameter during the switch epoch (<xref ref-type="fig" rid="fig1">Figure 1D</xref>, red), whereas later responses were associated with a more constricted pupil (<xref ref-type="fig" rid="fig1">Figure 1D</xref>, blue). In summary, these results provide indirect evidence for our hypothesis that ascending neuromodulation – such as LC activity – is associated with the speed of perceptual switches.</p></sec><sec id="s2-2"><title>Computational evidence for neuromodulatory-mediated perceptual switches in a recurrent neural network</title><p>Our initial results provided confirmatory evidence implicating the neuromodulatory tone of the ascending arousal system in perceptual switches. There is evidence, however, suggesting that simply changing stimulus categories can also induce similar pupillary dilations (<xref ref-type="bibr" rid="bib25">Einhäuser et al., 2008</xref>; <xref ref-type="bibr" rid="bib37">Hupé et al., 2009</xref>, <xref ref-type="bibr" rid="bib46">Kloosterman et al., 2015</xref>). What we need, therefore, is a more mechanistic means of both framing and testing our network reset hypothesis in the context of perceptual switching. Along with others (<xref ref-type="bibr" rid="bib47">Kosciessa et al., 2021</xref>; <xref ref-type="bibr" rid="bib26">Eldar et al., 2013</xref>; <xref ref-type="bibr" rid="bib88">Urai et al., 2017</xref>; <xref ref-type="bibr" rid="bib46">Kloosterman et al., 2015</xref>), we have used a combination of computational modelling (<xref ref-type="bibr" rid="bib74">Shine et al., 2018</xref>; <xref ref-type="bibr" rid="bib52">Müller et al., 2020</xref>), neurobiological theory (<xref ref-type="bibr" rid="bib77">Shine et al., 2021</xref>), and multi-model neuroimaging (<xref ref-type="bibr" rid="bib65">Reynolds and Heeger, 2009</xref>; <xref ref-type="bibr" rid="bib13">Carter et al., 2020</xref>; <xref ref-type="bibr" rid="bib55">Murphy et al., 2014</xref>; <xref ref-type="bibr" rid="bib83">Szabadi, 2018</xref>) to suggest that noradrenaline alters neural gain (<xref ref-type="bibr" rid="bib72">Servan-schreiber, 2016</xref>; <xref ref-type="bibr" rid="bib3">Aston-Jones and Cohen, 2005</xref>), which in turn affects inter-regional communication flattening the energy landscape traversed by the brain’s dynamics allowing the brain state to jump between perceptual attractors more easily. Whether these signatures of large-scale network reconfiguration are mechanistically related to network reset remains an important and open question.</p><p>To test whether our hypothesised neuromodulatory mechanism could recapitulate the behaviour we observed in the ambiguous figures task, we trained 50 continuous time RNNs constrained to respect Dale’s law (i.e. 80/20 split of purely excitatory/inhibitory units; <xref ref-type="bibr" rid="bib78">Song et al., 2016</xref>; <xref ref-type="bibr" rid="bib100">Yang and Wang, 2020</xref>) to perform a perceptual change detection task analogous to the task performed by our participants (<xref ref-type="fig" rid="fig2">Figure 2A</xref>). The input and readout weights were constrained to be purely excitatory and only the firing rate of excitatory units contributed to the readout (<xref ref-type="bibr" rid="bib78">Song et al., 2016</xref>; see ‘Methods’).</p><fig-group><fig id="fig2" position="float"><label>Figure 2.</label><caption><title>A recurrent neural network (RNN) model of perceptual switching.</title><p>(<bold>A</bold>) We trained a continuous time E/I RNN to categorise linearly changing inputs representing two discrete categories (e.g. output z<sub>1</sub> and output z<sub>2</sub>). (<bold>B</bold>) Softmax of network outputs on example trial with <inline-formula><alternatives><mml:math id="inf1"><mml:mi>γ</mml:mi><mml:mo>=</mml:mo><mml:mo>.</mml:mo><mml:mn>6</mml:mn></mml:math><tex-math id="inft1">\begin{document}$\gamma =.6$\end{document}</tex-math></alternatives></inline-formula>, dotted line shows the timing of the perceptual switch. (<bold>C</bold>) Following training, the firing rate of the excitatory units was clearly separated into two stimulus-selective clusters – those that responded maximally to u<sub>1</sub> (blue) and those that respond maximally to u<sub>2</sub> (orange). Inhibitory units demonstrated a similar modular clustering but were sorted by the selectivity of the excitatory units they inhibited. (<bold>D</bold>) Dynamics of gain on example trial with <inline-formula><alternatives><mml:math id="inf2"><mml:mi>γ</mml:mi><mml:mo>=</mml:mo><mml:mo>.</mml:mo><mml:mn>6</mml:mn></mml:math><tex-math id="inft2">\begin{document}$\gamma =.6$\end{document}</tex-math></alternatives></inline-formula> which peaks close to the perceptual switch (inset shows similarity to pupil diameter). (<bold>E</bold>) Simplified network structure implied by selectivity analysis. Excitatory units (blue) form two stimulus-selective modules. Each excitatory cluster is inhibited by a cluster of inhibitory units and a third non-selective inhibitory population. Pipette shows lesion targets. (<bold>F</bold>) Switch time as a function of <inline-formula><alternatives><mml:math id="inf3"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft3">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> magnitude (i.e. magnitude of uncertainty forcing). Lower black line shows a speeding effect of heightened <inline-formula><alternatives><mml:math id="inf4"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft4">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> (and therefore heightened gain at the perceptual switch). Teal lines show switch time for lesions to the inhibitory population targeting the initially dominant population (dark teal upper), and lesions to the inhibitory population selective for the stimulus the input is morphing into (light teal middle).</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig2-v1.tif"/></fig><fig id="fig2s1" position="float" specific-use="child-fig"><label>Figure 2—figure supplement 1.</label><caption><title>Switch time as a function of gain for the network simulated with static (i.e. constant) gain.</title></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig2-figsupp1-v1.tif"/></fig><fig id="fig2s2" position="float" specific-use="child-fig"><label>Figure 2—figure supplement 2.</label><caption><title>Left selectivity of excitatory units (0: completely selective for <inline-formula><alternatives><mml:math id="inf5"><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft5">\begin{document}$u_{1}$\end{document}</tex-math></alternatives></inline-formula>, 1: completely selective for <inline-formula><alternatives><mml:math id="inf6"><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft6">\begin{document}$u_{2}$\end{document}</tex-math></alternatives></inline-formula>).</title><p>Right selectivity of inhibitory units sorted by the degree to which they inhibit excitatory units with selectivity &gt;0.5 or &lt;0.5.</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig2-figsupp2-v1.tif"/></fig></fig-group><p>Each network was provided with a two-dimensional input <inline-formula><alternatives><mml:math id="inf7"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>u</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>t</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mo stretchy="false">[</mml:mo><mml:msub><mml:mi>u</mml:mi><mml:mn>1</mml:mn></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi>u</mml:mi><mml:mn>2</mml:mn></mml:msub><mml:msup><mml:mo stretchy="false">]</mml:mo><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft7">\begin{document}$u\left (t\right)=[u_1,u_2]^T$\end{document}</tex-math></alternatives></inline-formula> with each column representing the ‘sensory evidence’ for each of the two stimulus categories (<xref ref-type="fig" rid="fig2">Figure 2A</xref>). The task lasted for 1 s of simulation time (we used a shorter time period for the simulation than the empirical task so that we could keep the integration step relatively small, making the training and simulations more numerically tractable): to mimic the linear transition between image categories in our task, each trial began with maximum evidence for one of the two categoriesand minimum evidence for the other (e.g. <inline-formula><alternatives><mml:math id="inf8"><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:math><tex-math id="inft8">\begin{document}$u_{1}=1,u_{2}=0$\end{document}</tex-math></alternatives></inline-formula>), and then linearly changed the evidence over the course of each trial such that by the final time-step the evidence for each category had switched (e.g. <inline-formula><alternatives><mml:math id="inf9"><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:math><tex-math id="inft9">\begin{document}$u_{1}=0,u_{2}=1$\end{document}</tex-math></alternatives></inline-formula>). At each time point, the network was trained to output a categorical response indicating which input dimension had a higher value (<xref ref-type="fig" rid="fig2">Figure 2B</xref>). Following training, all networks achieved near-perfect behavioural accuracy (0.97±0.02).</p><p>We next sought to test our hypothesis about the role of neural gain in perceptual switches. In previous work, we (and others) have argued that the impact of neuromodulators (such as NA) on population-level activity can be approximated by steepening (or flattening) the sigmoid activation function, thus mimicking the effect NA has on neuronal excitability by liberating intracellular calcium stores and/or opening (or closing) voltage-gated ions channels (<xref ref-type="bibr" rid="bib77">Shine et al., 2021</xref>; <xref ref-type="bibr" rid="bib94">Wainstein et al., 2022</xref>). As a first test of this hypothesis, we manipulated the <italic>gain</italic> of the sigmoid activation function for all units in the network across a range of gain values (0.5–1.5) in a static manner. As predicted, increased gain (red; corresponding to heightened adrenergic tone) leads to earlier ‘perceptual switches’ in the network output whereas low gain caused later switches (<xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1</xref>).</p><p>Having confirmed that static manipulations of gain alter the speed of perceptual switches, we constructed a more precise test of our hypothesis. Specifically, inspired by previous theoretical and experimental work showing that sensory prediction errors (i.e. transient increases in perceptual uncertainty) lead to phasic bursts in the noradrenergic LC (<xref ref-type="bibr" rid="bib68">Sales et al., 2019</xref>; <xref ref-type="bibr" rid="bib42">Jordan and Keller, 2023</xref>), we made gain time dependent with dynamics governed by a linear ODE with a forcing term proportional to the uncertainty (i.e. the entropy <inline-formula><alternatives><mml:math id="inf10"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>H</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:munder><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:munder><mml:mi>p</mml:mi><mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mi>l</mml:mi><mml:mi>n</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>p</mml:mi><mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math><tex-math id="inft10">\begin{document}$H\left (z\right)=\sum _{i}p\left (z\right)_{i}ln\left (p\left (z\right)_{i}\right)$\end{document}</tex-math></alternatives></inline-formula>) of the network’s readout (<xref ref-type="fig" rid="fig2">Figure 2A</xref>).<disp-formula id="equ1"><alternatives><mml:math id="m1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mi>τ</mml:mi><mml:mfrac><mml:mrow><mml:mi>d</mml:mi><mml:mi>g</mml:mi></mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:mfrac><mml:mo>=</mml:mo><mml:msub><mml:mi>g</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>−</mml:mo><mml:mi>g</mml:mi><mml:mo>+</mml:mo><mml:mi>γ</mml:mi><mml:mi>H</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t1">\begin{document}$$\displaystyle \tau \frac{dg}{dt}= g_{tonic}- g +\gamma H\left (z\right)$$\end{document}</tex-math></alternatives></disp-formula></p><p>When the network’s readout becomes uncertain approaching the perceptual switch (i.e. has high entropy), gain increases in a phasic manner (with magnitude <inline-formula><alternatives><mml:math id="inf11"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft11">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula>), and in the absence of the forcing, gain decays exponentially to its tonic value (<inline-formula><alternatives><mml:math id="inf12"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>g</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mstyle></mml:math><tex-math id="inft12">\begin{document}$g_{tonic}=1$\end{document}</tex-math></alternatives></inline-formula>). This modification resulted in gain dynamics reminiscent of the participant’s pupil diameter (<xref ref-type="fig" rid="fig2">Figure 2D</xref>), and crucially, the speed of perceptual switches increased with the magnitude of the uncertainty-driven forcing term (<inline-formula><alternatives><mml:math id="inf13"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft13">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula>; <xref ref-type="fig" rid="fig2">Figure 2F</xref>).</p><p>Having confirmed our hypothesis that increasing gain as a function of the network uncertainty increased the speed of perceptual switches, we next sought to understand the mechanisms governing this effect starting with the circuit level and working our way up to the population level (c.f. Sheringtonian and Hopfieldian modes of analysis; <xref ref-type="bibr" rid="bib4">Barack and Krakauer, 2021</xref>). Because of the constraint that the input and output weights were strictly positive, we could use their (normalised) value as a measure of stimulus selectivity. Inspection of the firing rates sorted by input weights revealed that the networks had learned to complete the task by segregating both excitatory and inhibitory units into two stimulus-selective clusters (<xref ref-type="fig" rid="fig2">Figure 2C</xref>). As the inhibitory units could not contribute to the networks read out, we hypothesised that they likely played an indirect role in perceptual switching by inhibiting the population of excitatory neurons selective for the currently dominant stimulus, allowing the competing population to take over and a perceptual switch to occur.</p><p>To test this hypothesis, we sorted the inhibitory units by the selectivity of the excitatory units they inhibit (i.e. by the normalised value of the readout weights). Inspecting the histogram of this selectivity metric revealed a bimodal distribution, with peaks at each extreme strongly inhibiting a stimulus-selective excitatory population at the exclusion of the other (<xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2</xref>). Based on the fact that leading up to the perceptual switch point both the input and firing rate of the dominant population are higher than the competing population, we hypothesised that gain likely speeds perceptual switches by actively inhibiting the currently dominant population rather than exciting/disinhibiting the competing population. We predicted, therefore, that lesioning the inhibitory units selective for the stimulus (i.e. with normalised selectivity &gt;0.5) that is initially dominant would dramatically slow perceptual switches, whilst lesioning the inhibitory units selective for the stimulus the input is morphing into would have a comparatively minor slowing effect on switch times since the population is not receiving sufficient input to take over until approximately half-way through the trial irrespective of the inhibition it receives. As selectivity is not entirely one-to-one, we expect both lesions to slow perceptual switches but differ in magnitude. In line with our prediction, lesioning the inhibitory units strongly selective for the initially dominant population greatly slowed perceptual switches (<xref ref-type="fig" rid="fig2">Figure 2F</xref>, upper), whereas lesioning the population selective for the stimulus the input morphs into removed the speeding effect of gain but had a comparatively small slowing effect on perceptual switches (<xref ref-type="fig" rid="fig2">Figure 2F</xref>, lower).</p><p>Having found a circuit-level explanation for the speeding effect of gain, we next sought to understand the network’s behaviour at a population level by interrogating the parameter space (with dimensions defined by network input and gain) traversed by the network. Unlike standard non-linear dynamical systems with stationary or (very) slowly time-varying parameters, input and gain change rapidly over the course of each trial, dynamically shifting the location and existence of the attractors shaping the network dynamics. Each trial is, therefore, characterised by a trajectory through a two-dimensional parameter space with dimensions corresponding to the gain of the activation function and the mismatch between input dimensions (<inline-formula><alternatives><mml:math id="inf14"><mml:mi>Δ</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>p</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:math><tex-math id="inft14">\begin{document}$\Delta input$\end{document}</tex-math></alternatives></inline-formula>).</p><p>Based on the selectivity of the network firing rates, we hypothesised that the dynamics were shaped by a fixed-point attractor, whose location and existence were determined by gain and Δ<italic>input</italic>, and changed dynamically over the course of a single trial (<xref ref-type="bibr" rid="bib6">Beer, 2022</xref>; <xref ref-type="bibr" rid="bib5">Beer, 2000</xref>; <xref ref-type="bibr" rid="bib82">Sussillo, 2014</xref>; <xref ref-type="bibr" rid="bib81">Sussillo and Barak, 2013</xref>). Because of the large size of the network, we could not solve for the fixed points or study their stability analytically. Instead, we opted for a numerical approach and characterised the dynamical regime (i.e. the location and existence of approximate fixed-point attractors) across all combinations of (static) gain and <inline-formula><alternatives><mml:math id="inf15"><mml:mi>Δ</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>p</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:math><tex-math id="inft15">\begin{document}$\Delta input$\end{document}</tex-math></alternatives></inline-formula> visited by the network. Specifically, for each combination of elements in the parameter space <inline-formula><alternatives><mml:math id="inf16"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>θ</mml:mi><mml:mo>∈</mml:mo><mml:msup><mml:mi>R</mml:mi><mml:mrow><mml:mi>g</mml:mi><mml:mi>a</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mo>×</mml:mo><mml:mi mathvariant="normal">Δ</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>p</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft16">\begin{document}$\theta \in R^{gain\times \Delta input}$\end{document}</tex-math></alternatives></inline-formula> we ran 100 simulations with initial conditions (firing rates) drawn from a uniform distribution between [0,1], and let the dynamics run for 10 s of simulation time (10 times the length of the task – longer simulation times did not qualitatively change the results) without noise. As we were interested in the existence of fixed-point attractors rather than their precise location, at each time point we computed the difference in firing rate between successive time points (<inline-formula><alternatives><mml:math id="inf17"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi mathvariant="normal">Δ</mml:mi><mml:mi>r</mml:mi><mml:mo>=</mml:mo><mml:munder><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:munder><mml:msub><mml:mi>r</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>t</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>−</mml:mo><mml:msub><mml:mi>r</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>t</mml:mi><mml:mo>−</mml:mo><mml:mi mathvariant="normal">Δ</mml:mi><mml:mi>t</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math><tex-math id="inft17">\begin{document}$\Delta r=\sum _{i}r_{i}\left (t\right)- r_{i}\left (t- \Delta t\right)$\end{document}</tex-math></alternatives></inline-formula>) across the network. For each simulation, we computed both the proportion of trials that converged to a value of <inline-formula><alternatives><mml:math id="inf18"><mml:mi>Δ</mml:mi><mml:mi>r</mml:mi></mml:math><tex-math id="inft18">\begin{document}$\Delta r$\end{document}</tex-math></alternatives></inline-formula> below 10<sup>-2</sup> giving us proxy for the presence of fixed points, and the time to convergence, giving us a measure of the ‘strength’ of the attractor.</p><p>Across gain values when <inline-formula><alternatives><mml:math id="inf19"><mml:mi>Δ</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>p</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:math><tex-math id="inft19">\begin{document}$\Delta input$\end{document}</tex-math></alternatives></inline-formula> had unambiguous values (<inline-formula><alternatives><mml:math id="inf20"><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>≫</mml:mo><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft20">\begin{document}$u_{1}\gg u_{2}$\end{document}</tex-math></alternatives></inline-formula> or <inline-formula><alternatives><mml:math id="inf21"><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>≫</mml:mo><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft21">\begin{document}$u_{2}\gg u_{1}$\end{document}</tex-math></alternatives></inline-formula>), the network rapidly converged across all initialisations (<xref ref-type="fig" rid="fig3">Figure 3A and C–H</xref>). When <inline-formula><alternatives><mml:math id="inf22"><mml:mi>Δ</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>p</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:math><tex-math id="inft22">\begin{document}$\Delta input$\end{document}</tex-math></alternatives></inline-formula> became ambiguous, however, the dynamics acquired a decaying (inhibition-driven) oscillation and on many trials did not converge within the time frame of the simulation. As gain increased, the range of <inline-formula><alternatives><mml:math id="inf23"><mml:mi>Δ</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>p</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:math><tex-math id="inft23">\begin{document}$\Delta input$\end{document}</tex-math></alternatives></inline-formula> values characterised by oscillatory dynamics broadened. Crucially, for sufficiently high values of gain, ambiguous <inline-formula><alternatives><mml:math id="inf24"><mml:mi>Δ</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>p</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:math><tex-math id="inft24">\begin{document}$\Delta input$\end{document}</tex-math></alternatives></inline-formula> values transitioned the network into a regime characterised by high-amplitude oscillations (<xref ref-type="fig" rid="fig3">Figure 3D and G</xref>). Each trial can, therefore, be characterised by a trajectory through this two-dimensional parameter space, with dynamics shaped by the dynamical regimes of each location visited (<xref ref-type="fig" rid="fig3">Figure 3A and B</xref>).</p><fig-group><fig id="fig3" position="float"><label>Figure 3.</label><caption><title>Analysis of recurrent neural network (RNN) dynamical regime.</title><p>(<bold>A</bold>) Contour map of convergence time across the full gain by Δinput parameter space averaged across 100 initialisations with random initial conditions. Example parameter trajectories shown in white for high and low γ trials. (<bold>B</bold>) Contour map of convergence proportion across the full parameter space. (<bold>C–E</bold>) Example dynamics with gain = 1.1 and Δinput ≈ [1, 0],[. 5, .5], and [0,1] r, respectively. (<bold>F–H</bold>) Example dynamics with gain = 1.5 and Δinput ≈ [1, 0],[. 5, .5], and[0,1] , respectively.</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig3-v1.tif"/></fig><fig id="fig3s1" position="float" specific-use="child-fig"><label>Figure 3—figure supplement 1.</label><caption><title>Example network dynamics initialised with parameter values well inside the oscillatory regime (<inline-formula><alternatives><mml:math id="inf25"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>u</mml:mi><mml:mo>≈</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:mn>.5</mml:mn><mml:mspace width="thinmathspace"/><mml:mn>.5</mml:mn></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math><tex-math id="inft25">\begin{document}$u\approx \left [.5\, .5\right ]$\end{document}</tex-math></alternatives></inline-formula>, gain = 1.5) with initial conditions determined by the selectivity of each unit.</title><p>Excitatory units selective for <inline-formula><alternatives><mml:math id="inf26"><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft26">\begin{document}$u_{1}$\end{document}</tex-math></alternatives></inline-formula>, and the associated inhibitory units, were fully activated. Excitatory units selective for <inline-formula><alternatives><mml:math id="inf27"><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft27">\begin{document}$u_{2}$\end{document}</tex-math></alternatives></inline-formula> (and the associated inhibitory units) were initially silenced. Example network conforms with our prediction displaying an out-of-phase oscillation where the initially dominant population is rapidly silenced and the competing population is boosted after a brief delay.</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig3-figsupp1-v1.tif"/></fig></fig-group><p>When uncertainty had a small impact on gain (low <inline-formula><alternatives><mml:math id="inf28"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft28">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula>), the network had a trajectory through an initial regime characterised by the rapid convergence to a fixed point where the population representing the initial stimulus dominated whilst the other was silent (<xref ref-type="fig" rid="fig3">Figure 3C</xref>), an uncertain regime characterised by oscillations with all neurons partially activated (<xref ref-type="fig" rid="fig3">Figure 3D</xref>), and after passing through the oscillatory regime, the network once again entered a (new) fix-point regime where the population representing the initial stimulus was silent whilst the other was dominant (<xref ref-type="fig" rid="fig3">Figure 3E</xref>).</p><p>For high <inline-formula><alternatives><mml:math id="inf29"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft29">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> trials, the network again started and finished in states characterised by rapid convergence to a fixed point representing the dominant input dimension (<xref ref-type="fig" rid="fig3">Figure 3F–H</xref>). However, it differed in how it transitioned between these states. Uncertain inputs generated high-amplitude oscillations, causing the network to flip-flop between active and silent states (<xref ref-type="fig" rid="fig3">Figure 3G</xref>). We hypothesised that, within the task, this mechanism silenced the initially dominant population, while boosting the competing population. To test this, we initialised each network with parameter values well inside the oscillatory regime (u ≈ [. 5 . 5], gain = 1.5) with initial conditions determined by the selectivity of each unit. Excitatory units selective for <italic>u</italic><sub><italic>1</italic></sub>, as well as the associated inhibitory units projecting to this population, were fully activated, whilst the excitatory units selective for <italic>u</italic><sub><italic>2</italic></sub> (and the associated inhibitory units) were silenced (and vice versa for u<sub>2</sub> → u<sub>1</sub>trials). As we predicted, when initialised in this state the network dynamics displayed an out-of-phase oscillation where the initially dominant population was rapidly silenced and the competing population was boosted after a brief delay (219 (ms), ±114; <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>).</p><p>At the population level, therefore, heightened gain at points of ambiguity accelerates perceptual switches by transiently pushing the dynamics into an unstable regime. This regime replaces the fixed-point attractor representing the input with an oscillatory regime that actively inhibits the currently dominant population and boosts the competing population, before transitioning back to a stable (approximate) fixed-point attractor representing the new stimulus (<xref ref-type="fig" rid="fig3">Figure 3F–H</xref> and <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>).</p></sec><sec id="s2-3"><title>Large-scale neural predictions of recurrent neural network model</title><p>Having confirmed the behavioural component of our gain modulation hypothesis in our model, and characterised both the circuit and population level mechanisms, we next sought to test our hypotheses that the speeding effect of uncertainty-driven gain on perceptual switches is mediated by a flattening of the energy landscape traversed by the network dynamics. Crucially, translating the dynamics of the RNN into an energy-based framework also allowed us to generate a series of predictions that we could later test in functional neuroimaging data.</p><p>In recent work (<xref ref-type="bibr" rid="bib54">Munn et al., 2021</xref>, <xref ref-type="bibr" rid="bib84">Taylor et al., 2022</xref>), we have shown that peaks in BOLD within the LC precede large changes in brain state dynamics. Viewed through the lens of dynamical systems theory (<xref ref-type="bibr" rid="bib40">John et al., 2022</xref>) in which the brain is treated as a dynamical system whose state space (i.e. an instantaneous snapshot of the activity of all regions of the system) evolves over time shaped by the presence (or absence) of attractors, the effect of the LC can be conceptualised as akin to lowering the energy barrier required to escape a fixed-point attractor or as a transient injection of kinetic energy via an external force allowing the brain to reach a novel location in state-space (<xref ref-type="bibr" rid="bib54">Munn et al., 2021</xref>). Crucially, there are two complementary viewpoints from which we can construct an energy landscape; the first allocentric (i.e. third-person view) perspective quantifies the energy associated with each position in state space, whereas the second egocentric (i.e. first-person view) perspective quantifies the energy-associated relative changes independent of the direction of movement or the location in state space. The allocentric perspective is straightforwardly comparable to the potential function of a dynamical system but can only be applied to low-dimensional data in settings where a position-like quantity is meaningfully defined. The egocentric perspective is analogous to taking the point of view of a single particle in a physical setting and quantifying the energy associated with movement relative to the particle’s initial location. An egocentric framework is thus more applicable, when signal magnitude is relative rather than absolute (see ‘Methods and <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1</xref> for an intuitive explanation of the allocentric and egocentric energy landscape analysis on a toy dynamical system).</p><p>To characterise the energy landscape traversed by the network dynamics, we ran both time-resolved allocentric and egocentric energy landscape analyses. For the allocentric analysis, we first had to reduce the dimensionality of the RNN’s dynamics by performing a principal component analysis (PCA) on the concatenated activity of the network at gain = 1. The set of PCs was low-dimensional, with 80.58±6.34% of the variance explained by the first principal component (PC<sub>1</sub>). Based on this information, we projected the network activity on each trial and for each gain value and timepoint onto the first PC. The resultant low-dimensional trajectories all showed a change in direction around the timepoint of the switch in network output from category 1 to category 2 (and v.v.; <xref ref-type="fig" rid="fig4">Figure 4A</xref>). This recapitulates a system jumping between attractors, occurring earlier as a function of heightened gain associated with heightened values of <inline-formula><alternatives><mml:math id="inf30"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft30">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> (<xref ref-type="fig" rid="fig4">Figure 4A</xref>). This switch not only occurred sooner as a function of heightened gain, it also occurred at a higher neural ‘speed’ with the velocity of the trajectory peaking sharply at the point of the switch under high <inline-formula><alternatives><mml:math id="inf31"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft31">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula>, whereas the transition between states was comparatively gradual under low <inline-formula><alternatives><mml:math id="inf32"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft32">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> (<xref ref-type="fig" rid="fig4">Figure 4B</xref>).</p><fig-group><fig id="fig4" position="float"><label>Figure 4.</label><caption><title>Allocentric and egocentric energy landscape dynamics underlying the perceptual speeding effect of heightened gain.</title><p>(<bold>A</bold>) Example network trajectory projected onto PC<sub>1</sub> and averaged across trials for low (0.1; solid blue), medium (0.5; dotted green), and high (0.9; solid red) <inline-formula><alternatives><mml:math id="inf33"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft33">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> for the <inline-formula><alternatives><mml:math id="inf34"><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>→</mml:mo><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft34">\begin{document}$u_{1}\rightarrow u_{2}$\end{document}</tex-math></alternatives></inline-formula> condition. (<bold>B</bold>) (abs) Velocity of PC<sub>1</sub> trajectories across low (0.1), medium (0.5), and high (0.9) <inline-formula><alternatives><mml:math id="inf35"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft35">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula>. (<bold>C, D</bold>) Allocentric landscapes for low (0.1; blue) and high (0.9; red) <inline-formula><alternatives><mml:math id="inf36"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft36">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> conditions. Trial-averaged PC<sub>1</sub> trajectory shown in black. For purposes of visualisation energy, values &gt; 6 are set to a constant value. (<bold>E, F</bold>) Egocentric landscapes for low (0.1; blue) and high (0.9; red) <inline-formula><alternatives><mml:math id="inf37"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft37">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> conditions. (<bold>G</bold>) (Allocentric) neural work for low (0.1), medium (0.5), and high (0.9) <inline-formula><alternatives><mml:math id="inf38"><mml:mi>γ</mml:mi><mml:mo>,</mml:mo></mml:math><tex-math id="inft38">\begin{document}$\gamma ,$\end{document}</tex-math></alternatives></inline-formula> averaged across networks and conditions. (<bold>H</bold>) Egocentric AUC for low (0.1), medium (0.5), and high (0.9) <inline-formula><alternatives><mml:math id="inf39"><mml:mi>γ</mml:mi><mml:mo>,</mml:mo></mml:math><tex-math id="inft39">\begin{document}$\gamma ,$\end{document}</tex-math></alternatives></inline-formula> averaged across networks and conditions. Note that the time series represent simulations from a model with low noise, and hence did not require error bars.</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig4-v1.tif"/></fig><fig id="fig4s1" position="float" specific-use="child-fig"><label>Figure 4—figure supplement 1.</label><caption><title>Energy landscape analyses.</title><p>Top row: time series generated from a (super critical) pitchfork bifurcation <inline-formula><alternatives><mml:math id="inf40"><mml:mover accent="true"><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo>˙</mml:mo></mml:mover><mml:mo>=</mml:mo><mml:mi>α</mml:mi><mml:mi>x</mml:mi><mml:mo>−</mml:mo><mml:msup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mn>3</mml:mn></mml:mrow></mml:msup></mml:math><tex-math id="inft40">\begin{document}$\overset{˙}{x}=\alpha x- x^{3}$\end{document}</tex-math></alternatives></inline-formula> with <inline-formula><alternatives><mml:math id="inf41"><mml:mi>α</mml:mi><mml:mo>=</mml:mo><mml:mn>0.25</mml:mn></mml:math><tex-math id="inft41">\begin{document}$\alpha =0.25$\end{document}</tex-math></alternatives></inline-formula> (red left) and <inline-formula><alternatives><mml:math id="inf42"><mml:mi>α</mml:mi><mml:mo>=</mml:mo><mml:mn>0.75</mml:mn></mml:math><tex-math id="inft42">\begin{document}$\alpha =0.75$\end{document}</tex-math></alternatives></inline-formula> (blue right), respectively, simulated in the presence of noise (<inline-formula><alternatives><mml:math id="inf43"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>σ</mml:mi><mml:mo>=</mml:mo><mml:mn>0.25</mml:mn></mml:mrow></mml:mstyle></mml:math><tex-math id="inft43">\begin{document}$\sigma =0.25$\end{document}</tex-math></alternatives></inline-formula>).</p><p>Second row: the potential <inline-formula><alternatives><mml:math id="inf44"><mml:mi>V</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:mo>−</mml:mo><mml:mrow><mml:mo stretchy="false">∫</mml:mo><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo>˙</mml:mo></mml:mover></mml:mrow></mml:mrow><mml:mi>d</mml:mi><mml:mi>x</mml:mi></mml:math><tex-math id="inft44">\begin{document}$V\left (x\right)=- \int \overset{˙}{x}dx$\end{document}</tex-math></alternatives></inline-formula> for each dynamical system. Third row: allocentric landscape recovers the shape of the (analytic) potential with the depth and minima of each energy well scaling with <inline-formula><alternatives><mml:math id="inf45"><mml:mi>α</mml:mi></mml:math><tex-math id="inft45">\begin{document}$\alpha $\end{document}</tex-math></alternatives></inline-formula>. Fourth row: shallow and deep potentials are associated with high and low energy for large MSD values (respectively). Fifth row left: egocentric landscape with <inline-formula><alternatives><mml:math id="inf46"><mml:mi>α</mml:mi><mml:mo>=</mml:mo><mml:mn>0.25</mml:mn></mml:math><tex-math id="inft46">\begin{document}$\alpha =0.25$\end{document}</tex-math></alternatives></inline-formula> minus egocentric landscape with <inline-formula><alternatives><mml:math id="inf47"><mml:mi>α</mml:mi><mml:mo>=</mml:mo><mml:mn>0.75</mml:mn></mml:math><tex-math id="inft47">\begin{document}$\alpha =0.75$\end{document}</tex-math></alternatives></inline-formula>. X and Y axes have been reversed for visual interpretability. Fifth row right: energy under the curve for each landscape obtained by summing over time.</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig4-figsupp1-v1.tif"/></fig></fig-group><p>With a low-dimensional description of our data in hand, we leveraged the relationship between probability and energy in statistical mechanics to construct a measure of the allocentric energy landscape (<xref ref-type="fig" rid="fig4">Figure 4C and D</xref>) traversed by the low-dimensional dynamics (<inline-formula><alternatives><mml:math id="inf48"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>C</mml:mi><mml:mn>1</mml:mn><mml:mi>τ</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>l</mml:mi><mml:mi>n</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>P</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>P</mml:mi><mml:mi>C</mml:mi><mml:mn>1</mml:mn><mml:mi>τ</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mfrac><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math><tex-math id="inft48">\begin{document}$E_{PC1\tau }=ln\left (\frac{1}{P\left (PC1\tau \right)}\right)$\end{document}</tex-math></alternatives></inline-formula>; see ‘Methods’ for derivation) with a window size of <inline-formula><alternatives><mml:math id="inf49"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>τ</mml:mi><mml:mo>=</mml:mo><mml:mn>250</mml:mn><mml:mspace width="thinmathspace"/><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">s</mml:mi></mml:mrow></mml:mstyle></mml:math><tex-math id="inft49">\begin{document}$\tau =250\,\rm ms$\end{document}</tex-math></alternatives></inline-formula>. Across values of <inline-formula><alternatives><mml:math id="inf50"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>γ</mml:mi></mml:mrow></mml:mstyle></mml:math><tex-math id="inft50">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula>, this revealed a potential-like energy landscape with a minimum that evolved with the currently dominant input dimension. To quantify the effect of gain mediated changes on the allocentric energy landscape, we devised a measure – neural work – of the ‘force’ exerted on the low-dimensional trajectory by the vector field quantified by allocentric energy landscape at each time point in the trial <inline-formula><alternatives><mml:math id="inf51"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>W</mml:mi><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mo>−</mml:mo><mml:mi>d</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:mfrac><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mstyle></mml:math><tex-math id="inft51">\begin{document}$W_{t}=\frac{- dE_{t}}{dx}s_{t}$\end{document}</tex-math></alternatives></inline-formula>. Where <inline-formula><alternatives><mml:math id="inf52"><mml:msub><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft52">\begin{document}$s_{t}$\end{document}</tex-math></alternatives></inline-formula> is the displacement of the PC trajectory in each window, and <inline-formula><alternatives><mml:math id="inf53"><mml:mfrac><mml:mrow><mml:mi>d</mml:mi><mml:msub><mml:mrow><mml:mi>E</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:mfrac></mml:math><tex-math id="inft53">\begin{document}$\frac{dE_{t}}{dx}$\end{document}</tex-math></alternatives></inline-formula> is the gradient of the energy values computed between the start and end of each window. We found that increasing gain (via increasing <inline-formula><alternatives><mml:math id="inf54"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft54">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula>) increased the magnitude of work done at turning points of the trajectory analogous to the application of an external force (<xref ref-type="fig" rid="fig4">Figure 4G</xref>; and equivalent to a change in the dynamical velocity of the landscape, accelerating the change from one perceptual interpretation to another).</p><p>Although explanatory useful in understanding the operation of the RNN, the allocentric landscape is not straightforwardly applicable to non-invasive neuroimaging data. In order to compare our network dynamics to neuroimaging data, and with previous work from our group, we inferred an estimate of the egocentric energy landscape (<xref ref-type="fig" rid="fig4">Figure 4E and F</xref>) traversed by the dynamics. Specifically, we calculated the mean-squared displacement <inline-formula><alternatives><mml:math id="inf55"><mml:msub><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:mi>D</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mfenced open="⟨" close="⟩" separators="|"><mml:mrow><mml:msup><mml:mrow><mml:mfenced open="|" close="|" separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>τ</mml:mi></mml:mrow></mml:msub><mml:mo>−</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft55">\begin{document}$MSD_{t,t_{0}}=\left \langle \left |x_{t_{0}+\tau }- x_{t_{0}}\right |^{2}\right \rangle _{n}$\end{document}</tex-math></alternatives></inline-formula> of the firing rate of each unit in the RNN in steps of <inline-formula><alternatives><mml:math id="inf56"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>τ</mml:mi><mml:mo>=</mml:mo><mml:mn>250</mml:mn><mml:mspace width="thinmathspace"/><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">s</mml:mi></mml:mrow></mml:mstyle></mml:math><tex-math id="inft56">\begin{document}$\tau =250\,\rm ms$\end{document}</tex-math></alternatives></inline-formula>, and as we did with the allocentric analysis, calculated the probability – and from this the energy <inline-formula><alternatives><mml:math id="inf57"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:mi>D</mml:mi><mml:mo>,</mml:mo><mml:mi>τ</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>l</mml:mi><mml:mi>n</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>P</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>D</mml:mi><mml:mrow><mml:mi>τ</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mfrac><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math><tex-math id="inft57">\begin{document}$E_{MSD,\tau }=ln\left (\frac{1}{P\left (MSD_{\tau }\right)}\right)$\end{document}</tex-math></alternatives></inline-formula> – associated with each MSD value and time step. In line with our hypothesis, and with previous work from our group, the energy required for large movements in state space (i.e. large MSD values) decreased as a function of <inline-formula><alternatives><mml:math id="inf58"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft58">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> (<xref ref-type="fig" rid="fig4">Figure 4E and F</xref>) analogous to the application of an external force transiently increasing the kinetic energy of a particle. To quantify the degree of flattening, we calculated the area under the curve across values of <inline-formula><alternatives><mml:math id="inf59"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft59">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> showing a substantial reduction in the energy associated with large MSD values as a function of heightened <inline-formula><alternatives><mml:math id="inf60"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft60">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> (and therefore gain; <xref ref-type="fig" rid="fig4">Figure 4H</xref>).</p><p>These results reinforce our previous work and clearly demonstrate that the implementation of neuromodulatory-mediated dynamics in the RNN acted in a similar fashion to previously observed patterns in resting-state fMRI (<xref ref-type="bibr" rid="bib15">Cisek, 2019</xref>). In addition, our results confirm that the putative impact of the release of noradrenaline from the LC can change the manner in which brain states evolve over time, facilitating the navigation of otherwise difficult state transitions (<xref ref-type="bibr" rid="bib15">Cisek, 2019</xref>).</p></sec><sec id="s2-4"><title>Low-dimensional signature of ambiguity resolution and perceptual change</title><p>Having confirmed our hypothesis about the speeding effect of gain in our RNN model, we next sought to test the predictions in the human brain – that is, examining whether the increase in neural speed and the flattening of the energy landscape observed in the RNN were also present in functional neuroimaging data. To this end, we re-analysed an existing BOLD dataset collected while participants performed a similar version of the ambiguous figures task to identify the low-dimensional patterns that occur during the perceptual change.</p><p>We were, however, left with a dilemma: RNNs provide a proof-in-principle of how computations can be instantiated in neural networks; however, there are key differences between artificial neural networks and the human brain that require careful consideration (<xref ref-type="bibr" rid="bib66">Richards et al., 2019</xref>; <xref ref-type="bibr" rid="bib23">Doerig et al., 2023</xref>). While both RNNs and the brain are thought to compute through dynamics (<xref ref-type="bibr" rid="bib91">Vyas et al., 2020</xref>), the human brain is comprised of highly specialised neural circuits that have been shaped over evolutionary time to perform a range of highly idiosyncratic functions that matter for adaptive behaviour (<xref ref-type="bibr" rid="bib91">Vyas et al., 2020</xref>), but are not necessarily related to task-switching. So where in the brain should we look for the same low-dimensional signatures we observed in the RNN as a function of gain? Rather than select a particular region a priori, we instead opted for a data-driven approach – PCA – which summarises regional time series concatenated across all subjects and trials into a set of low-dimensional patterns that can then be interrogated in a similar fashion to the activity of the RNN (see ‘Methods’ for details). Consistent with previous work (<xref ref-type="bibr" rid="bib76">Shine et al., 2019</xref>), a small number of PCs mapped onto distributed regions across the brain (<xref ref-type="fig" rid="fig5">Figure 5A</xref>) and explained a substantial proportion of the variance observed in the task (PC<sub>1-3</sub> explained 32% of the total variance).</p><fig-group><fig id="fig5" position="float"><label>Figure 5.</label><caption><title>Low-dimensional switch-related dynamics and connectivity.</title><p>(<bold>A</bold>) Spatial loadings of PC<sub>1</sub> (green), PC<sub>2</sub> (red), and PC<sub>3</sub> (blue). (<bold>B</bold>) Mean absolute β loading (solid lines) and group standard error (shaded) of PC<sub>1</sub> (green), PC<sub>2</sub> (red), and PC<sub>3</sub> (blue), organised around the image switch point (Δ) – the dotted grey lines show the 95th percentile of the null distribution of a block-resampling permutation. (<bold>C</bold>) Radar plot showing the partial correlations of PC<sub>1</sub> (green), PC<sub>2</sub> (red), and PC<sub>3</sub> (blue). (<bold>D</bold>) Evoked brain activity of PC<sub>2</sub> + PC<sub>3</sub> during the perceptual switch. (<bold>E</bold>) Group averaged functional connectivity and module assignments using a Louvain analysis – three clusters were observed. (<bold>F</bold>) Pearson’s correlation between the sum of PC<sub>2</sub> and PC<sub>3</sub> (per subject) and a joint-histogram comparing Integration (participation coefficient) and segregation (module-degree Z-score); p&lt;0.05 following permutation testing.</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig5-v1.tif"/></fig><fig id="fig5s1" position="float" specific-use="child-fig"><label>Figure 5—figure supplement 1.</label><caption><title>Energy landscape analyses.</title><p>(<bold>A</bold>) Pearson’s correlation between each PCs and the evoked brain activity at the perceptual switch (β values), dashed line at PC<sub>2</sub>. (<bold>B</bold>) Pearson’s correlation between the inverted brain maps using βPC (PC<sub>(1-i)</sub> × βPC<sub>(1-i)</sub>). Dashed line shows that the correlation gets to 94% using the first three PCs (Pearson’s <italic>r</italic>=0.94, p&lt;0.001).</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig5-figsupp1-v1.tif"/></fig></fig-group><p>To isolate the low-dimensional component that best reflected the task (<xref ref-type="fig" rid="fig1">Figure 1A</xref>), we performed a principal component regression (<xref ref-type="bibr" rid="bib41">Jolliffe, 1982</xref>) that modelled the switch point of each trial using the loadings of the top 3 PCs calculated from fMRI data. PC<sub>1</sub> was not selectively aligned with switches, both PC<sub>2</sub> and PC<sub>3</sub> showed a pronounced, isolated peak around the switch point across trials (<xref ref-type="fig" rid="fig5">Figure 5B</xref>), with PC<sub>2</sub> showing the most robust task-related engagement (<xref ref-type="fig" rid="fig5">Figure 5B</xref> and <xref ref-type="fig" rid="fig5s1">Figure 5—figure supplement 1</xref>). To ensure that these results could not be explained by the spatial autocorrelation inherent within the PC maps, we created a null distribution of regression coefficients calculated using the same statistical model but with block-resampling applied to the switch times in the design matrix. The dotted grey line in <xref ref-type="fig" rid="fig5">Figure 5B</xref> denotes the 95th percentile of the null distribution, and clearly shows that the engagement of both PC<sub>2</sub> and PC<sub>3</sub> during the switch point was greater than to be expected by chance. Furthermore, to validate that the perceptual switch was predominantly represented by PC<sub>2</sub> and PC<sub>3</sub> (<xref ref-type="fig" rid="fig5">Figure 5D</xref>), we conducted a regression with these two PCs as predictors and the evoked activity derived from the original BOLD time series as the dependent variable. The resulting variance accounted for was 88% (R<sup>2</sup>=0.88, <italic>β</italic>=0.99, p=9.2 × 10<sup>–178</sup>).</p><p>To determine whether PC<sub>2</sub> or PC<sub>3</sub> was a better index of perceptual switching, we then correlated the spatial loadings of PC<sub>2</sub> and PC<sub>3</sub> with the spatial map associated with the term ‘switching’ from a meta-analysis performed on the <italic>neurosynth</italic> database (<xref ref-type="bibr" rid="bib101">Yarkoni et al., 2011</xref>). We observed a significant positive correlation between the map for ‘switching’ and both PC<sub>2</sub> (<italic>r</italic>=0.453, p=3.041 × 10<sup>–18</sup>) and PC<sub>3</sub> (<italic>r</italic>=0.115, p=0.037); however, the correlation for PC<sub>3</sub> was much lower than PC<sub>3,</sub> suggesting that PC<sub>2</sub> was a better match for ‘switching’. The spatial map of PC<sub>2</sub> was also positively correlated with other terms putatively associated with the ambiguous figures task (notably, ‘effort’, ‘load’, and ‘attention’; all <italic>r</italic>&gt;0.2; and not with ‘episodic’, which was included as a negative control), a partial correlation analysis revealed that PC<sub>2</sub> was selectively associated with ‘switching’ and ‘attention’ (<xref ref-type="fig" rid="fig5">Figure 5C</xref>). Given the multifaceted nature of the ambiguous figures task, the convergence between brain maps for ‘switching’, ‘attention’, and ‘effort’ was to be expected, and we therefore did not try to dissociate them in further analysis.</p><p>Before turning to the predictions of the RNN, we first sought to validate the face validity of focusing on a limited number of principal components. In previous work, we have linked the impacts of NA on systems-level neural dynamics to alterations in network topology (<xref ref-type="bibr" rid="bib54">Munn et al., 2021</xref>; <xref ref-type="bibr" rid="bib74">Shine et al., 2018</xref>; <xref ref-type="bibr" rid="bib73">Shine et al., 2016</xref>), with NA increasing large-scale network integration. Given that PCA naturally captures patterns of covariance between regions, we expected to see that the observed time signatures of PC engagement at the switch point should coincide with similar measures of network integration. To test this hypothesis, we clustered the time-averaged functional connectivity matrix using a hierarchical modular decomposition approach (see ‘Methods’) – doing so revealed three main clusters (<xref ref-type="fig" rid="fig5">Figure 5E</xref>). For each participant, we used this matrix and the three clusters to estimate the amount of integration (using the participation coefficient) and segregation (using the module-degree Z-score, see ‘Methods’) of each region. We then correlated a joint histogram of these measures with the sum of subject-specific regression coefficients for PC<sub>2</sub> and PC<sub>3</sub> and observed a robust correlation with integration (<xref ref-type="fig" rid="fig5">Figure 5F</xref>; p&lt;0.05 following permutation testing). These results clearly demonstrate the highly convergent nature of PCA and our previous network-based approaches.</p></sec><sec id="s2-5"><title>Confirmation of model predictions in whole-brain BOLD data</title><p>Based on the patterns observed in the RNN (i.e. those in <xref ref-type="fig" rid="fig2">Figures 2</xref>—<xref ref-type="fig" rid="fig4">4</xref>), we hypothesised that the energy landscape topography would decrease, and the velocity of the low-dimensional brain patterns would peak at the switch point. Given the prominent role in switching, we focused our analysis on the PC<sub>2</sub> time series. To estimate the (egocentric) energy landscape, we first estimated the mean displacement of PC<sub>2</sub> by averaging the β value around the switch point and then divided this term by the logarithm of the inverse probability of the loading of PC<sub>2</sub>, which was also inferred from the GLM. Using this approach, we observed that PC<sub>2</sub> was maximally displaced at the perceptual change, suggesting that the brain state showed a substantial shift from baseline during the perceptual change. Energy (log[1/<italic>p<sub>switch</sub></italic>]; see ‘Methods’) showed a U-shaped pattern around the perceptual change point – that is, with a minimum value in the perceptual change along with the first and last images (<xref ref-type="fig" rid="fig6">Figure 6B–D</xref>). To relate this measure to the energy landscape framework, and to control by the specific displacement occurring at each image, we then calculated the ratio between energy and the mean displacement (i.e. energy landscape ’depth’; <xref ref-type="fig" rid="fig6">Figure 6A</xref>). As predicted, the brain state reduced the amount of energy per displacement towards its minimum around the perceptual change (<xref ref-type="fig" rid="fig6">Figure 6B</xref>). We interpret this set of results as the system flattening the energy landscape, reducing the energy (i.e. higher system changes become more common) required for large displacement values, effectively generating a ‘network reset’ (<xref ref-type="bibr" rid="bib70">Sara, 2009</xref>; <xref ref-type="bibr" rid="bib10">Bouret and Sara, 2005</xref>; <xref ref-type="bibr" rid="bib71">Sara, 2015</xref>) of the brain state, which ultimately facilitated an updating of the content of perception.</p><fig id="fig6" position="float"><label>Figure 6.</label><caption><title>Confirmation of model predictions in whole-brain BOLD data.</title><p>(<bold>A</bold>) analysis of the recurrent neural network (RNN) also predicted that the energy landscape dictating the likelihood of state transitions should be flat (i.e. have a small attractor depth) at the switch point. (<bold>B</bold>) The energy landscape was demonstratively flatter (quantified as surprisal over brain activity displacement) at the switch point. (<bold>C</bold>) By interrogating the low-dimensional trajectories in the RNN, we predicted that there should be a peak in the gradient of the loadings in principal component space at the switch point between output #1 and output #2. (<bold>D</bold>) The gradient (Δx<sub>PC</sub>) of the β loading of PC<sub>2</sub> as a function of the switch point.</p></caption><graphic mimetype="image" mime-subtype="tiff" xlink:href="elife-93191-fig6-v1.tif"/></fig><p>To analyse speed-evoked changes in brain trajectories, we used a GLM to analyse each PC time series as a function of each perceptual switch. Our design matrix included the first and last images seen in each set, along with the three images leading up to the switch, the switch trial itself and the three images following the switch (see ‘Methods’ for details). This approach thus allowed us to track the low-dimensional signature of the brain through the processing and resolution of perceptual ambiguity. As predicted (<xref ref-type="fig" rid="fig6">Figure 6C</xref>), we found evidence that PC<sub>2</sub> showed a peak in velocity at the change point (<xref ref-type="fig" rid="fig6">Figure 6D</xref>) providing confirmatory evidence that the low-dimensional brain state dynamics observed in whole-brain fMRI were highly similar to those observed in the trained RNN.</p></sec></sec><sec id="s3" sec-type="discussion"><title>Discussion</title><p>Here, we studied the relationship between the ascending arousal system, low-dimensional neuronal trajectories and energy landscape dynamics during a perceptual switch task. Our results provide evidence that the ascending arousal system is involved in the modulation of dynamic brain state topography during task-relevant perceptual switches. We found that pupil diameter tracked with ambiguity of task stimuli and was directly related to the speed of perceptual switches (<xref ref-type="fig" rid="fig1">Figure 1</xref>). Next, we confirmed that this process could be replicated in an RNN Model (<xref ref-type="fig" rid="fig2">Figure 2</xref>) of perceptual change detection where the gain of the activation function was updated dynamically by the uncertainty of the network’s classification output (<xref ref-type="fig" rid="fig2">Figures 2</xref> and <xref ref-type="fig" rid="fig3">3</xref>). We then used this model to generate two key predictions: around the time of the perceptual switch brain state velocity should peak, and the egocentric energy landscape should flatten which we confirmed in neuroimaging data (<xref ref-type="fig" rid="fig4">Figures 4</xref>—<xref ref-type="fig" rid="fig6">6</xref>). Together, these results suggest that the ascending arousal system facilitates state changes in the content of perception by transiently increasing neural gain – acting in a manner analogous to an external forcing function transiently increasing kinetic energy in the system – flattening the ego-centric energy landscape and thereby reducing the energy needed to reset the system topography in an adaptive and task-dependent manner.</p><p>The relationship between perception and pupil diameter found here is consistent with the role of the ascending neuromodulation in cognition and attention (<xref ref-type="bibr" rid="bib3">Aston-Jones and Cohen, 2005</xref>; <xref ref-type="bibr" rid="bib94">Wainstein et al., 2022</xref>). For instance, the LC dynamically changes its activity according to external and cognitive demands imposed on the system (<xref ref-type="bibr" rid="bib43">Joshi et al., 2016</xref>; <xref ref-type="bibr" rid="bib3">Aston-Jones and Cohen, 2005</xref>; <xref ref-type="bibr" rid="bib94">Wainstein et al., 2022</xref>; <xref ref-type="bibr" rid="bib48">Liu et al., 2017</xref>; <xref ref-type="bibr" rid="bib57">Nieuwenhuis et al., 2005</xref>). Importantly, our results extend these findings by suggesting a more precise role for LC-mediated alterations in neural gain. Specifically based on the pupil dynamics in our task and previous experimental and theoretical work, we hypothesised that neural gain should change dynamically as a function of uncertainty (operationalised here as perceptual ambiguity) via the recruitment of the LC (along with other structures in the ascending arousal system), which then subsequently increases brain-wide communication by increasing the gain in targeted brain regions (<xref ref-type="bibr" rid="bib77">Shine et al., 2021</xref>; <xref ref-type="bibr" rid="bib56">Murphy et al., 2016</xref>; <xref ref-type="bibr" rid="bib74">Shine et al., 2018</xref>; <xref ref-type="bibr" rid="bib57">Nieuwenhuis et al., 2005</xref>). In the pupillometry data, pupil diameter (which is an indirect marker of the noradrenergic system; <xref ref-type="bibr" rid="bib83">Szabadi, 2018</xref>; <xref ref-type="bibr" rid="bib44">Joshi and Gold, 2020</xref>) increased as a function of perceptual ambiguity, which rose sharply in the few images prior to the reported perceptual change (<xref ref-type="fig" rid="fig1">Figure 1D</xref>). Based upon this finding, we then implemented an analogous mechanism in our pretrained RNN by making gain depend upon the entropy of the network’s classification which acted as a forcing function transiently increasing gain when the input became ambiguous, which, in line with our hypothesis, lead to earlier perceptual switches. We chose to use an RN instead of a simpler (more transparent) model as we wanted to use the RNN as a means of both hypothesis generation and hypothesis testing. Specifically, unlike more standard neuronal models which are handcrafted to reproduce a specific effect, when building an RNN the modeller only specifies the network inputs, labels, and the parameter constraints (e.g. Dale’s law) in advance. The dynamics of the RNN are entirely determined by optimisation. Post-training manipulations of the RNN are not built in, or in any way guaranteed to work, making them more analogous to experimental manipulations of an approximately task-optimal brain-like system. Confirmatory results are arguably, therefore, a first step towards an in vitro experimental test.</p><p>Thus, we provide early empirical and computational evidence that ascending neuromodulatory activity facilitates state changes in perception under conditions of perceptual ambiguity (<xref ref-type="bibr" rid="bib55">Murphy et al., 2014</xref>; <xref ref-type="bibr" rid="bib17">de Gee et al., 2014</xref>; <xref ref-type="bibr" rid="bib18">de Gee et al., 2017</xref>) when a stimulus is task relevant. Importantly, we do not expect that our results will generalise to experimental setting when a stimulus is not task relevant. We can make sense of this computationally by imagining the gain dynamics in our model if we added in a second task-irrelevant condition where at the beginning of each trial the model was given a cue indicating whether it would have to simply ‘maintain fixation’ or readout the category of the input. In the presence of the task-irrelevant cue, the model would read out the ‘maintain fixation’ action with high certainty and thus not ramp up gain. We hypothesise therefore that the pupil dynamics observed in the task will depend on participants’ task set. Indeed, there is evidence from a recent multistable perception experiment showing that arousal-related changes in pupil dilation disappear when the stimulus is not task-relevant. The authors of the study attribute the arousal-dependent pupil dilation to task execution. This explanation, however, could not explain the ramping of pupil diameter in our task where the participants perform an action on every trial. Instead, based upon the workings of our computational model, we hypothesise that arousal-based changes in pupil diameter are driven by task-set-related uncertainty and thus will depend on task relevance rather than task execution per se.</p><p>A core neuroanatomical property of the LC noradrenergic system is that a relatively small number of neurons (~50,000 in an adult human) projects to almost all brain regions (<xref ref-type="bibr" rid="bib69">Samuels and Szabadi, 2008</xref>; <xref ref-type="bibr" rid="bib87">Totah et al., 2019</xref>). This organisation implies that the LC acts as a low-dimensional modulator of the much more high-dimensional cerebral cortex. Subtle changes in the activity of LC can have significant effects on how different brain regions communicate (<xref ref-type="bibr" rid="bib74">Shine et al., 2018</xref>; <xref ref-type="bibr" rid="bib94">Wainstein et al., 2022</xref>; <xref ref-type="bibr" rid="bib48">Liu et al., 2017</xref>; <xref ref-type="bibr" rid="bib102">Zerbi et al., 2019</xref>; <xref ref-type="bibr" rid="bib33">Hansen et al., 2022</xref>; <xref ref-type="bibr" rid="bib32">Hansen et al., 2021</xref>). The mechanism of gain modulation in our model was, likewise, dependent on a low-dimensional process, with the network output altering the gain uniformly across the full network. At a neuronal level, NA increases excitability by liberating intracellular calcium and opening (or closing) voltage-gated ions channels (<xref ref-type="bibr" rid="bib77">Shine et al., 2021</xref>; <xref ref-type="bibr" rid="bib94">Wainstein et al., 2022</xref>). In our model, this global increase in excitability increased the speed of perceptual switches by recruiting inhibitory units to more rapidly actively inhibit the population encoding the initially dominant stimulus. At a population level, the interaction between excitatory and inhibitory units led to the emergence of a gain-dependent oscillatory regime which suppresses the currently active population encoding the initially dominant stimulus and boosts the competing quiescent population. At the scale of the full network, the gain-mediated changes resemble the transient application of an external forcing function pushing the network trajectory in the direction of the new percept which, from the perspective of the allocentric landscape, manifests as a spike in neural work at turning points in the network’s low-dimensional trajectory, leading up to and following the perceptual switch. From the egocentric perspective, this is characterised by a flattening of the landscape analogous to an externally driven increase in kinetic energy making large changes in the location of a particle more likely.</p><p>In line with the predictions of the RNN in our analysis of the BOLD data, we showed that the velocity of the low- dimensional brain state trajectory most associated with perceptual switching increased significantly during the point of reported perceptual change in comparison (<xref ref-type="fig" rid="fig5">Figure 5B</xref>), which we interpret as the brain moving from one attractor to another (<xref ref-type="fig" rid="fig6">Figure 6A</xref>). Importantly, we showed that around the perceptual switch, the energy needed for each unit of change in brain state (i.e. displacement) is smaller than at other points in the task (<xref ref-type="fig" rid="fig6">Figure 6A and B</xref>). Under the (egocentric) energy landscape framework (<xref ref-type="bibr" rid="bib54">Munn et al., 2021</xref>; <xref ref-type="bibr" rid="bib84">Taylor et al., 2022</xref>), this tells us that the landscape is flattened, and the energy required to transition between states is reduced. Together with the pupillary findings (<xref ref-type="fig" rid="fig1">Figure 1</xref>), the computation model (<xref ref-type="fig" rid="fig2">Figures 2</xref>—<xref ref-type="fig" rid="fig4">4</xref>), and replication from former results (<xref ref-type="bibr" rid="bib54">Munn et al., 2021</xref>; <xref ref-type="bibr" rid="bib84">Taylor et al., 2022</xref>; <xref ref-type="fig" rid="fig5">Figure 5E and F</xref>), we propose that the ascending neuromodulatory system is responsible for the large-scale flattening of the egocentric energy landscape which facilitating changes in task-relevant perceptual content.</p><p>This work is not without limitations. First, the pupil diameter dataset and the fMRI analysis came from different participants, such that the link between the pupil diameter and the fMRI results is inherently indirect. Moreover, differences in task timing, structure, and instructions between the fMRI and pupil experiments add complexity to interpreting the results. For instance, the fMRI task includes jittered inter-trial intervals (ITIs) and catch trials, features absent in the pupil task, which presents a more rapid stimulus sequence. These differences may have influenced perceptual switch points and task behaviour across experiments. Additionally, the specificity of the pupil diameter as a marker of the LC activity is under active debate (<xref ref-type="bibr" rid="bib44">Joshi and Gold, 2020</xref>). For instance, there is evidence suggesting a role of the superior colliculus, the dorsal raphe nucleus, and central cholinergic system in driving pupil dilations (<xref ref-type="bibr" rid="bib75">Shine, 2019</xref>; <xref ref-type="bibr" rid="bib14">Cazettes et al., 2021</xref>; <xref ref-type="bibr" rid="bib91">Vyas et al., 2020</xref>; <xref ref-type="bibr" rid="bib76">Shine et al., 2019</xref>). Although there is uncertainty regarding whether these other nuclei are directly related to pupil dilation or only indirectly via their connections with other neural regions and nuclei. Despite this, we believe that our pupillometry dataset captures an important function of the noradrenergic system in cases of task-relevant perceptual ambiguity as there is strong evidence showing that pupil diameter is a reliable marker of noradrenergic activity during evoked cognitive tasks (<xref ref-type="bibr" rid="bib93">Wainstein et al., 2021</xref>; <xref ref-type="bibr" rid="bib102">Zerbi et al., 2019</xref>; <xref ref-type="bibr" rid="bib2">Alnæs et al., 2014</xref>; <xref ref-type="bibr" rid="bib39">Janitzky et al., 2015</xref>; <xref ref-type="bibr" rid="bib63">Reimer et al., 2014</xref>). Additionally, the sample size of our fMRI study makes it difficult to generalise our results. In spite of this, the converging evidence from the pupillometry dataset, the fMRI dataset, and the computational model supports the role of the ascending neuromodulation in mediating task-relevant perceptual switches. Future work is needed both in humans, with higher sample sizes utilising fMRI and eye-tracking recordings, as well as animal studies, to directly modulate and record the LC activity in a task manipulating perceptual uncertainty.</p><sec id="s3-1"><title>Conclusion</title><p>In summary, we provide computational and empirical evidence for the association between neuromodulation, pupil dilation, and (egocentric) energy landscape flattening in task-relevant perceptual switches. Our results strengthen our understanding of the neurobiological processes underpinning moment-by-moment adaptive changes to perception. Specifically, we suggest that the widespread excitatory projections of the noradrenergic arousal system mediate the systems-level reconfigurations of cortical network architecture (<xref ref-type="bibr" rid="bib87">Totah et al., 2019</xref>; <xref ref-type="bibr" rid="bib102">Zerbi et al., 2019</xref>) via uncertainty-driven alterations in neural gain. This suggests that more highly conserved features of the nervous system may play a role in driving task-relevant switches in the contents of perception.</p></sec></sec><sec id="s4" sec-type="methods"><title>Methods</title><sec id="s4-1"><title>Overview of empirical data</title><p>There were two independent groups analysed in this study: 35 subjects performed a perceptual decision-making perceptual task while pupil diameter was recorded; and a separate group of 17 subjects performed a version of the task adapted for the MRI scanner. Data are available at <ext-link ext-link-type="uri" xlink:href="https://github.com/ShineLabUSYD/AmbiguousFigures">https://github.com/ShineLabUSYD/AmbiguousFigures</ext-link> (copy archived at <xref ref-type="bibr" rid="bib98">Whyte et al., 2025</xref>).</p></sec><sec id="s4-2"><title>Perceptual task</title><p>Twenty picture sets were used in which line drawings of common objects morphed over 15 iterations into a different object (<xref ref-type="fig" rid="fig1">Figure 1A</xref>). Picture sets were selected from a larger set validated in an earlier study (<xref ref-type="bibr" rid="bib80">Stöttinger et al., 2016</xref>). In the original study, participants reported verbally what they saw by typing in the name of the object. This reporting method guaranteed that participants could freely indicate what they saw without being restricted by categories (e.g. forced choice). Picture sets for the current study were selected with the criterion that all sets were perceived categorically in the normative study (i.e. that the majority of participants in the normative study categorised each picture they saw as either the first object or second object in the set; <xref ref-type="bibr" rid="bib79">Stöttinger et al., 2015</xref>). Selecting only the categorically perceived image sets guaranteed that pictures in the middle of the morphing sequence were not simply ‘noisier' than pictures at the beginning or end. In other words, the ambiguous images were still easily categorised by participants as either object 1 or object 2. All images were a standard size (316 × 316 pixels) and were displayed on a white background. In addition, in the fMRI study, participants were presented with two kinds of control picture sets to ensure that they were responding to changes in the pictures in the set rather than simply to the position in the set (e.g. always switching after the eighth picture). In these control picture sets, a salient deviating picture was presented either after 3 pictures or after 13 pictures, resulting in an early or late abrupt shift. Those sets served as controls and were not analysed further.</p><p>The picture morphing task consisted of five experimental runs. We randomised the order in which the picture sets were presented in each run and kept this randomised order consistent across participants. Picture morphing in each picture set occurred over 15 discrete steps, each corresponding with the acquisition of a whole-brain image. In the fMRI experiment, each picture within a set was presented for 2 s. Pictures were randomly intermixed with eight inter-stimulus intervals (2, 4, 6, or 8 s) during which participants saw a fixation cross. In the eyetracking experiments, each picture was presented for 750 ms, followed by a fixation cross of 2 s. Participants provided their responses in the scanner using two buttons on a four-button Cedrus fibre optic system. In a two-alternative forced-choice task, participants were asked to press the first button when they ‘saw the first object' and the second button when they ‘saw the second object' – this ensured that there was not a motor confound present on only the switch trials. All participants were ignorant as to the identity of the second object in each picture set. At the end of each set of 15 images, the word END was presented for 2 s to indicate that the next picture set would begin shortly. Participants provided their responses in the fMRI scanner using a Cedrus fibre-optic response system with four buttons. For the two-alternative forced-choice task, participants were instructed to press the first button when they ‘saw the first object’ and the second button when they ‘saw the second object’. This design ensured that motor responses were not confounded with perceptual switches as responses occurred on both switch and non-switch trials. Importantly, participants were not informed about the identity of the second object in each picture set beforehand. At the end of each sequence of 15 images, the word 'END' was displayed for 2 s to signal the conclusion of that picture set and the imminent start of the next one.</p></sec><sec id="s4-3"><title>Participants</title><p>A total of 17 (six males) neurologically healthy participants with normal or corrected to normal vision took part in the fMRI study (mean age 27.65±8.01). Fifteen were right-hand dominant. A separate cohort of 35 participants performed the task while simultaneous pupil diameter was recorded using an eye tracker device (SR Research, 1000 Hz). None of the participants had a history of brain injury. Participants received $30 for their participation. All participants provided informed consent prior to participation. The research protocol was approved by the Office of Research Ethics at the University of Waterloo and the Tri-Hospital Research Ethics Board of the Region of Waterloo in Ontario, Canada.</p></sec><sec id="s4-4"><title>Pupillometry</title><p>Fluctuations in pupil diameter of the left eye were collected using an Eyelink 1000 (SR Research Ltd., Mississauga, Ontario, Canada), with a 1 kHz sampling frequency. Blinks, artefacts, and outliers were removed and linearly interpolated (<xref ref-type="bibr" rid="bib92">Wainstein et al., 2017</xref>). High-frequency noise was smoothed using a second-order 2.5 Hz low-pass Butterworth filter. To obtain the pupil diameter average profile, data from each participant were normalised across each trial (corresponding to the 15 consecutive image set). This allowed us to correct for low-frequency baseline changes without eliminating the load effect and baseline differences due to load manipulations (<xref ref-type="bibr" rid="bib12">Campos-Arteaga et al., 2020</xref>; <xref ref-type="bibr" rid="bib67">Rojas-Líbano et al., 2019</xref>).</p></sec><sec id="s4-5"><title>Recurrent neural network modelling</title><p>We used PyTorch (<xref ref-type="bibr" rid="bib60">Paszke, 2019</xref>) to implement and train 50 continuous-time RNNs that we constrained to respect Dale’s law (<inline-formula><alternatives><mml:math id="inf61"><mml:msub><mml:mrow><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>E</mml:mi><mml:mo>+</mml:mo><mml:mi>I</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft61">\begin{document}$N_{E+I}$\end{document}</tex-math></alternatives></inline-formula>=40, 80% excitatory  <inline-formula><alternatives><mml:math id="inf62"><mml:msub><mml:mrow><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft62">\begin{document}$N_{E}$\end{document}</tex-math></alternatives></inline-formula>= 32, and 20% inhibitory  <inline-formula><alternatives><mml:math id="inf63"><mml:msub><mml:mrow><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>I</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft63">\begin{document}$N_{I}$\end{document}</tex-math></alternatives></inline-formula>= 8) using the procedure set out in <xref ref-type="bibr" rid="bib100">Yang and Wang, 2020</xref>. The dynamics of each network evolved according to the following system of stochastic differential equations:<disp-formula id="equ2"><alternatives><mml:math id="m2"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mi>d</mml:mi><mml:mi>x</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>τ</mml:mi></mml:mfrac><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mo>−</mml:mo><mml:mi>x</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>t</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msup><mml:mi>r</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>t</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msup><mml:mi>u</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>t</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mi>d</mml:mi><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mi>d</mml:mi><mml:mi>W</mml:mi></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t2">\begin{document}$$\displaystyle dx=\frac{1}{\tau }\left (- x\left (t\right)+W^{rec}r\left (t\right)+W^{in}u\left (t\right)\right)dt+dW$$\end{document}</tex-math></alternatives></disp-formula></p><p>where <inline-formula><alternatives><mml:math id="inf64"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>x</mml:mi><mml:mo>∈</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>N</mml:mi><mml:mo>×</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft64">\begin{document}$x\in \mathbb{R}^{N\times 1}$\end{document}</tex-math></alternatives></inline-formula> represents the sub-threshold activation of each unit, <inline-formula><alternatives><mml:math id="inf65"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>u</mml:mi><mml:mo>∈</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:mo>×</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft65">\begin{document}$u\in \mathbb{R}^{2\times 1}$\end{document}</tex-math></alternatives></inline-formula> the external input into the network, <inline-formula><alternatives><mml:math id="inf66"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msup><mml:mo>∈</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mn>40</mml:mn><mml:mo>×</mml:mo><mml:mn>40</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft66">\begin{document}$W^{rec}\in \mathbb{R}^{40\times 40}$\end{document}</tex-math></alternatives></inline-formula> the recurrent weights, <inline-formula><alternatives><mml:math id="inf67"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msup><mml:mo>∈</mml:mo><mml:msup><mml:mrow><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow></mml:mrow><mml:mrow><mml:mn>40</mml:mn><mml:mo>×</mml:mo><mml:mn>2</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft67">\begin{document}$W^{in}\in {\mathbb R}^{40\times 2}$\end{document}</tex-math></alternatives></inline-formula> the input weights, and <inline-formula><alternatives><mml:math id="inf68"><mml:mi>τ</mml:mi></mml:math><tex-math id="inft68">\begin{document}$\tau $\end{document}</tex-math></alternatives></inline-formula> the time constant which we set to 100 ms. In addition to task input, each unit in the network was driven by a Weiner process <inline-formula><alternatives><mml:math id="inf69"><mml:mi>d</mml:mi><mml:mi>W</mml:mi></mml:math><tex-math id="inft69">\begin{document}$dW$\end{document}</tex-math></alternatives></inline-formula>. The subthreshold activation variable <inline-formula><alternatives><mml:math id="inf70"><mml:mi>x</mml:mi></mml:math><tex-math id="inft70">\begin{document}$x$\end{document}</tex-math></alternatives></inline-formula> was converted into a vector of instantaneous firing rates by applying a sigmoid function <inline-formula><alternatives><mml:math id="inf71"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>r</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mn>1</mml:mn><mml:mo>+</mml:mo><mml:msup><mml:mi>e</mml:mi><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mo>−</mml:mo><mml:mi>g</mml:mi><mml:mi>x</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:math><tex-math id="inft71">\begin{document}$r=\frac{1}{1+e^{\left (- gx\right)}}$\end{document}</tex-math></alternatives></inline-formula>, where <inline-formula><alternatives><mml:math id="inf72"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>g</mml:mi><mml:mo>∈</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mi>N</mml:mi><mml:mo>×</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft72">\begin{document}$g\in \mathbb{R} ^{N\times 1}$\end{document}</tex-math></alternatives></inline-formula> is a vector containing the gain control parameter of each unit’s activation function that was multiplied element wise with <inline-formula><alternatives><mml:math id="inf73"><mml:mi>x</mml:mi></mml:math><tex-math id="inft73">\begin{document}$x$\end{document}</tex-math></alternatives></inline-formula>. Network outputs <inline-formula><alternatives><mml:math id="inf74"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>z</mml:mi><mml:mo>∈</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:mo>×</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft74">\begin{document}$z\in \mathbb{R}^{2\times 1}$\end{document}</tex-math></alternatives></inline-formula> were given by a linear readout of the excitatory population’s firing rate <inline-formula><alternatives><mml:math id="inf75"><mml:mi>z</mml:mi><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msup><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft75">\begin{document}$z=W^{out}r_{E}$\end{document}</tex-math></alternatives></inline-formula>. Where <inline-formula><alternatives><mml:math id="inf76"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msup><mml:mo>∈</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mrow><mml:mi>E</mml:mi></mml:mrow></mml:msub><mml:mo>×</mml:mo><mml:mn>2</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft76">\begin{document}$W^{out}\in \mathbb{R} ^{N_{E}\times 2}$\end{document}</tex-math></alternatives></inline-formula>. The network’s choice at each time point was the maximum of the two-dimensional output <inline-formula><alternatives><mml:math id="inf77"><mml:mi>z</mml:mi></mml:math><tex-math id="inft77">\begin{document}$z$\end{document}</tex-math></alternatives></inline-formula>.</p><p>We imposed Dale’s law on the recurrent weights of the network by parametrising the weight matrix with a mask <inline-formula><alternatives><mml:math id="inf78"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msup><mml:mo>∈</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="double-struck">R</mml:mi></mml:mrow><mml:mrow><mml:mn>40</mml:mn><mml:mo>×</mml:mo><mml:mn>40</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft78">\begin{document}$W^{mask}\in \mathbb{R}^{40\times 40}$\end{document}</tex-math></alternatives></inline-formula>, which contained zeros in the leading diagonal (removing self-connections), +1 in all non-diagonal entries of the first 32 rows/columns, and -1 in the remaining eight rows/columns. We obtained the constrained recurrent weight matrix by multiplying the absolute value of the trained weights element wise with the mask <inline-formula><alternatives><mml:math id="inf79"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msup><mml:mo>=</mml:mo><mml:mrow><mml:mo>|</mml:mo><mml:msubsup><mml:mi>W</mml:mi><mml:mrow><mml:mi>p</mml:mi><mml:mi>l</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msubsup><mml:mo>|</mml:mo></mml:mrow><mml:mo>⨀</mml:mo><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft79">\begin{document}$W^{rec}=\left |W_{plastic}^{rec}\right |\bigodot W^{mask}$\end{document}</tex-math></alternatives></inline-formula>, thereby imposing an 80/20 E/I ratio. Similarly, we constrained the projection of the input to the network and the readout projection to be strictly positive by taking the absolute value of the trained input and output weights <inline-formula><alternatives><mml:math id="inf80"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msup><mml:mo>=</mml:mo><mml:mrow><mml:mo>|</mml:mo><mml:msubsup><mml:mi>W</mml:mi><mml:mrow><mml:mi>p</mml:mi><mml:mi>l</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msubsup><mml:mo>|</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math><tex-math id="inft80">\begin{document}$W^{in}=\left |W_{plastic}^{in}\right |$\end{document}</tex-math></alternatives></inline-formula>, <inline-formula><alternatives><mml:math id="inf81"><mml:msup><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msup><mml:mo>=</mml:mo><mml:mfenced open="|" close="|" separators="|"><mml:mrow><mml:msubsup><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>p</mml:mi><mml:mi>l</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced></mml:math><tex-math id="inft81">\begin{document}$W^{out}=\left |W_{plastic}^{out}\right |$\end{document}</tex-math></alternatives></inline-formula>.</p><p>Following standard practice (<xref ref-type="bibr" rid="bib100">Yang and Wang, 2020</xref>), we simulated the network by discretising the system using a Euler–Maruyama integration scheme, where <inline-formula><alternatives><mml:math id="inf82"><mml:mi>α</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>d</mml:mi><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>τ</mml:mi></mml:mrow></mml:mfrac></mml:math><tex-math id="inft82">\begin{document}$\alpha =\frac{dt}{\tau }$\end{document}</tex-math></alternatives></inline-formula>, and <inline-formula><alternatives><mml:math id="inf83"><mml:msub><mml:mrow><mml:mi>σ</mml:mi></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>0.01</mml:mn></mml:math><tex-math id="inft83">\begin{document}$\sigma _{rec}=0.01$\end{document}</tex-math></alternatives></inline-formula>.<disp-formula id="equ3"><alternatives><mml:math id="m3"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mi>x</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>t</mml:mi><mml:mo>+</mml:mo><mml:mi mathvariant="normal">Δ</mml:mi><mml:mi>t</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:mi>α</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mi>x</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>t</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:mi>α</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msup><mml:mi>r</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>t</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:msup><mml:mi>W</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msup><mml:mi>u</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>t</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:msub><mml:mi>σ</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:msqrt><mml:mi mathvariant="normal">Δ</mml:mi><mml:mi>t</mml:mi></mml:msqrt><mml:mi>N</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t3">\begin{document}$$\displaystyle x\left (t+\Delta t\right)=\left (1- \alpha \right)x\left (t\right)+\alpha \left (W^{rec}r\left (t\right)+W^{in}u\left (t\right)\right)+\sigma _{rec}\sqrt{\Delta t}N \left (0,1\right)$$\end{document}</tex-math></alternatives></disp-formula></p><p>Each network was trained by optimising <inline-formula><alternatives><mml:math id="inf84"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msubsup><mml:mi>W</mml:mi><mml:mrow><mml:mi>p</mml:mi><mml:mi>l</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft84">\begin{document}$W_{plastic}^{in}$\end{document}</tex-math></alternatives></inline-formula>, <inline-formula><alternatives><mml:math id="inf85"><mml:msubsup><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>p</mml:mi><mml:mi>l</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msubsup></mml:math><tex-math id="inft85">\begin{document}$W_{plastic}^{rec}$\end{document}</tex-math></alternatives></inline-formula>, and <inline-formula><alternatives><mml:math id="inf86"><mml:msubsup><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>p</mml:mi><mml:mi>l</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msubsup></mml:math><tex-math id="inft86">\begin{document}$W_{plastic}^{out}$\end{document}</tex-math></alternatives></inline-formula> to minimise a cross-entropy loss function through 1000 iterations of back propagation through time (<xref ref-type="bibr" rid="bib97">Werbos, 1990</xref>) with ADAM (<xref ref-type="bibr" rid="bib45">Kingma and Ba, 2015</xref>). Batches consisted of single trials which for our simple task (described below) was sufficient for each network to converge on near-perfect behavioural accuracy. All training was performed with the gain control parameter set to 1. Again following standard practice, we trained the networks with a relatively large time step of  <inline-formula><alternatives><mml:math id="inf87"><mml:mi>Δ</mml:mi><mml:mi>t</mml:mi></mml:math><tex-math id="inft87">\begin{document}$\Delta t$\end{document}</tex-math></alternatives></inline-formula> = 200 ms. Following training, to ensure numerical stability we exported the trained weights into MATLAB and simulated the system with a bespoke numerical integration scheme with <inline-formula><alternatives><mml:math id="inf88"><mml:mi>Δ</mml:mi><mml:mi>t</mml:mi></mml:math><tex-math id="inft88">\begin{document}$\Delta t$\end{document}</tex-math></alternatives></inline-formula> set 1ms.</p><p>The task consisted of a simple change detection paradigm analogous to the task performed by our human participants. Specifically, at each time point the network was fed a two-dimensional input <inline-formula><alternatives><mml:math id="inf89"><mml:mi>u</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mfenced open="[" close="]" separators="|"><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>u</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msup></mml:math><tex-math id="inft89">\begin{document}$u\left (t\right)=\left [\begin{array}{cc}u_{1} &amp; u_{2}\end{array}\right ]^{T}$\end{document}</tex-math></alternatives></inline-formula>, with each column representing the ‘sensory evidence’ for each of the two stimulus categories. The task lasted for 1 s of simulation time beginning with maximum evidence for one of the two categories <inline-formula><alternatives><mml:math id="inf90"><mml:mi>u</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mfenced open="[" close="]" separators="|"><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msup></mml:math><tex-math id="inft90">\begin{document}$u\left (t\right)=\left [\begin{array}{cc}1 &amp; 0\end{array}\right ]^{T}$\end{document}</tex-math></alternatives></inline-formula> and over the course of each trial changed linearly such so that at the half-way point of the simulation the sensory evidence for each stimulus category changed was perfectly matched category <inline-formula><alternatives><mml:math id="inf91"><mml:mi>u</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mfenced open="[" close="]" separators="|"><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mo>.</mml:mo><mml:mn>5</mml:mn></mml:mtd><mml:mtd><mml:mo>.</mml:mo><mml:mn>5</mml:mn></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msup></mml:math><tex-math id="inft91">\begin{document}$u\left (t\right)=\left [\begin{array}{cc}.5 &amp; .5\end{array}\right ]^{T}$\end{document}</tex-math></alternatives></inline-formula> and by the final time step consisted of maximum evidence for the second stimulus category <inline-formula><alternatives><mml:math id="inf92"><mml:mi>u</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mfenced open="[" close="]" separators="|"><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mn>0</mml:mn></mml:mtd><mml:mtd><mml:mn>1</mml:mn></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msup></mml:math><tex-math id="inft92">\begin{document}$u\left (t\right)=\left [\begin{array}{cc}0 &amp; 1\end{array}\right ]^{T}$\end{document}</tex-math></alternatives></inline-formula> . We trained the network to output a response for stimulus category 1 whenever  <inline-formula><alternatives><mml:math id="inf93"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>&gt;</mml:mo><mml:mn>0.5</mml:mn></mml:mrow></mml:mstyle></mml:math><tex-math id="inft93">\begin{document}$u_{1}&gt;0.5$\end{document}</tex-math></alternatives></inline-formula>, and <inline-formula><alternatives><mml:math id="inf94"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>&lt;</mml:mo><mml:mn>0.5</mml:mn><mml:mo>,</mml:mo></mml:mrow></mml:mstyle></mml:math><tex-math id="inft94">\begin{document}$u_{2}&lt; 0.5,$\end{document}</tex-math></alternatives></inline-formula> and category 2 whenever  <inline-formula><alternatives><mml:math id="inf95"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>&lt;</mml:mo><mml:mn>0.5</mml:mn></mml:mrow></mml:mstyle></mml:math><tex-math id="inft95">\begin{document}$u_{1}&lt;0.5$\end{document}</tex-math></alternatives></inline-formula>, and <inline-formula><alternatives><mml:math id="inf96"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>u</mml:mi><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>&gt;</mml:mo><mml:mn>0.5</mml:mn></mml:mrow></mml:mstyle></mml:math><tex-math id="inft96">\begin{document}$u_{2}&gt; 0.5$\end{document}</tex-math></alternatives></inline-formula>.</p><p>To test our hypothesis that perceptual uncertainty increases neuromodulatory via phasic bursts in the noradrenergic LC, we made gain time dependent with dynamics governed by a linear ODE with a forcing term proportional to the uncertainty (i.e. the entropy <inline-formula><alternatives><mml:math id="inf97"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>H</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:munder><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:munder><mml:mi>p</mml:mi><mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mi>l</mml:mi><mml:mi>n</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>p</mml:mi><mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math><tex-math id="inft97">\begin{document}$H\left (z\right)=\sum _{i}p\left (z\right)_{i}ln\left (p\left (z\right)_{i}\right)$\end{document}</tex-math></alternatives></inline-formula>) of the network’s readout.<disp-formula id="equ4"><alternatives><mml:math id="m4"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mi>d</mml:mi><mml:mi>g</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>τ</mml:mi></mml:mfrac><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msub><mml:mi>g</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>−</mml:mo><mml:mi>g</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>t</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:mi>γ</mml:mi><mml:mi>H</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mi>d</mml:mi><mml:mi>t</mml:mi></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t4">\begin{document}$$\displaystyle dg=\frac{1}{\tau } \left (g_{tonic}- g\left (t\right)+\gamma H\left (z\right)\right)dt$$\end{document}</tex-math></alternatives></disp-formula></p><p>where <inline-formula><alternatives><mml:math id="inf98"><mml:mi>p</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>z</mml:mi></mml:mrow></mml:mfenced></mml:math><tex-math id="inft98">\begin{document}$p\left (z\right)$\end{document}</tex-math></alternatives></inline-formula> is obtained by passing <inline-formula><alternatives><mml:math id="inf99"><mml:mi>z</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:mfenced></mml:math><tex-math id="inft99">\begin{document}$z\left (t\right)$\end{document}</tex-math></alternatives></inline-formula> through a softmax function at each time step of the simulation <inline-formula><alternatives><mml:math id="inf100"><mml:msub><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>e</mml:mi><mml:mi>x</mml:mi><mml:mi>p</mml:mi><mml:mo>⁡</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>ω</mml:mi><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mrow><mml:msubsup><mml:mo stretchy="false">∑</mml:mo><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>K</mml:mi></mml:mrow></mml:msubsup><mml:mrow><mml:mi>e</mml:mi><mml:mi>x</mml:mi><mml:mi>p</mml:mi><mml:mo>⁡</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>ω</mml:mi><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mrow></mml:mfrac></mml:math><tex-math id="inft100">\begin{document}$p\left (z\right)_{i}=\frac{exp \left (\omega z_{i}\right)}{\sum _{j}^{K}exp \left (\omega z_{j}\right)}$\end{document}</tex-math></alternatives></inline-formula> with inverse temperature parameter <inline-formula><alternatives><mml:math id="inf101"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>ω</mml:mi><mml:mo>=</mml:mo><mml:mn>0.25</mml:mn></mml:mrow></mml:mstyle></mml:math><tex-math id="inft101">\begin{document}$\omega =0.25$\end{document}</tex-math></alternatives></inline-formula>. When the network approaches the half-way point in the trial, input is maximally ambiguous and the distribution <inline-formula><alternatives><mml:math id="inf102"><mml:mi>p</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>z</mml:mi></mml:mrow></mml:mfenced></mml:math><tex-math id="inft102">\begin{document}$p\left (z\right)$\end{document}</tex-math></alternatives></inline-formula> approaches a uniform distribution leading <inline-formula><alternatives><mml:math id="inf103"><mml:mi>H</mml:mi><mml:mo>(</mml:mo><mml:mi>z</mml:mi><mml:mo>)</mml:mo></mml:math><tex-math id="inft103">\begin{document}$H\left (z\right)$\end{document}</tex-math></alternatives></inline-formula> to approach its maximum value, which in turn leads to a phasic increase in gain (with magnitude <inline-formula><alternatives><mml:math id="inf104"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft104">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula>). In the absence of forcing (i.e. under conditions of perceptual certainty), gain decays exponentially to its tonic value (<inline-formula><alternatives><mml:math id="inf105"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>g</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>i</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mstyle></mml:math><tex-math id="inft105">\begin{document}$g_{tonic}=1$\end{document}</tex-math></alternatives></inline-formula>).</p><p>To study how the population dynamics of the trained networks changed as a function of gain in a shared space, we performed a PCA on the concatenated activity of the network at  <inline-formula><alternatives><mml:math id="inf106"><mml:mi>γ</mml:mi></mml:math><tex-math id="inft106">\begin{document}$\gamma $\end{document}</tex-math></alternatives></inline-formula> = 0. The set of principal components was highly low-dimensional, with 80.58±6.34% of the variance explained by the first principal component (PC<sub>1</sub>). We then projected the trial-averaged activity at each gain value at each timepoint onto the top PC.</p></sec><sec id="s4-6"><title>Energy landscape analysis</title><p>Leveraging previous work from our group (<xref ref-type="bibr" rid="bib54">Munn et al., 2021</xref>), we constructed a measure of the energy landscape traversed by each network through an analogy to the relationship between probability and energy in statistical mechanics (<xref ref-type="bibr" rid="bib86">Tkačik et al., 2015</xref>; <xref ref-type="bibr" rid="bib53">Munn and Gong, 2018</xref>) given by the Boltzmann distribution.<disp-formula id="equ5"><alternatives><mml:math id="m5"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>p</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>z</mml:mi></mml:mfrac><mml:msup><mml:mi>e</mml:mi><mml:mrow><mml:mo>−</mml:mo><mml:mi>β</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t5">\begin{document}$$\displaystyle p_{i}=\frac{1}{z}e^{- \beta E_{i}}$$\end{document}</tex-math></alternatives></disp-formula></p><p>where <inline-formula><alternatives><mml:math id="inf107"><mml:msub><mml:mrow><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft107">\begin{document}$p_{i}$\end{document}</tex-math></alternatives></inline-formula> denotes the probability of each state, <inline-formula><alternatives><mml:math id="inf108"><mml:msub><mml:mrow><mml:mi>E</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft108">\begin{document}$E_{i}$\end{document}</tex-math></alternatives></inline-formula> the energy of each state, <inline-formula><alternatives><mml:math id="inf109"><mml:mi>β</mml:mi></mml:math><tex-math id="inft109">\begin{document}$\beta $\end{document}</tex-math></alternatives></inline-formula> the thermodynamic beta, and <inline-formula><alternatives><mml:math id="inf110"><mml:mi>z</mml:mi></mml:math><tex-math id="inft110">\begin{document}$z$\end{document}</tex-math></alternatives></inline-formula> the canonical partition function. Solving for <inline-formula><alternatives><mml:math id="inf111"><mml:msub><mml:mrow><mml:mi>E</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft111">\begin{document}$E_{i}$\end{document}</tex-math></alternatives></inline-formula> , we obtain<disp-formula id="equ6"><alternatives><mml:math id="m6"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>β</mml:mi></mml:mfrac><mml:mi>l</mml:mi><mml:mi>n</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>z</mml:mi><mml:msub><mml:mi>p</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t6">\begin{document}$$\displaystyle E_{i}=\frac{1}{\beta }ln\left (\frac{1}{zp_{i}}\right)$$\end{document}</tex-math></alternatives></disp-formula></p><p>Instead of inferring the probability distribution from the energy of a state as is done in physics, we used the fitdist function in MATLAB with a Gaussian kernel (<inline-formula><alternatives><mml:math id="inf112"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>P</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>x</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mn>4</mml:mn><mml:mi>n</mml:mi></mml:mrow></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:munderover><mml:mi>K</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mfrac><mml:mi>x</mml:mi><mml:mn>4</mml:mn></mml:mfrac><mml:mo>)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mrow></mml:mstyle></mml:math><tex-math id="inft112">\begin{document}$P\left (x\right)=\frac{1}{4n}\sum _{i=1}^{n}K\left (\frac{x}{4}\right),$\end{document}</tex-math></alternatives></inline-formula> where <inline-formula><alternatives><mml:math id="inf113"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>K</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mi>u</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mn>2</mml:mn><mml:msqrt><mml:mi>π</mml:mi></mml:msqrt></mml:mrow></mml:mfrac><mml:msup><mml:mi>e</mml:mi><mml:mrow><mml:mfrac><mml:mrow><mml:mo>−</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mn>2</mml:mn></mml:mfrac><mml:msup><mml:mi>u</mml:mi><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math><tex-math id="inft113">\begin{document}$K\left (u\right)=\frac{1}{2\sqrt{\pi }}e^{\frac{- 1}{2}u^{2}}$\end{document}</tex-math></alternatives></inline-formula>) to infer the probability of the state, and then solved for the energy. As <inline-formula><alternatives><mml:math id="inf114"><mml:mrow><mml:msubsup><mml:mo stretchy="false">∫</mml:mo><mml:mrow><mml:mo>−</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mrow><mml:mo>+</mml:mo><mml:mi>∞</mml:mi></mml:mrow></mml:msubsup><mml:mrow><mml:mi>P</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:mfenced><mml:mi>d</mml:mi><mml:mi>x</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mrow></mml:math><tex-math id="inft114">\begin{document}$\int _{- \infty }^{+\infty }P\left (x\right)dx=1$\end{document}</tex-math></alternatives></inline-formula> by construction, the partition function <inline-formula><alternatives><mml:math id="inf115"><mml:mi>z</mml:mi></mml:math><tex-math id="inft115">\begin{document}$z$\end{document}</tex-math></alternatives></inline-formula>, which we define here to be the integral of the pdf, is equal to 1, which, after setting <inline-formula><alternatives><mml:math id="inf116"><mml:mi>β</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:math><tex-math id="inft116">\begin{document}$\beta =1$\end{document}</tex-math></alternatives></inline-formula>, yields<disp-formula id="equ7"><alternatives><mml:math id="m7"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>l</mml:mi><mml:mi>n</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:msub><mml:mi>p</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mfrac><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t7">\begin{document}$$\displaystyle E_{i}=ln\left (\frac{1}{p_{i}}\right)$$\end{document}</tex-math></alternatives></disp-formula></p><p>For the allocentric landscape analysis, we defined the state of the system in terms of the trial-averaged loadings on PC<sub>1</sub> which we divided into 250 ms windows. For the egocentric landscape analysis, we calculated the mean-squared displacement (MSD) of the activity of the RNN at each time point <inline-formula><alternatives><mml:math id="inf117"><mml:msub><mml:mrow><mml:mi>τ</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft117">\begin{document}$\tau _{0}$\end{document}</tex-math></alternatives></inline-formula> relative to the reference point <inline-formula><alternatives><mml:math id="inf118"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>τ</mml:mi><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>τ</mml:mi></mml:mrow></mml:mstyle></mml:math><tex-math id="inft118">\begin{document}$\tau _{0}+\tau $\end{document}</tex-math></alternatives></inline-formula>:<disp-formula id="equ8"><alternatives><mml:math id="m8"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>D</mml:mi><mml:mrow><mml:mi>τ</mml:mi><mml:mo>,</mml:mo><mml:msub><mml:mi>τ</mml:mi><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mo>⟨</mml:mo><mml:msup><mml:mrow><mml:mo>|</mml:mo><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:msub><mml:mi>τ</mml:mi><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>τ</mml:mi></mml:mrow></mml:msub><mml:mo>−</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:msub><mml:mi>τ</mml:mi><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow><mml:mo>|</mml:mo></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup><mml:mo>⟩</mml:mo></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t8">\begin{document}$$\displaystyle MSD_{\tau ,\tau _{0}}=\left \langle \left |x_{\tau _{0}+\tau }- x_{\tau _{0}}\right |^{2}\right \rangle _{n}$$\end{document}</tex-math></alternatives></disp-formula></p><p>For congruency with the allocentric analysis, we increased <inline-formula><alternatives><mml:math id="inf119"><mml:mi>τ</mml:mi></mml:math><tex-math id="inft119">\begin{document}$\tau $\end{document}</tex-math></alternatives></inline-formula> and <inline-formula><alternatives><mml:math id="inf120"><mml:msub><mml:mrow><mml:mi>τ</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft120">\begin{document}$\tau _{0}$\end{document}</tex-math></alternatives></inline-formula> in steps of 250 ms starting 1 s into the trial and ending with a maximum difference between <inline-formula><alternatives><mml:math id="inf121"><mml:mi>τ</mml:mi></mml:math><tex-math id="inft121">\begin{document}$\tau $\end{document}</tex-math></alternatives></inline-formula> and <inline-formula><alternatives><mml:math id="inf122"><mml:msub><mml:mrow><mml:mi>τ</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub></mml:math><tex-math id="inft122">\begin{document}$\tau _{0}$\end{document}</tex-math></alternatives></inline-formula> of 5 s to ensure that all steps had equivalent window sizes.</p><p>Following the physical analogy, we think of the state of the system, PC<sub>1</sub> loadings in the allocentric analysis, and MSD in the egocentric analysis, as akin to the location and movement of a particle respectively. Positions in state space with low energy have a higher probability of being occupied, and systems with a higher average energy have a more uniform probability distribution, making large jumps in the position of a particle more likely (i.e. lower energy for large MSD values; see supplementary material; <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1</xref>).</p><p>To quantify the effect of gain-mediated alterations to the topography of the allocentric energy landscape, we devised a novel measure – neural work – of the force (which in classical mechanics is equal to the negative gradient of potential energy) exerted on the low-dimensional neural trajectory by the vector field quantified by the allocentric energy landscape at each time point in the trial.<disp-formula id="equ9"><alternatives><mml:math id="m9"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>W</mml:mi><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mo>−</mml:mo><mml:mfrac><mml:mrow><mml:mi>d</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:mfrac><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t9">\begin{document}$$\displaystyle W_{t}=-\frac{dE_{t}}{dx}s_{t}$$\end{document}</tex-math></alternatives></disp-formula></p><p>where <inline-formula><alternatives><mml:math id="inf123"><mml:msub><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft123">\begin{document}$s_{t}$\end{document}</tex-math></alternatives></inline-formula> is the displacement of the PC trajectory, and <inline-formula><alternatives><mml:math id="inf124"><mml:mfrac><mml:mrow><mml:mi>d</mml:mi><mml:msub><mml:mrow><mml:mi>E</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:mfrac></mml:math><tex-math id="inft124">\begin{document}$\frac{dE_{t}}{dx}$\end{document}</tex-math></alternatives></inline-formula> the energy gradient. We computed <inline-formula><alternatives><mml:math id="inf125"><mml:msub><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:math><tex-math id="inft125">\begin{document}$s_{t}$\end{document}</tex-math></alternatives></inline-formula> from the (absolute) difference between PC<sub>1</sub> loadings at the start and end of each time window, and <inline-formula><alternatives><mml:math id="inf126"><mml:mfrac><mml:mrow><mml:mi>d</mml:mi><mml:msub><mml:mrow><mml:mi>E</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:mfrac></mml:math><tex-math id="inft126">\begin{document}$\frac{dE_{t}}{dx}$\end{document}</tex-math></alternatives></inline-formula> from the gradient of energy values at the start and end of each time window.</p></sec><sec id="s4-7"><title>MRI data</title><p>Functional data were acquired using gradient echo-planar T2*-weighted images collected on a 1.5T Phillips scanner located at Grand River Hospital in Waterloo, Ontario (TR = 2000 ms; TE = 40 ms; slice thickness = 5 mm with no gap; 26 slices/volume; FOV = 220 × 220 mm<sup>2</sup>; voxel size = 2.75 × 2.75 × 5 mm<sup>3</sup>; flip angle = 90°). Each experimental run consisted of 26 slices per volume and 285 volumes. At the beginning of each run, a whole-brain T1-weighted anatomical image was collected for each participant (TR = 7.4 ms; TE = 3.4 ms; voxel size = 1 × 1 × 1 mm<sup>3</sup>; FOV = 240 × 240 mm<sup>2</sup>; 150 slices with no gap; flip angle = 8°). The experimental protocol was programmed using E-Prime experimental presentation software (v1.1 SP3; Psychology Software Tools, Pittsburgh, PA). Stimuli were presented on an Avotec Silent Vision fibre-optic presentation system using binocular projection glasses (Model SV-7021). The onset of each trial was synchronised with the onset of data collection for the appropriate functional volume using trigger pulses from the scanner.</p></sec><sec id="s4-8"><title>fMRI data preprocessing</title><p>After realignment (using FSL’s MCFLIRT), we used FEAT to unwarp the EPI images in the y-direction with a 10% signal loss threshold and an effective echo spacing of 0.333. Following noise-cleaning with FIX (custom training set for scanner, threshold 20, including regression of estimated motion parameters), the unwrapped EPI images were then smoothed at 6 mm FWHM and nonlinearly co-registered with the anatomical T1 to 2 mm isotropic MNI space. Temporal artefacts were identified in each dataset by calculating framewise displacement (FD) from the derivatives of the six rigid-body realignment parameters estimated during standard volume realignment (<xref ref-type="bibr" rid="bib62">Power et al., 2014</xref>), as well as the root mean square change in BOLD signal from volume to volume (DVARS). Frames associated with FD &gt; 0.25 mm or DVARS &gt; 2.5% were identified; however, as no participants were identified with greater than 10% of the resting time points exceeding these values, no trials were excluded from further analysis. There were no differences in head motion parameters between the five runs (p&gt;0.500). Following artefact detection, nuisance covariates associated with the six linear head movement parameters (and their temporal derivatives), DVARS, physiological regressors (created using the RETROICOR method), and anatomical masks from the cerebrospinal fluid and deep cerebral white matter were regressed from the data using the CompCor strategy (<xref ref-type="bibr" rid="bib7">Behzadi et al., 2007</xref>). Finally, in keeping with previous time-resolved connectivity experiments (<xref ref-type="bibr" rid="bib30">Gu et al., 2015</xref>), a temporal band pass filter (0.0071&lt;f&lt;0.125 Hz) was applied to the data.</p></sec><sec id="s4-9"><title>Brain parcellation</title><p>Following preprocessing, the mean time series was extracted from 375 predefined regions of interest (ROIs). To ensure whole-brain coverage, we extracted the following: (a) 333 cortical parcels (161 and 162 regions from the left and right hemispheres, respectively) using the Gordon atlas (<xref ref-type="bibr" rid="bib29">Gordon et al., 2016</xref>); (b) 14 subcortical regions from the Harvard-Oxford subcortical atlas (bilateral thalamus, caudate, putamen, ventral striatum, globus pallidus, amygdala, and hippocampus; <ext-link ext-link-type="uri" xlink:href="https://fsl.fmrib.ox.ac.uk/">https://fsl.fmrib.ox.ac.uk/</ext-link>); and (c) 28 cerebellar regions from the SUIT atlas (<xref ref-type="bibr" rid="bib21">Diedrichsen et al., 2009</xref>) for each participant in the study.</p></sec><sec id="s4-10"><title>Neuroimaging analysis</title><p>In order to analyse task-evoked activity related to stimulus presentations, we first performed a PCA (<xref ref-type="bibr" rid="bib76">Shine et al., 2019</xref>) on the pre-processed BOLD time series (per subject/session) to extract orthogonal low-dimensional time series. The top 3 PCs explained ~30.6% of the variance. The time series of these PCs was entered into a general linear model, in which we modelled the following nine event types across an entire session, centred around the perceptual switch point, which changed on a trial-by-trial basis: the first two images (modelled as a single regressor), the seven images surrounding each perceptual change (i.e. the switch trial and the three images surrounding the change point, modelled as seven separate regressors) and the last two images (modelled as a single regressor). Each of the event onset times was also convolved with a canonical haemodynamic response function. This left us with nine unique β values per principal component, which we could use to determine how each PC differentially engaged as a function of the task. To test the hypothesis that the rate of change of PC engagement peaked at the perceptual change point, we calculated the difference between the β value for each of the top 3 PCs for each of the nine event types, and then plotted the resultant series in order to identify whether a peak occurred at the perceptual switch point (i.e. the middle β value in the series). A block-resampling null (n=5000 permutations) was used as a permutation test (p&lt;0.05).</p><p>Spatial maps associated with the terms ‘switching’, ‘effort’, ‘attention’, ‘perception’, and ‘load’ were downloaded from the <italic>neurosynth</italic> repository (<xref ref-type="bibr" rid="bib101">Yarkoni et al., 2011</xref>) and mapped into our parcellation space by calculating the mean value within each independent parcel. These values were then correlated with the spatial loading of each of the top 3 PCs. A separate partial correlation analysis was conducted in which the same correlation was estimated after controlling for each of the other spatial maps.</p></sec><sec id="s4-11"><title>Topological analyses</title><p>A hierarchical modularity approach was used to collapse the mean time-averaged correlation matrix across participants into a set of four spatially non-overlapping modules. Briefly, this involved running the Louvain modularity algorithm, which iteratively maximises the modularity statistic, <italic>Q</italic>, for different community assignments until the maximum possible score of <italic>Q</italic> has been obtained.<disp-formula id="equ10"><alternatives><mml:math id="m10"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>Q</mml:mi><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:msup><mml:mi>v</mml:mi><mml:mrow><mml:mo>+</mml:mo></mml:mrow></mml:msup></mml:mfrac><mml:munder><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:munder><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msubsup><mml:mi>w</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mo>+</mml:mo></mml:mrow></mml:msubsup><mml:mo>−</mml:mo><mml:msubsup><mml:mi>e</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mo>+</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">)</mml:mo><mml:msub><mml:mi>δ</mml:mi><mml:mrow><mml:msub><mml:mi>M</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mi>M</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow><mml:mo>−</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="script">v</mml:mi></mml:mrow><mml:mo>+</mml:mo></mml:msup><mml:mo>+</mml:mo><mml:msup><mml:mrow><mml:mi mathvariant="script">v</mml:mi></mml:mrow><mml:mo>−</mml:mo></mml:msup></mml:mrow></mml:mfrac><mml:munder><mml:mo movablelimits="false">∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:munder><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msubsup><mml:mi>w</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mo>−</mml:mo></mml:mrow></mml:msubsup><mml:mo>−</mml:mo><mml:msubsup><mml:mi>e</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mo>−</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">)</mml:mo><mml:msub><mml:mi>δ</mml:mi><mml:mrow><mml:msub><mml:mi>M</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mi>M</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:mstyle></mml:mrow></mml:mstyle></mml:math><tex-math id="t10">\begin{document}$$\displaystyle Q_{T}=\frac{1}{v^{+}}\sum _{ij}{(w_{ij}^{+}-e_{ij}^{+})\delta_{M_{i}M_{j}}}-\frac{1}{\mathscr{v}^+ +\mathscr{v}^- } \sum\limits_{ij}{(w_{ij}^{-}-e_{ij}^{-})\delta _{M_{i}M_{j}}}$$\end{document}</tex-math></alternatives></disp-formula></p><p>The community assignment for each region was then estimated 500 times across a range of γ values (0.5–2.0, in steps of 0.1). In order to identify multi-level structure in our data, we repeated the modularity analysis for each of the modules identified in the first step (<xref ref-type="bibr" rid="bib50">Meunier et al., 2010</xref>). Finally, a consensus partition was identified using a fine-tuning algorithm from the Brain Connectivity Toolbox (<ext-link ext-link-type="uri" xlink:href="http://www.brain-connectivity-toolbox.net/">http://www.brain-connectivity-toolbox.net/</ext-link>). We subsequently used this final module assignment to estimate the cartographic profile of the each participant’s time-averaged adjacency matrix (<xref ref-type="bibr" rid="bib73">Shine et al., 2016</xref>). Specifically, we estimated integration using the participation coefficient, which quantifies the extent to which a region connects across all modules (i.e. between-module strength; <xref ref-type="bibr" rid="bib31">Guimerà and Nunes Amaral, 2005</xref>), and segregation using the module-degree Z-score. These measures were entered into a joint-histogram (101 × 101 unique bins, equally spaced between 0 and 1 [for integration] and –1 and 1 [for segregation]). The value within each bin of this joint histogram was then correlated with the combined regression weights of PC<sub>2</sub> and PC<sub>3</sub> for each subject. A permutation test that scrambled the order of participants was used to assess statistical significance (p&lt;0.05).</p></sec><sec id="s4-12"><title>Brain-state displacement and the energy landscape</title><p>To quantify the change in the evoked BOLD activity following each stimulus, we calculated the main BOLD displacement (MBD). The MBD is a measure of the absolute evoked deviation in BOLD activity. The evoked activity is measured through a general linear model using a canonical haemodynamic response function convolved on a design matrix. We are interested in the probability, <italic>p</italic>(MBD, <italic>re</italic>), that we will observe a given displacement in BOLD at a given regressor <italic>re</italic>. The probability is calculated through the null model of the general linear model (the probability that the observed evoked value of the corresponding region is different from 0). As described above, we then calculated the energy for each displacement value as <inline-formula><alternatives><mml:math id="inf127"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>B</mml:mi><mml:mi>D</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mi>e</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>l</mml:mi><mml:mi>n</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>P</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>M</mml:mi><mml:mi>B</mml:mi><mml:mi>D</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mi>e</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mfrac><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math><tex-math id="inft127">\begin{document}$E_{MBD,re }=ln\left (\frac{1}{P\left (MBD,re \right)}\right)$\end{document}</tex-math></alternatives></inline-formula>. Finally, to measure the surprise per displacement, we divided the absolute β for PC2 from <inline-formula><alternatives><mml:math id="inf128"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>B</mml:mi><mml:mi>D</mml:mi><mml:mo>,</mml:mo><mml:mi>r</mml:mi><mml:mi>e</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mstyle></mml:math><tex-math id="inft128">\begin{document}$E_{MBD,re }$\end{document}</tex-math></alternatives></inline-formula> for each regressor <italic>re</italic> (<xref ref-type="fig" rid="fig6">Figure 6</xref>).</p></sec></sec></body><back><sec sec-type="additional-information" id="s5"><title>Additional information</title><fn-group content-type="competing-interest"><title>Competing interests</title><fn fn-type="COI-statement" id="conf1"><p>No competing interests declared</p></fn></fn-group><fn-group content-type="author-contribution"><title>Author contributions</title><fn fn-type="con" id="con1"><p>Conceptualization, Data curation, Formal analysis, Validation, Investigation, Visualization, Methodology, Writing – original draft, Writing – review and editing</p></fn><fn fn-type="con" id="con2"><p>Conceptualization, Data curation, Software, Formal analysis, Validation, Investigation, Visualization, Methodology, Writing – original draft, Writing – review and editing</p></fn><fn fn-type="con" id="con3"><p>Conceptualization, Writing – review and editing</p></fn><fn fn-type="con" id="con4"><p>Methodology, Writing – review and editing</p></fn><fn fn-type="con" id="con5"><p>Writing – review and editing</p></fn><fn fn-type="con" id="con6"><p>Data curation, Methodology, Writing – review and editing</p></fn><fn fn-type="con" id="con7"><p>Data curation, Writing – review and editing</p></fn><fn fn-type="con" id="con8"><p>Methodology, Writing – review and editing</p></fn><fn fn-type="con" id="con9"><p>Conceptualization, Formal analysis, Supervision, Investigation, Methodology, Writing – review and editing</p></fn><fn fn-type="con" id="con10"><p>Conceptualization, Resources, Formal analysis, Supervision, Validation, Investigation, Visualization, Methodology, Writing – original draft, Project administration, Writing – review and editing</p></fn></fn-group><fn-group content-type="ethics-information"><title>Ethics</title><fn fn-type="other"><p>The research protocol was approved by the Office of Research Ethics at the University of Waterloo and the Tri-Hospital Research Ethics Board of the Region of Waterloo in Ontario, Canada.</p></fn></fn-group></sec><sec sec-type="supplementary-material" id="s6"><title>Additional files</title><supplementary-material id="mdar"><label>MDAR checklist</label><media xlink:href="elife-93191-mdarchecklist1-v1.pdf" mimetype="application" mime-subtype="pdf"/></supplementary-material></sec><sec sec-type="data-availability" id="s7"><title>Data availability</title><p>The data and code necessary to replicate our results are available online (<ext-link ext-link-type="uri" xlink:href="https://github.com/ShineLabUSYD/AmbiguousFigures">https://github.com/ShineLabUSYD/AmbiguousFigures</ext-link> [copy archived at <xref ref-type="bibr" rid="bib98">Whyte et al., 2025</xref>] and <ext-link ext-link-type="uri" xlink:href="https://osf.io/uvykp/">https://osf.io/uvykp/</ext-link>).</p><p>The following dataset was generated:</p><p><element-citation publication-type="data" specific-use="isSupplementedBy" id="dataset1"><person-group person-group-type="author"><name><surname>Danckert</surname><given-names>J</given-names></name></person-group><year iso-8601-date="2025">2025</year><data-title>fMRI data from Stottinger papers</data-title><source>Open Science Framework</source><pub-id pub-id-type="doi">10.17605/OSF.IO/UVYKP</pub-id></element-citation></p></sec><ref-list><title>References</title><ref id="bib1"><element-citation publication-type="book"><person-group person-group-type="author"><name><surname>Alais</surname><given-names>D</given-names></name><name><surname>Blake</surname><given-names>R</given-names></name></person-group><year iso-8601-date="2005">2005</year><source>Binocular Rivalry</source><publisher-name>MIT Press</publisher-name><pub-id pub-id-type="doi">10.7551/mitpress/1605.001.0001</pub-id></element-citation></ref><ref id="bib2"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Alnæs</surname><given-names>D</given-names></name><name><surname>Sneve</surname><given-names>MH</given-names></name><name><surname>Espeseth</surname><given-names>T</given-names></name><name><surname>Endestad</surname><given-names>T</given-names></name><name><surname>van de Pavert</surname><given-names>SHP</given-names></name><name><surname>Laeng</surname><given-names>B</given-names></name></person-group><year iso-8601-date="2014">2014</year><article-title>Pupil size signals mental effort deployed during multiple object tracking and predicts brain activity in the dorsal attention network and the locus coeruleus</article-title><source>Journal of Vision</source><volume>14</volume><fpage>1</fpage><lpage>20</lpage><pub-id pub-id-type="doi">10.1167/14.4.1</pub-id><pub-id pub-id-type="pmid">24692319</pub-id></element-citation></ref><ref id="bib3"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Aston-Jones</surname><given-names>G</given-names></name><name><surname>Cohen</surname><given-names>JD</given-names></name></person-group><year iso-8601-date="2005">2005</year><article-title>An integrative theory of locus coeruleus-norepinephrine function: adaptive gain and optimal performance</article-title><source>Annual Review of Neuroscience</source><volume>28</volume><fpage>403</fpage><lpage>450</lpage><pub-id pub-id-type="doi">10.1146/annurev.neuro.28.061604.135709</pub-id><pub-id pub-id-type="pmid">16022602</pub-id></element-citation></ref><ref id="bib4"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Barack</surname><given-names>DL</given-names></name><name><surname>Krakauer</surname><given-names>JW</given-names></name></person-group><year iso-8601-date="2021">2021</year><article-title>Two views on the cognitive brain</article-title><source>Nature Reviews. Neuroscience</source><volume>22</volume><fpage>359</fpage><lpage>371</lpage><pub-id pub-id-type="doi">10.1038/s41583-021-00448-6</pub-id><pub-id pub-id-type="pmid">33859408</pub-id></element-citation></ref><ref id="bib5"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Beer</surname><given-names>RD</given-names></name></person-group><year iso-8601-date="2000">2000</year><article-title>Dynamical approaches to cognitive science</article-title><source>Trends in Cognitive Sciences</source><volume>4</volume><fpage>91</fpage><lpage>99</lpage><pub-id pub-id-type="doi">10.1016/s1364-6613(99)01440-0</pub-id><pub-id pub-id-type="pmid">10689343</pub-id></element-citation></ref><ref id="bib6"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Beer</surname><given-names>RD</given-names></name></person-group><year iso-8601-date="2022">2022</year><article-title>Codimension-2 parameter space structure of continuous-time recurrent neural networks</article-title><source>Biological Cybernetics</source><volume>116</volume><fpage>501</fpage><lpage>515</lpage><pub-id pub-id-type="doi">10.1007/s00422-022-00938-5</pub-id><pub-id pub-id-type="pmid">35723721</pub-id></element-citation></ref><ref id="bib7"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Behzadi</surname><given-names>Y</given-names></name><name><surname>Restom</surname><given-names>K</given-names></name><name><surname>Liau</surname><given-names>J</given-names></name><name><surname>Liu</surname><given-names>TT</given-names></name></person-group><year iso-8601-date="2007">2007</year><article-title>A component based noise correction method (CompCor) for BOLD and perfusion based fMRI</article-title><source>NeuroImage</source><volume>37</volume><fpage>90</fpage><lpage>101</lpage><pub-id pub-id-type="doi">10.1016/j.neuroimage.2007.04.042</pub-id><pub-id pub-id-type="pmid">17560126</pub-id></element-citation></ref><ref id="bib8"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bogacz</surname><given-names>R</given-names></name><name><surname>Brown</surname><given-names>E</given-names></name><name><surname>Moehlis</surname><given-names>J</given-names></name><name><surname>Holmes</surname><given-names>P</given-names></name><name><surname>Cohen</surname><given-names>JD</given-names></name></person-group><year iso-8601-date="2006">2006</year><article-title>The physics of optimal decision making: a formal analysis of models of performance in two-alternative forced-choice tasks</article-title><source>Psychological Review</source><volume>113</volume><fpage>700</fpage><lpage>765</lpage><pub-id pub-id-type="doi">10.1037/0033-295X.113.4.700</pub-id><pub-id pub-id-type="pmid">17014301</pub-id></element-citation></ref><ref id="bib9"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bogacz</surname><given-names>R</given-names></name></person-group><year iso-8601-date="2017">2017</year><article-title>A tutorial on the free-energy framework for modelling perception and learning</article-title><source>Journal of Mathematical Psychology</source><volume>76</volume><fpage>198</fpage><lpage>211</lpage><pub-id pub-id-type="doi">10.1016/j.jmp.2015.11.003</pub-id><pub-id pub-id-type="pmid">28298703</pub-id></element-citation></ref><ref id="bib10"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bouret</surname><given-names>S</given-names></name><name><surname>Sara</surname><given-names>SJ</given-names></name></person-group><year iso-8601-date="2005">2005</year><article-title>Network reset: a simplified overarching theory of locus coeruleus noradrenaline function</article-title><source>Trends in Neurosciences</source><volume>28</volume><fpage>574</fpage><lpage>582</lpage><pub-id pub-id-type="doi">10.1016/j.tins.2005.09.002</pub-id><pub-id pub-id-type="pmid">16165227</pub-id></element-citation></ref><ref id="bib11"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Briand</surname><given-names>LA</given-names></name><name><surname>Gritton</surname><given-names>H</given-names></name><name><surname>Howe</surname><given-names>WM</given-names></name><name><surname>Young</surname><given-names>DA</given-names></name><name><surname>Sarter</surname><given-names>M</given-names></name></person-group><year iso-8601-date="2007">2007</year><article-title>Modulators in concert for cognition: modulator interactions in the prefrontal cortex</article-title><source>Progress in Neurobiology</source><volume>83</volume><fpage>69</fpage><lpage>91</lpage><pub-id pub-id-type="doi">10.1016/j.pneurobio.2007.06.007</pub-id><pub-id pub-id-type="pmid">17681661</pub-id></element-citation></ref><ref id="bib12"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Campos-Arteaga</surname><given-names>G</given-names></name><name><surname>Forcato</surname><given-names>C</given-names></name><name><surname>Wainstein</surname><given-names>G</given-names></name><name><surname>Lagos</surname><given-names>R</given-names></name><name><surname>Palacios-García</surname><given-names>I</given-names></name><name><surname>Artigas</surname><given-names>C</given-names></name><name><surname>Morales</surname><given-names>R</given-names></name><name><surname>Pedreira</surname><given-names>ME</given-names></name><name><surname>Rodríguez</surname><given-names>E</given-names></name></person-group><year iso-8601-date="2020">2020</year><article-title>Differential neurophysiological correlates of retrieval of consolidated and reconsolidated memories in humans: An ERP and pupillometry study</article-title><source>Neurobiology of Learning and Memory</source><volume>174</volume><elocation-id>107279</elocation-id><pub-id pub-id-type="doi">10.1016/j.nlm.2020.107279</pub-id><pub-id pub-id-type="pmid">32710932</pub-id></element-citation></ref><ref id="bib13"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Carter</surname><given-names>O</given-names></name><name><surname>van Swinderen</surname><given-names>B</given-names></name><name><surname>Leopold</surname><given-names>DA</given-names></name><name><surname>Collin</surname><given-names>SP</given-names></name><name><surname>Maier</surname><given-names>A</given-names></name></person-group><year iso-8601-date="2020">2020</year><article-title>Perceptual rivalry across animal species</article-title><source>The Journal of Comparative Neurology</source><volume>528</volume><fpage>3123</fpage><lpage>3133</lpage><pub-id pub-id-type="doi">10.1002/cne.24939</pub-id><pub-id pub-id-type="pmid">32361986</pub-id></element-citation></ref><ref id="bib14"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cazettes</surname><given-names>F</given-names></name><name><surname>Reato</surname><given-names>D</given-names></name><name><surname>Morais</surname><given-names>JP</given-names></name><name><surname>Renart</surname><given-names>A</given-names></name><name><surname>Mainen</surname><given-names>ZF</given-names></name></person-group><year iso-8601-date="2021">2021</year><article-title>Phasic activation of dorsal raphe serotonergic neurons increases pupil size</article-title><source>Current Biology</source><volume>31</volume><fpage>192</fpage><lpage>197</lpage><pub-id pub-id-type="doi">10.1016/j.cub.2020.09.090</pub-id><pub-id pub-id-type="pmid">33186549</pub-id></element-citation></ref><ref id="bib15"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cisek</surname><given-names>P</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>Resynthesizing behavior through phylogenetic refinement</article-title><source>Attention, Perception &amp; Psychophysics</source><volume>81</volume><fpage>2265</fpage><lpage>2287</lpage><pub-id pub-id-type="doi">10.3758/s13414-019-01760-1</pub-id><pub-id pub-id-type="pmid">31161495</pub-id></element-citation></ref><ref id="bib16"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Clark</surname><given-names>A</given-names></name></person-group><year iso-8601-date="2013">2013</year><article-title>Whatever next? Predictive brains, situated agents, and the future of cognitive science</article-title><source>The Behavioral and Brain Sciences</source><volume>36</volume><fpage>181</fpage><lpage>204</lpage><pub-id pub-id-type="doi">10.1017/S0140525X12000477</pub-id><pub-id pub-id-type="pmid">23663408</pub-id></element-citation></ref><ref id="bib17"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>de Gee</surname><given-names>JW</given-names></name><name><surname>Knapen</surname><given-names>T</given-names></name><name><surname>Donner</surname><given-names>TH</given-names></name></person-group><year iso-8601-date="2014">2014</year><article-title>Decision-related pupil dilation reflects upcoming choice and individual bias</article-title><source>PNAS</source><volume>111</volume><fpage>E618</fpage><lpage>E25</lpage><pub-id pub-id-type="doi">10.1073/pnas.1317557111</pub-id><pub-id pub-id-type="pmid">24449874</pub-id></element-citation></ref><ref id="bib18"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>de Gee</surname><given-names>JW</given-names></name><name><surname>Colizoli</surname><given-names>O</given-names></name><name><surname>Kloosterman</surname><given-names>NA</given-names></name><name><surname>Knapen</surname><given-names>T</given-names></name><name><surname>Nieuwenhuis</surname><given-names>S</given-names></name><name><surname>Donner</surname><given-names>TH</given-names></name></person-group><year iso-8601-date="2017">2017</year><article-title>Dynamic modulation of decision biases by brainstem arousal systems</article-title><source>eLife</source><volume>6</volume><elocation-id>e23232</elocation-id><pub-id pub-id-type="doi">10.7554/eLife.23232</pub-id><pub-id pub-id-type="pmid">28383284</pub-id></element-citation></ref><ref id="bib19"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>de Gee</surname><given-names>JW</given-names></name><name><surname>Tsetsos</surname><given-names>K</given-names></name><name><surname>Schwabe</surname><given-names>L</given-names></name><name><surname>Urai</surname><given-names>AE</given-names></name><name><surname>McCormick</surname><given-names>D</given-names></name><name><surname>McGinley</surname><given-names>MJ</given-names></name><name><surname>Donner</surname><given-names>TH</given-names></name></person-group><year iso-8601-date="2020">2020</year><article-title>Pupil-linked phasic arousal predicts a reduction of choice bias across species and decision domains</article-title><source>eLife</source><volume>9</volume><elocation-id>e54014</elocation-id><pub-id pub-id-type="doi">10.7554/eLife.54014</pub-id><pub-id pub-id-type="pmid">32543372</pub-id></element-citation></ref><ref id="bib20"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Desimone</surname><given-names>R</given-names></name><name><surname>Duncan</surname><given-names>J</given-names></name></person-group><year iso-8601-date="1995">1995</year><article-title>Neural mechanisms of selective visual attention</article-title><source>Annual Review of Neuroscience</source><volume>18</volume><fpage>193</fpage><lpage>222</lpage><pub-id pub-id-type="doi">10.1146/annurev.ne.18.030195.001205</pub-id><pub-id pub-id-type="pmid">7605061</pub-id></element-citation></ref><ref id="bib21"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Diedrichsen</surname><given-names>J</given-names></name><name><surname>Balsters</surname><given-names>JH</given-names></name><name><surname>Flavell</surname><given-names>J</given-names></name><name><surname>Cussans</surname><given-names>E</given-names></name><name><surname>Ramnani</surname><given-names>N</given-names></name></person-group><year iso-8601-date="2009">2009</year><article-title>A probabilistic MR atlas of the human cerebellum</article-title><source>NeuroImage</source><volume>46</volume><fpage>39</fpage><lpage>46</lpage><pub-id pub-id-type="doi">10.1016/j.neuroimage.2009.01.045</pub-id></element-citation></ref><ref id="bib22"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dieter</surname><given-names>KC</given-names></name><name><surname>Tadin</surname><given-names>D</given-names></name></person-group><year iso-8601-date="2011">2011</year><article-title>Understanding attentional modulation of binocular rivalry: a framework based on biased competition</article-title><source>Frontiers in Human Neuroscience</source><volume>5</volume><elocation-id>155</elocation-id><pub-id pub-id-type="doi">10.3389/fnhum.2011.00155</pub-id><pub-id pub-id-type="pmid">22144958</pub-id></element-citation></ref><ref id="bib23"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Doerig</surname><given-names>A</given-names></name><name><surname>Sommers</surname><given-names>RP</given-names></name><name><surname>Seeliger</surname><given-names>K</given-names></name><name><surname>Richards</surname><given-names>B</given-names></name><name><surname>Ismael</surname><given-names>J</given-names></name><name><surname>Lindsay</surname><given-names>GW</given-names></name><name><surname>Kording</surname><given-names>KP</given-names></name><name><surname>Konkle</surname><given-names>T</given-names></name><name><surname>van Gerven</surname><given-names>MAJ</given-names></name><name><surname>Kriegeskorte</surname><given-names>N</given-names></name><name><surname>Kietzmann</surname><given-names>TC</given-names></name></person-group><year iso-8601-date="2023">2023</year><article-title>The neuroconnectionist research programme</article-title><source>Nature Reviews. Neuroscience</source><volume>24</volume><fpage>431</fpage><lpage>450</lpage><pub-id pub-id-type="doi">10.1038/s41583-023-00705-w</pub-id><pub-id pub-id-type="pmid">37253949</pub-id></element-citation></ref><ref id="bib24"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Eckhoff</surname><given-names>P</given-names></name><name><surname>Wong-Lin</surname><given-names>K</given-names></name><name><surname>Holmes</surname><given-names>P</given-names></name></person-group><year iso-8601-date="2011">2011</year><article-title>Dimension reduction and dynamics of a spiking neural network model for decision making under neuromodulation()</article-title><source>SIAM Journal on Applied Dynamical Systems</source><volume>10</volume><fpage>148</fpage><lpage>188</lpage><pub-id pub-id-type="doi">10.1137/090770096</pub-id><pub-id pub-id-type="pmid">22768006</pub-id></element-citation></ref><ref id="bib25"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Einhäuser</surname><given-names>W</given-names></name><name><surname>Stout</surname><given-names>J</given-names></name><name><surname>Koch</surname><given-names>C</given-names></name><name><surname>Carter</surname><given-names>O</given-names></name></person-group><year iso-8601-date="2008">2008</year><article-title>Pupil dilation reflects perceptual selection and predicts subsequent stability in perceptual rivalry</article-title><source>PNAS</source><volume>105</volume><fpage>1704</fpage><lpage>1709</lpage><pub-id pub-id-type="doi">10.1073/pnas.0707727105</pub-id><pub-id pub-id-type="pmid">18250340</pub-id></element-citation></ref><ref id="bib26"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Eldar</surname><given-names>E</given-names></name><name><surname>Cohen</surname><given-names>JD</given-names></name><name><surname>Niv</surname><given-names>Y</given-names></name></person-group><year iso-8601-date="2013">2013</year><article-title>The effects of neural gain on attention and learning</article-title><source>Nature Neuroscience</source><volume>16</volume><fpage>1146</fpage><lpage>1153</lpage><pub-id pub-id-type="doi">10.1038/nn.3428</pub-id><pub-id pub-id-type="pmid">23770566</pub-id></element-citation></ref><ref id="bib27"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Flounders</surname><given-names>MW</given-names></name><name><surname>González-García</surname><given-names>C</given-names></name><name><surname>Hardstone</surname><given-names>R</given-names></name><name><surname>He</surname><given-names>BJ</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>Neural dynamics of visual ambiguity resolution by perceptual prior</article-title><source>eLife</source><volume>8</volume><elocation-id>e41861</elocation-id><pub-id pub-id-type="doi">10.7554/eLife.41861</pub-id><pub-id pub-id-type="pmid">30843519</pub-id></element-citation></ref><ref id="bib28"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Friston</surname><given-names>K</given-names></name></person-group><year iso-8601-date="2005">2005</year><article-title>A theory of cortical responses</article-title><source>Philosophical Transactions of the Royal Society of London. Series B, Biological Sciences</source><volume>360</volume><fpage>815</fpage><lpage>836</lpage><pub-id pub-id-type="doi">10.1098/rstb.2005.1622</pub-id><pub-id pub-id-type="pmid">15937014</pub-id></element-citation></ref><ref id="bib29"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gordon</surname><given-names>EM</given-names></name><name><surname>Laumann</surname><given-names>TO</given-names></name><name><surname>Adeyemo</surname><given-names>B</given-names></name><name><surname>Huckins</surname><given-names>JF</given-names></name><name><surname>Kelley</surname><given-names>WM</given-names></name><name><surname>Petersen</surname><given-names>SE</given-names></name></person-group><year iso-8601-date="2016">2016</year><article-title>Generation and evaluation of a cortical area parcellation from resting-state correlations</article-title><source>Cerebral Cortex</source><volume>26</volume><fpage>288</fpage><lpage>303</lpage><pub-id pub-id-type="doi">10.1093/cercor/bhu239</pub-id><pub-id pub-id-type="pmid">25316338</pub-id></element-citation></ref><ref id="bib30"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gu</surname><given-names>S</given-names></name><name><surname>Pasqualetti</surname><given-names>F</given-names></name><name><surname>Cieslak</surname><given-names>M</given-names></name><name><surname>Telesford</surname><given-names>QK</given-names></name><name><surname>Yu</surname><given-names>AB</given-names></name><name><surname>Kahn</surname><given-names>AE</given-names></name><name><surname>Medaglia</surname><given-names>JD</given-names></name><name><surname>Vettel</surname><given-names>JM</given-names></name><name><surname>Miller</surname><given-names>MB</given-names></name><name><surname>Grafton</surname><given-names>ST</given-names></name><name><surname>Bassett</surname><given-names>DS</given-names></name></person-group><year iso-8601-date="2015">2015</year><article-title>Controllability of structural brain networks</article-title><source>Nature Communications</source><volume>6</volume><elocation-id>8414</elocation-id><pub-id pub-id-type="doi">10.1038/ncomms9414</pub-id><pub-id pub-id-type="pmid">26423222</pub-id></element-citation></ref><ref id="bib31"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Guimerà</surname><given-names>R</given-names></name><name><surname>Nunes Amaral</surname><given-names>LA</given-names></name></person-group><year iso-8601-date="2005">2005</year><article-title>Functional cartography of complex metabolic networks</article-title><source>Nature</source><volume>433</volume><fpage>895</fpage><lpage>900</lpage><pub-id pub-id-type="doi">10.1038/nature03288</pub-id><pub-id pub-id-type="pmid">15729348</pub-id></element-citation></ref><ref id="bib32"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hansen</surname><given-names>JY</given-names></name><name><surname>Markello</surname><given-names>RD</given-names></name><name><surname>Vogel</surname><given-names>JW</given-names></name><name><surname>Seidlitz</surname><given-names>J</given-names></name><name><surname>Bzdok</surname><given-names>D</given-names></name><name><surname>Misic</surname><given-names>B</given-names></name></person-group><year iso-8601-date="2021">2021</year><article-title>Mapping gene transcription and neurocognition across human neocortex</article-title><source>Nature Human Behaviour</source><volume>5</volume><fpage>1240</fpage><lpage>1250</lpage><pub-id pub-id-type="doi">10.1038/s41562-021-01082-z</pub-id><pub-id pub-id-type="pmid">33767429</pub-id></element-citation></ref><ref id="bib33"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hansen</surname><given-names>JY</given-names></name><name><surname>Shafiei</surname><given-names>G</given-names></name><name><surname>Markello</surname><given-names>RD</given-names></name><name><surname>Smart</surname><given-names>K</given-names></name><name><surname>Cox</surname><given-names>SML</given-names></name><name><surname>Nørgaard</surname><given-names>M</given-names></name><name><surname>Beliveau</surname><given-names>V</given-names></name><name><surname>Wu</surname><given-names>Y</given-names></name><name><surname>Gallezot</surname><given-names>J-D</given-names></name><name><surname>Aumont</surname><given-names>É</given-names></name><name><surname>Servaes</surname><given-names>S</given-names></name><name><surname>Scala</surname><given-names>SG</given-names></name><name><surname>DuBois</surname><given-names>JM</given-names></name><name><surname>Wainstein</surname><given-names>G</given-names></name><name><surname>Bezgin</surname><given-names>G</given-names></name><name><surname>Funck</surname><given-names>T</given-names></name><name><surname>Schmitz</surname><given-names>TW</given-names></name><name><surname>Spreng</surname><given-names>RN</given-names></name><name><surname>Galovic</surname><given-names>M</given-names></name><name><surname>Koepp</surname><given-names>MJ</given-names></name><name><surname>Duncan</surname><given-names>JS</given-names></name><name><surname>Coles</surname><given-names>JP</given-names></name><name><surname>Fryer</surname><given-names>TD</given-names></name><name><surname>Aigbirhio</surname><given-names>FI</given-names></name><name><surname>McGinnity</surname><given-names>CJ</given-names></name><name><surname>Hammers</surname><given-names>A</given-names></name><name><surname>Soucy</surname><given-names>J-P</given-names></name><name><surname>Baillet</surname><given-names>S</given-names></name><name><surname>Guimond</surname><given-names>S</given-names></name><name><surname>Hietala</surname><given-names>J</given-names></name><name><surname>Bedard</surname><given-names>M-A</given-names></name><name><surname>Leyton</surname><given-names>M</given-names></name><name><surname>Kobayashi</surname><given-names>E</given-names></name><name><surname>Rosa-Neto</surname><given-names>P</given-names></name><name><surname>Ganz</surname><given-names>M</given-names></name><name><surname>Knudsen</surname><given-names>GM</given-names></name><name><surname>Palomero-Gallagher</surname><given-names>N</given-names></name><name><surname>Shine</surname><given-names>JM</given-names></name><name><surname>Carson</surname><given-names>RE</given-names></name><name><surname>Tuominen</surname><given-names>L</given-names></name><name><surname>Dagher</surname><given-names>A</given-names></name><name><surname>Misic</surname><given-names>B</given-names></name></person-group><year iso-8601-date="2022">2022</year><article-title>Mapping neurotransmitter systems to the structural and functional organization of the human neocortex</article-title><source>Nature Neuroscience</source><volume>25</volume><fpage>1569</fpage><lpage>1581</lpage><pub-id pub-id-type="doi">10.1038/s41593-022-01186-3</pub-id><pub-id pub-id-type="pmid">36303070</pub-id></element-citation></ref><ref id="bib34"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hohwy</surname><given-names>J</given-names></name><name><surname>Roepstorff</surname><given-names>A</given-names></name><name><surname>Friston</surname><given-names>K</given-names></name></person-group><year iso-8601-date="2008">2008</year><article-title>Predictive coding explains binocular rivalry: an epistemological review</article-title><source>Cognition</source><volume>108</volume><fpage>687</fpage><lpage>701</lpage><pub-id pub-id-type="doi">10.1016/j.cognition.2008.05.010</pub-id><pub-id pub-id-type="pmid">18649876</pub-id></element-citation></ref><ref id="bib35"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hohwy</surname><given-names>J</given-names></name></person-group><year iso-8601-date="2012">2012</year><article-title>Attention and conscious perception in the hypothesis testing brain</article-title><source>Frontiers in Psychology</source><volume>3</volume><elocation-id>96</elocation-id><pub-id pub-id-type="doi">10.3389/fpsyg.2012.00096</pub-id><pub-id pub-id-type="pmid">22485102</pub-id></element-citation></ref><ref id="bib36"><element-citation publication-type="book"><person-group person-group-type="author"><name><surname>Hohwy</surname><given-names>J</given-names></name></person-group><year iso-8601-date="2013">2013</year><source>The Predictive Mind</source><publisher-name>Oxford University Press</publisher-name><pub-id pub-id-type="doi">10.1093/acprof:oso/9780199682737.001.0001</pub-id></element-citation></ref><ref id="bib37"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hupé</surname><given-names>JM</given-names></name><name><surname>Lamirel</surname><given-names>C</given-names></name><name><surname>Lorenceau</surname><given-names>J</given-names></name></person-group><year iso-8601-date="2009">2009</year><article-title>Pupil dynamics during bistable motion perception</article-title><source>Journal of Vision</source><volume>9</volume><elocation-id>10</elocation-id><pub-id pub-id-type="doi">10.1167/9.7.10</pub-id><pub-id pub-id-type="pmid">19761325</pub-id></element-citation></ref><ref id="bib38"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jacob</surname><given-names>SN</given-names></name><name><surname>Nienborg</surname><given-names>H</given-names></name></person-group><year iso-8601-date="2018">2018</year><article-title>Monoaminergic neuromodulation of sensory processing</article-title><source>Frontiers in Neural Circuits</source><volume>12</volume><elocation-id>51</elocation-id><pub-id pub-id-type="doi">10.3389/fncir.2018.00051</pub-id><pub-id pub-id-type="pmid">30042662</pub-id></element-citation></ref><ref id="bib39"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Janitzky</surname><given-names>K</given-names></name><name><surname>Lippert</surname><given-names>MT</given-names></name><name><surname>Engelhorn</surname><given-names>A</given-names></name><name><surname>Tegtmeier</surname><given-names>J</given-names></name><name><surname>Goldschmidt</surname><given-names>J</given-names></name><name><surname>Heinze</surname><given-names>HJ</given-names></name><name><surname>Ohl</surname><given-names>FW</given-names></name></person-group><year iso-8601-date="2015">2015</year><article-title>Optogenetic silencing of locus coeruleus activity in mice impairs cognitive flexibility in an attentional set-shifting task</article-title><source>Frontiers in Behavioral Neuroscience</source><volume>9</volume><elocation-id>286</elocation-id><pub-id pub-id-type="doi">10.3389/fnbeh.2015.00286</pub-id><pub-id pub-id-type="pmid">26582980</pub-id></element-citation></ref><ref id="bib40"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>John</surname><given-names>YJ</given-names></name><name><surname>Sawyer</surname><given-names>KS</given-names></name><name><surname>Srinivasan</surname><given-names>K</given-names></name><name><surname>Müller</surname><given-names>EJ</given-names></name><name><surname>Munn</surname><given-names>BR</given-names></name><name><surname>Shine</surname><given-names>JM</given-names></name></person-group><year iso-8601-date="2022">2022</year><article-title>It’s about time: Linking dynamical systems with human neuroimaging to understand the brain</article-title><source>Network Neuroscience</source><volume>6</volume><fpage>960</fpage><lpage>979</lpage><pub-id pub-id-type="doi">10.1162/netn_a_00230</pub-id><pub-id pub-id-type="pmid">36875012</pub-id></element-citation></ref><ref id="bib41"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jolliffe</surname><given-names>IT</given-names></name></person-group><year iso-8601-date="1982">1982</year><article-title>A note on the use of principal components in regression</article-title><source>Applied Statistics</source><volume>31</volume><elocation-id>300</elocation-id><pub-id pub-id-type="doi">10.2307/2348005</pub-id></element-citation></ref><ref id="bib42"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jordan</surname><given-names>R</given-names></name><name><surname>Keller</surname><given-names>GB</given-names></name></person-group><year iso-8601-date="2023">2023</year><article-title>The locus coeruleus broadcasts prediction errors across the cortex to promote sensorimotor plasticity</article-title><source>eLife</source><volume>12</volume><elocation-id>85111</elocation-id><pub-id pub-id-type="doi">10.7554/eLife.85111.3</pub-id></element-citation></ref><ref id="bib43"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Joshi</surname><given-names>S</given-names></name><name><surname>Li</surname><given-names>Y</given-names></name><name><surname>Kalwani</surname><given-names>RM</given-names></name><name><surname>Gold</surname><given-names>JI</given-names></name></person-group><year iso-8601-date="2016">2016</year><article-title>Relationships between pupil diameter and neuronal activity in the locus coeruleus, colliculi, and cingulate cortex</article-title><source>Neuron</source><volume>89</volume><fpage>221</fpage><lpage>234</lpage><pub-id pub-id-type="doi">10.1016/j.neuron.2015.11.028</pub-id></element-citation></ref><ref id="bib44"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Joshi</surname><given-names>S</given-names></name><name><surname>Gold</surname><given-names>JI</given-names></name></person-group><year iso-8601-date="2020">2020</year><article-title>Pupil size as a window on neural substrates of cognition</article-title><source>Trends in Cognitive Sciences</source><volume>24</volume><fpage>466</fpage><lpage>480</lpage><pub-id pub-id-type="doi">10.1016/j.tics.2020.03.005</pub-id><pub-id pub-id-type="pmid">32331857</pub-id></element-citation></ref><ref id="bib45"><element-citation publication-type="confproc"><person-group person-group-type="author"><name><surname>Kingma</surname><given-names>DP</given-names></name><name><surname>Ba</surname><given-names>JL</given-names></name></person-group><year iso-8601-date="2015">2015</year><article-title>Adam: a method for stochastic optimization</article-title><conf-name>3rd Int. Conf. Learn. Represent. ICLR 2015 - Conf. Track Proc</conf-name><fpage>1</fpage><lpage>15</lpage></element-citation></ref><ref id="bib46"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kloosterman</surname><given-names>NA</given-names></name><name><surname>Meindertsma</surname><given-names>T</given-names></name><name><surname>van Loon</surname><given-names>AM</given-names></name><name><surname>Lamme</surname><given-names>VAF</given-names></name><name><surname>Bonneh</surname><given-names>YS</given-names></name><name><surname>Donner</surname><given-names>TH</given-names></name></person-group><year iso-8601-date="2015">2015</year><article-title>Pupil size tracks perceptual content and surprise</article-title><source>The European Journal of Neuroscience</source><volume>41</volume><fpage>1068</fpage><lpage>1078</lpage><pub-id pub-id-type="doi">10.1111/ejn.12859</pub-id><pub-id pub-id-type="pmid">25754528</pub-id></element-citation></ref><ref id="bib47"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kosciessa</surname><given-names>JQ</given-names></name><name><surname>Lindenberger</surname><given-names>U</given-names></name><name><surname>Garrett</surname><given-names>DD</given-names></name></person-group><year iso-8601-date="2021">2021</year><article-title>Thalamocortical excitability modulation guides human perception under uncertainty</article-title><source>Nature Communications</source><volume>12</volume><elocation-id>2430</elocation-id><pub-id pub-id-type="doi">10.1038/s41467-021-22511-7</pub-id><pub-id pub-id-type="pmid">33893294</pub-id></element-citation></ref><ref id="bib48"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>Y</given-names></name><name><surname>Rodenkirch</surname><given-names>C</given-names></name><name><surname>Moskowitz</surname><given-names>N</given-names></name><name><surname>Schriver</surname><given-names>B</given-names></name><name><surname>Wang</surname><given-names>Q</given-names></name></person-group><year iso-8601-date="2017">2017</year><article-title>Dynamic lateralization of pupil dilation evoked by locus coeruleus activation results from sympathetic, not parasympathetic, contributions</article-title><source>Cell Reports</source><volume>20</volume><fpage>3099</fpage><lpage>3112</lpage><pub-id pub-id-type="doi">10.1016/j.celrep.2017.08.094</pub-id><pub-id pub-id-type="pmid">28954227</pub-id></element-citation></ref><ref id="bib49"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Meng</surname><given-names>M</given-names></name><name><surname>Tong</surname><given-names>F</given-names></name></person-group><year iso-8601-date="2004">2004</year><article-title>Can attention selectively bias bistable perception? Differences between binocular rivalry and ambiguous figures</article-title><source>Journal of Vision</source><volume>4</volume><fpage>539</fpage><lpage>551</lpage><pub-id pub-id-type="doi">10.1167/4.7.2</pub-id><pub-id pub-id-type="pmid">15330700</pub-id></element-citation></ref><ref id="bib50"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Meunier</surname><given-names>D</given-names></name><name><surname>Lambiotte</surname><given-names>R</given-names></name><name><surname>Bullmore</surname><given-names>ET</given-names></name></person-group><year iso-8601-date="2010">2010</year><article-title>Modular and hierarchically modular organization of brain networks</article-title><source>Frontiers in Neuroscience</source><volume>4</volume><elocation-id>200</elocation-id><pub-id pub-id-type="doi">10.3389/fnins.2010.00200</pub-id><pub-id pub-id-type="pmid">21151783</pub-id></element-citation></ref><ref id="bib51"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Moran</surname><given-names>RJ</given-names></name><name><surname>Campo</surname><given-names>P</given-names></name><name><surname>Symmonds</surname><given-names>M</given-names></name><name><surname>Stephan</surname><given-names>KE</given-names></name><name><surname>Dolan</surname><given-names>RJ</given-names></name><name><surname>Friston</surname><given-names>KJ</given-names></name></person-group><year iso-8601-date="2013">2013</year><article-title>Free energy, precision and learning: the role of cholinergic neuromodulation</article-title><source>The Journal of Neuroscience</source><volume>33</volume><fpage>8227</fpage><lpage>8236</lpage><pub-id pub-id-type="doi">10.1523/JNEUROSCI.4255-12.2013</pub-id><pub-id pub-id-type="pmid">23658161</pub-id></element-citation></ref><ref id="bib52"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Müller</surname><given-names>EJ</given-names></name><name><surname>Munn</surname><given-names>BR</given-names></name><name><surname>Shine</surname><given-names>JM</given-names></name></person-group><year iso-8601-date="2020">2020</year><article-title>Diffuse neural coupling mediates complex network dynamics through the formation of quasi-critical brain states</article-title><source>Nature Communications</source><volume>11</volume><elocation-id>6337</elocation-id><pub-id pub-id-type="doi">10.1038/s41467-020-19716-7</pub-id><pub-id pub-id-type="pmid">33303766</pub-id></element-citation></ref><ref id="bib53"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Munn</surname><given-names>B</given-names></name><name><surname>Gong</surname><given-names>P</given-names></name></person-group><year iso-8601-date="2018">2018</year><article-title>Critical dynamics of natural time-varying images</article-title><source>Physical Review Letters</source><volume>121</volume><elocation-id>058101</elocation-id><pub-id pub-id-type="doi">10.1103/PhysRevLett.121.058101</pub-id><pub-id pub-id-type="pmid">30118263</pub-id></element-citation></ref><ref id="bib54"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Munn</surname><given-names>BR</given-names></name><name><surname>Müller</surname><given-names>EJ</given-names></name><name><surname>Wainstein</surname><given-names>G</given-names></name><name><surname>Shine</surname><given-names>JM</given-names></name></person-group><year iso-8601-date="2021">2021</year><article-title>The ascending arousal system shapes neural dynamics to mediate awareness of cognitive states</article-title><source>Nature Communications</source><volume>12</volume><fpage>1</fpage><lpage>9</lpage><pub-id pub-id-type="doi">10.1038/s41467-021-26268-x</pub-id></element-citation></ref><ref id="bib55"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Murphy</surname><given-names>PR</given-names></name><name><surname>Vandekerckhove</surname><given-names>J</given-names></name><name><surname>Nieuwenhuis</surname><given-names>S</given-names></name></person-group><year iso-8601-date="2014">2014</year><article-title>Pupil-linked arousal determines variability in perceptual decision making</article-title><source>PLOS Computational Biology</source><volume>10</volume><elocation-id>e1003854</elocation-id><pub-id pub-id-type="doi">10.1371/journal.pcbi.1003854</pub-id><pub-id pub-id-type="pmid">25232732</pub-id></element-citation></ref><ref id="bib56"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Murphy</surname><given-names>PR</given-names></name><name><surname>Boonstra</surname><given-names>E</given-names></name><name><surname>Nieuwenhuis</surname><given-names>S</given-names></name></person-group><year iso-8601-date="2016">2016</year><article-title>Global gain modulation generates time-dependent urgency during perceptual choice in humans</article-title><source>Nature Communications</source><volume>7</volume><elocation-id>13526</elocation-id><pub-id pub-id-type="doi">10.1038/ncomms13526</pub-id><pub-id pub-id-type="pmid">27882927</pub-id></element-citation></ref><ref id="bib57"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nieuwenhuis</surname><given-names>S</given-names></name><name><surname>Aston-Jones</surname><given-names>G</given-names></name><name><surname>Cohen</surname><given-names>JD</given-names></name></person-group><year iso-8601-date="2005">2005</year><article-title>Decision making, the P3, and the locus coeruleus-norepinephrine system</article-title><source>Psychological Bulletin</source><volume>131</volume><fpage>510</fpage><lpage>532</lpage><pub-id pub-id-type="doi">10.1037/0033-2909.131.4.510</pub-id><pub-id pub-id-type="pmid">16060800</pub-id></element-citation></ref><ref id="bib58"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Parr</surname><given-names>T</given-names></name><name><surname>Friston</surname><given-names>KJ</given-names></name></person-group><year iso-8601-date="2017">2017</year><article-title>Uncertainty, epistemics and active inference</article-title><source>Journal of the Royal Society, Interface</source><volume>14</volume><elocation-id>20170376</elocation-id><pub-id pub-id-type="doi">10.1098/rsif.2017.0376</pub-id><pub-id pub-id-type="pmid">29167370</pub-id></element-citation></ref><ref id="bib59"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Parr</surname><given-names>T</given-names></name><name><surname>Friston</surname><given-names>KJ</given-names></name></person-group><year iso-8601-date="2018">2018</year><article-title>The anatomy of inference: generative models and brain structure</article-title><source>Frontiers in Computational Neuroscience</source><volume>12</volume><elocation-id>90</elocation-id><pub-id pub-id-type="doi">10.3389/fncom.2018.00090</pub-id><pub-id pub-id-type="pmid">30483088</pub-id></element-citation></ref><ref id="bib60"><element-citation publication-type="confproc"><person-group person-group-type="author"><name><surname>Paszke</surname><given-names>A</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>Pytorch: An imperative style, high-performance deep learning library</article-title><conf-name>Proceedings of the 33rd International Conference on Neural Information Processing Systems</conf-name></element-citation></ref><ref id="bib61"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pfeffer</surname><given-names>T</given-names></name><name><surname>Keitel</surname><given-names>C</given-names></name><name><surname>Kluger</surname><given-names>DS</given-names></name><name><surname>Keitel</surname><given-names>A</given-names></name><name><surname>Russmann</surname><given-names>A</given-names></name><name><surname>Thut</surname><given-names>G</given-names></name><name><surname>Donner</surname><given-names>TH</given-names></name><name><surname>Gross</surname><given-names>J</given-names></name></person-group><year iso-8601-date="2022">2022</year><article-title>Coupling of pupil- and neuronal population dynamics reveals diverse influences of arousal on cortical processing</article-title><source>eLife</source><volume>11</volume><elocation-id>e71890</elocation-id><pub-id pub-id-type="doi">10.7554/eLife.71890</pub-id><pub-id pub-id-type="pmid">35133276</pub-id></element-citation></ref><ref id="bib62"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Power</surname><given-names>JD</given-names></name><name><surname>Mitra</surname><given-names>A</given-names></name><name><surname>Laumann</surname><given-names>TO</given-names></name><name><surname>Snyder</surname><given-names>AZ</given-names></name><name><surname>Schlaggar</surname><given-names>BL</given-names></name><name><surname>Petersen</surname><given-names>SE</given-names></name></person-group><year iso-8601-date="2014">2014</year><article-title>Methods to detect, characterize, and remove motion artifact in resting state fMRI</article-title><source>NeuroImage</source><volume>84</volume><fpage>320</fpage><lpage>341</lpage><pub-id pub-id-type="doi">10.1016/j.neuroimage.2013.08.048</pub-id><pub-id pub-id-type="pmid">23994314</pub-id></element-citation></ref><ref id="bib63"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Reimer</surname><given-names>J</given-names></name><name><surname>Froudarakis</surname><given-names>E</given-names></name><name><surname>Cadwell</surname><given-names>CR</given-names></name><name><surname>Yatsenko</surname><given-names>D</given-names></name><name><surname>Denfield</surname><given-names>GH</given-names></name><name><surname>Tolias</surname><given-names>AS</given-names></name></person-group><year iso-8601-date="2014">2014</year><article-title>Pupil fluctuations track fast switching of cortical states during quiet wakefulness</article-title><source>Neuron</source><volume>84</volume><fpage>355</fpage><lpage>362</lpage><pub-id pub-id-type="doi">10.1016/j.neuron.2014.09.033</pub-id><pub-id pub-id-type="pmid">25374359</pub-id></element-citation></ref><ref id="bib64"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Reimer</surname><given-names>J</given-names></name><name><surname>McGinley</surname><given-names>MJ</given-names></name><name><surname>Liu</surname><given-names>Y</given-names></name><name><surname>Rodenkirch</surname><given-names>C</given-names></name><name><surname>Wang</surname><given-names>Q</given-names></name><name><surname>McCormick</surname><given-names>DA</given-names></name><name><surname>Tolias</surname><given-names>AS</given-names></name></person-group><year iso-8601-date="2016">2016</year><article-title>Pupil fluctuations track rapid changes in adrenergic and cholinergic activity in cortex</article-title><source>Nature Communications</source><volume>7</volume><elocation-id>13289</elocation-id><pub-id pub-id-type="doi">10.1038/ncomms13289</pub-id><pub-id pub-id-type="pmid">27824036</pub-id></element-citation></ref><ref id="bib65"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Reynolds</surname><given-names>JH</given-names></name><name><surname>Heeger</surname><given-names>DJ</given-names></name></person-group><year iso-8601-date="2009">2009</year><article-title>The normalization model of attention</article-title><source>Neuron</source><volume>61</volume><fpage>168</fpage><lpage>185</lpage><pub-id pub-id-type="doi">10.1016/j.neuron.2009.01.002</pub-id><pub-id pub-id-type="pmid">19186161</pub-id></element-citation></ref><ref id="bib66"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Richards</surname><given-names>BA</given-names></name><name><surname>Lillicrap</surname><given-names>TP</given-names></name><name><surname>Beaudoin</surname><given-names>P</given-names></name><name><surname>Bengio</surname><given-names>Y</given-names></name><name><surname>Bogacz</surname><given-names>R</given-names></name><name><surname>Christensen</surname><given-names>A</given-names></name><name><surname>Clopath</surname><given-names>C</given-names></name><name><surname>Costa</surname><given-names>RP</given-names></name><name><surname>de Berker</surname><given-names>A</given-names></name><name><surname>Ganguli</surname><given-names>S</given-names></name><name><surname>Gillon</surname><given-names>CJ</given-names></name><name><surname>Hafner</surname><given-names>D</given-names></name><name><surname>Kepecs</surname><given-names>A</given-names></name><name><surname>Kriegeskorte</surname><given-names>N</given-names></name><name><surname>Latham</surname><given-names>P</given-names></name><name><surname>Lindsay</surname><given-names>GW</given-names></name><name><surname>Miller</surname><given-names>KD</given-names></name><name><surname>Naud</surname><given-names>R</given-names></name><name><surname>Pack</surname><given-names>CC</given-names></name><name><surname>Poirazi</surname><given-names>P</given-names></name><name><surname>Roelfsema</surname><given-names>P</given-names></name><name><surname>Sacramento</surname><given-names>J</given-names></name><name><surname>Saxe</surname><given-names>A</given-names></name><name><surname>Scellier</surname><given-names>B</given-names></name><name><surname>Schapiro</surname><given-names>AC</given-names></name><name><surname>Senn</surname><given-names>W</given-names></name><name><surname>Wayne</surname><given-names>G</given-names></name><name><surname>Yamins</surname><given-names>D</given-names></name><name><surname>Zenke</surname><given-names>F</given-names></name><name><surname>Zylberberg</surname><given-names>J</given-names></name><name><surname>Therien</surname><given-names>D</given-names></name><name><surname>Kording</surname><given-names>KP</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>A deep learning framework for neuroscience</article-title><source>Nature Neuroscience</source><volume>22</volume><fpage>1761</fpage><lpage>1770</lpage><pub-id pub-id-type="doi">10.1038/s41593-019-0520-2</pub-id><pub-id pub-id-type="pmid">31659335</pub-id></element-citation></ref><ref id="bib67"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rojas-Líbano</surname><given-names>D</given-names></name><name><surname>Wainstein</surname><given-names>G</given-names></name><name><surname>Carrasco</surname><given-names>X</given-names></name><name><surname>Aboitiz</surname><given-names>F</given-names></name><name><surname>Crossley</surname><given-names>N</given-names></name><name><surname>Ossandón</surname><given-names>T</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>A pupil size, eye-tracking and neuropsychological dataset from ADHD children during a cognitive task</article-title><source>Scientific Data</source><volume>6</volume><elocation-id>25</elocation-id><pub-id pub-id-type="doi">10.1038/s41597-019-0037-2</pub-id><pub-id pub-id-type="pmid">30975993</pub-id></element-citation></ref><ref id="bib68"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sales</surname><given-names>AC</given-names></name><name><surname>Friston</surname><given-names>KJ</given-names></name><name><surname>Jones</surname><given-names>MW</given-names></name><name><surname>Pickering</surname><given-names>AE</given-names></name><name><surname>Moran</surname><given-names>RJ</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>Locus Coeruleus tracking of prediction errors optimises cognitive flexibility: An Active Inference model</article-title><source>PLOS Computational Biology</source><volume>15</volume><elocation-id>e1006267</elocation-id><pub-id pub-id-type="doi">10.1371/journal.pcbi.1006267</pub-id><pub-id pub-id-type="pmid">30608922</pub-id></element-citation></ref><ref id="bib69"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Samuels</surname><given-names>ER</given-names></name><name><surname>Szabadi</surname><given-names>E</given-names></name></person-group><year iso-8601-date="2008">2008</year><article-title>Functional neuroanatomy of the noradrenergic locus coeruleus: its roles in the regulation of arousal and autonomic function part II: physiological and pharmacological manipulations and pathological alterations of locus coeruleus activity in humans</article-title><source>Current Neuropharmacology</source><volume>6</volume><fpage>254</fpage><lpage>285</lpage><pub-id pub-id-type="doi">10.2174/157015908785777193</pub-id><pub-id pub-id-type="pmid">19506724</pub-id></element-citation></ref><ref id="bib70"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sara</surname><given-names>SJ</given-names></name></person-group><year iso-8601-date="2009">2009</year><article-title>The locus coeruleus and noradrenergic modulation of cognition</article-title><source>Nature Reviews. Neuroscience</source><volume>10</volume><fpage>211</fpage><lpage>223</lpage><pub-id pub-id-type="doi">10.1038/nrn2573</pub-id><pub-id pub-id-type="pmid">19190638</pub-id></element-citation></ref><ref id="bib71"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sara</surname><given-names>SJ</given-names></name></person-group><year iso-8601-date="2015">2015</year><article-title>Locus Coeruleus in time with the making of memories</article-title><source>Current Opinion in Neurobiology</source><volume>35</volume><fpage>87</fpage><lpage>94</lpage><pub-id pub-id-type="doi">10.1016/j.conb.2015.07.004</pub-id><pub-id pub-id-type="pmid">26241632</pub-id></element-citation></ref><ref id="bib72"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Servan-schreiber</surname><given-names>AD</given-names></name></person-group><year iso-8601-date="2016">2016</year><article-title>Reports a network model of catecholamine effects: gain</article-title><source>Signal-to-Noise Ratio, and Behavior</source><volume>249</volume><fpage>892</fpage><lpage>895</lpage><pub-id pub-id-type="doi">10.1126/science.2392679</pub-id></element-citation></ref><ref id="bib73"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shine</surname><given-names>JM</given-names></name><name><surname>Bissett</surname><given-names>PG</given-names></name><name><surname>Bell</surname><given-names>PT</given-names></name><name><surname>Koyejo</surname><given-names>O</given-names></name><name><surname>Balsters</surname><given-names>JH</given-names></name><name><surname>Gorgolewski</surname><given-names>KJ</given-names></name><name><surname>Moodie</surname><given-names>CA</given-names></name><name><surname>Poldrack</surname><given-names>RA</given-names></name></person-group><year iso-8601-date="2016">2016</year><article-title>The dynamics of functional brain networks: integrated network states during cognitive task performance</article-title><source>Neuron</source><volume>92</volume><fpage>544</fpage><lpage>554</lpage><pub-id pub-id-type="doi">10.1016/j.neuron.2016.09.018</pub-id><pub-id pub-id-type="pmid">27693256</pub-id></element-citation></ref><ref id="bib74"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shine</surname><given-names>JM</given-names></name><name><surname>Aburn</surname><given-names>MJ</given-names></name><name><surname>Breakspear</surname><given-names>M</given-names></name><name><surname>Poldrack</surname><given-names>RA</given-names></name></person-group><year iso-8601-date="2018">2018</year><article-title>The modulation of neural gain facilitates a transition between functional segregation and integration in the brain</article-title><source>eLife</source><volume>7</volume><elocation-id>e31130</elocation-id><pub-id pub-id-type="doi">10.7554/eLife.31130</pub-id><pub-id pub-id-type="pmid">29376825</pub-id></element-citation></ref><ref id="bib75"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shine</surname><given-names>JM</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>Neuromodulatory influences on integration and segregation in the brain</article-title><source>Trends in Cognitive Sciences</source><volume>23</volume><fpage>572</fpage><lpage>583</lpage><pub-id pub-id-type="doi">10.1016/j.tics.2019.04.002</pub-id><pub-id pub-id-type="pmid">31076192</pub-id></element-citation></ref><ref id="bib76"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shine</surname><given-names>JM</given-names></name><name><surname>Hearne</surname><given-names>LJ</given-names></name><name><surname>Breakspear</surname><given-names>M</given-names></name><name><surname>Hwang</surname><given-names>K</given-names></name><name><surname>Müller</surname><given-names>EJ</given-names></name><name><surname>Sporns</surname><given-names>O</given-names></name><name><surname>Poldrack</surname><given-names>RA</given-names></name><name><surname>Mattingley</surname><given-names>JB</given-names></name><name><surname>Cocchi</surname><given-names>L</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>The low-dimensional neural architecture of cognitive complexity is related to activity in medial thalamic nuclei</article-title><source>Neuron</source><volume>104</volume><fpage>849</fpage><lpage>855</lpage><pub-id pub-id-type="doi">10.1016/j.neuron.2019.09.002</pub-id><pub-id pub-id-type="pmid">31653463</pub-id></element-citation></ref><ref id="bib77"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shine</surname><given-names>JM</given-names></name><name><surname>Müller</surname><given-names>EJ</given-names></name><name><surname>Munn</surname><given-names>B</given-names></name><name><surname>Cabral</surname><given-names>J</given-names></name><name><surname>Moran</surname><given-names>RJ</given-names></name><name><surname>Breakspear</surname><given-names>M</given-names></name></person-group><year iso-8601-date="2021">2021</year><article-title>Computational models link cellular mechanisms of neuromodulation to large-scale neural dynamics</article-title><source>Nature Neuroscience</source><volume>24</volume><fpage>765</fpage><lpage>776</lpage><pub-id pub-id-type="doi">10.1038/s41593-021-00824-6</pub-id><pub-id pub-id-type="pmid">33958801</pub-id></element-citation></ref><ref id="bib78"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Song</surname><given-names>HF</given-names></name><name><surname>Yang</surname><given-names>GR</given-names></name><name><surname>Wang</surname><given-names>XJ</given-names></name></person-group><year iso-8601-date="2016">2016</year><article-title>Training excitatory-inhibitory recurrent neural networks for cognitive tasks: a simple and flexible framework</article-title><source>PLOS Computational Biology</source><volume>12</volume><elocation-id>e1004792</elocation-id><pub-id pub-id-type="doi">10.1371/journal.pcbi.1004792</pub-id><pub-id pub-id-type="pmid">26928718</pub-id></element-citation></ref><ref id="bib79"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stöttinger</surname><given-names>E</given-names></name><name><surname>Filipowicz</surname><given-names>A</given-names></name><name><surname>Valadao</surname><given-names>D</given-names></name><name><surname>Culham</surname><given-names>JC</given-names></name><name><surname>Goodale</surname><given-names>MA</given-names></name><name><surname>Anderson</surname><given-names>B</given-names></name><name><surname>Danckert</surname><given-names>J</given-names></name></person-group><year iso-8601-date="2015">2015</year><article-title>A cortical network that marks the moment when conscious representations are updated</article-title><source>Neuropsychologia</source><volume>79</volume><fpage>113</fpage><lpage>122</lpage><pub-id pub-id-type="doi">10.1016/j.neuropsychologia.2015.10.037</pub-id><pub-id pub-id-type="pmid">26529489</pub-id></element-citation></ref><ref id="bib80"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stöttinger</surname><given-names>E</given-names></name><name><surname>Sepahvand</surname><given-names>NM</given-names></name><name><surname>Danckert</surname><given-names>J</given-names></name><name><surname>Anderson</surname><given-names>B</given-names></name></person-group><year iso-8601-date="2016">2016</year><article-title>Assessing perceptual change with an ambiguous figures task: Normative data for 40 standard picture sets</article-title><source>Behavior Research Methods</source><volume>48</volume><fpage>201</fpage><lpage>222</lpage><pub-id pub-id-type="doi">10.3758/s13428-015-0564-5</pub-id></element-citation></ref><ref id="bib81"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sussillo</surname><given-names>D</given-names></name><name><surname>Barak</surname><given-names>O</given-names></name></person-group><year iso-8601-date="2013">2013</year><article-title>Opening the black box: low-dimensional dynamics in high-dimensional recurrent neural networks</article-title><source>Neural Computation</source><volume>25</volume><fpage>626</fpage><lpage>649</lpage><pub-id pub-id-type="doi">10.1162/NECO_a_00409</pub-id><pub-id pub-id-type="pmid">23272922</pub-id></element-citation></ref><ref id="bib82"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sussillo</surname><given-names>D</given-names></name></person-group><year iso-8601-date="2014">2014</year><article-title>Neural circuits as computational dynamical systems</article-title><source>Current Opinion in Neurobiology</source><volume>25</volume><fpage>156</fpage><lpage>163</lpage><pub-id pub-id-type="doi">10.1016/j.conb.2014.01.008</pub-id><pub-id pub-id-type="pmid">24509098</pub-id></element-citation></ref><ref id="bib83"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Szabadi</surname><given-names>E</given-names></name></person-group><year iso-8601-date="2018">2018</year><article-title>Functional organization of the sympathetic pathways controlling the pupil: light-inhibited and light-stimulated pathways</article-title><source>Frontiers in Neurology</source><volume>9</volume><elocation-id>1069</elocation-id><pub-id pub-id-type="doi">10.3389/fneur.2018.01069</pub-id><pub-id pub-id-type="pmid">30619035</pub-id></element-citation></ref><ref id="bib84"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Taylor</surname><given-names>NL</given-names></name><name><surname>D’Souza</surname><given-names>A</given-names></name><name><surname>Munn</surname><given-names>BR</given-names></name><name><surname>Lv</surname><given-names>J</given-names></name><name><surname>Zaborszky</surname><given-names>L</given-names></name><name><surname>Müller</surname><given-names>EJ</given-names></name><name><surname>Wainstein</surname><given-names>G</given-names></name><name><surname>Calamante</surname><given-names>F</given-names></name><name><surname>Shine</surname><given-names>JM</given-names></name></person-group><year iso-8601-date="2022">2022</year><article-title>Structural connections between the noradrenergic and cholinergic system shape the dynamics of functional brain networks</article-title><source>NeuroImage</source><volume>260</volume><elocation-id>119455</elocation-id><pub-id pub-id-type="doi">10.1016/j.neuroimage.2022.119455</pub-id><pub-id pub-id-type="pmid">35809888</pub-id></element-citation></ref><ref id="bib85"><element-citation publication-type="preprint"><person-group person-group-type="author"><name><surname>Thura</surname><given-names>D</given-names></name><name><surname>Cabana</surname><given-names>JF</given-names></name><name><surname>Feghaly</surname><given-names>A</given-names></name><name><surname>Cisek</surname><given-names>P</given-names></name></person-group><year iso-8601-date="2020">2020</year><article-title>Unified neural dynamics of decisions and actions in the cerebral cortex and basal ganglia</article-title><source>bioRxiv</source><pub-id pub-id-type="doi">10.1101/2020.10.22.350280</pub-id></element-citation></ref><ref id="bib86"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tkačik</surname><given-names>G</given-names></name><name><surname>Mora</surname><given-names>T</given-names></name><name><surname>Marre</surname><given-names>O</given-names></name><name><surname>Amodei</surname><given-names>D</given-names></name><name><surname>Palmer</surname><given-names>SE</given-names></name><name><surname>Berry</surname><given-names>MJ</given-names></name><name><surname>Bialek</surname><given-names>W</given-names></name></person-group><year iso-8601-date="2015">2015</year><article-title>Thermodynamics and signatures of criticality in a network of neurons</article-title><source>PNAS</source><volume>112</volume><fpage>11508</fpage><lpage>11513</lpage><pub-id pub-id-type="doi">10.1073/pnas.1514188112</pub-id><pub-id pub-id-type="pmid">26330611</pub-id></element-citation></ref><ref id="bib87"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Totah</surname><given-names>NKB</given-names></name><name><surname>Logothetis</surname><given-names>NK</given-names></name><name><surname>Eschenko</surname><given-names>O</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>Noradrenergic ensemble-based modulation of cognition over multiple timescales</article-title><source>Brain Research</source><volume>1709</volume><fpage>50</fpage><lpage>66</lpage><pub-id pub-id-type="doi">10.1016/j.brainres.2018.12.031</pub-id><pub-id pub-id-type="pmid">30586547</pub-id></element-citation></ref><ref id="bib88"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Urai</surname><given-names>AE</given-names></name><name><surname>Braun</surname><given-names>A</given-names></name><name><surname>Donner</surname><given-names>TH</given-names></name></person-group><year iso-8601-date="2017">2017</year><article-title>Pupil-linked arousal is driven by decision uncertainty and alters serial choice bias</article-title><source>Nature Communications</source><volume>8</volume><elocation-id>14637</elocation-id><pub-id pub-id-type="doi">10.1038/ncomms14637</pub-id><pub-id pub-id-type="pmid">28256514</pub-id></element-citation></ref><ref id="bib89"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>van Ee</surname><given-names>R</given-names></name></person-group><year iso-8601-date="2005">2005</year><article-title>Dynamics of perceptual bi-stability for stereoscopic slant rivalry and a comparison with grating, house-face, and Necker cube rivalry</article-title><source>Vision Research</source><volume>45</volume><fpage>29</fpage><lpage>40</lpage><pub-id pub-id-type="doi">10.1016/j.visres.2004.07.039</pub-id><pub-id pub-id-type="pmid">15571736</pub-id></element-citation></ref><ref id="bib90"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vincent</surname><given-names>P</given-names></name><name><surname>Parr</surname><given-names>T</given-names></name><name><surname>Benrimoh</surname><given-names>D</given-names></name><name><surname>Friston</surname><given-names>KJ</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>With an eye on uncertainty: Modelling pupillary responses to environmental volatility</article-title><source>PLOS Computational Biology</source><volume>15</volume><elocation-id>e1007126</elocation-id><pub-id pub-id-type="doi">10.1371/journal.pcbi.1007126</pub-id><pub-id pub-id-type="pmid">31276488</pub-id></element-citation></ref><ref id="bib91"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vyas</surname><given-names>S</given-names></name><name><surname>Golub</surname><given-names>MD</given-names></name><name><surname>Sussillo</surname><given-names>D</given-names></name><name><surname>Shenoy</surname><given-names>KV</given-names></name></person-group><year iso-8601-date="2020">2020</year><article-title>Computation through neural population dynamics</article-title><source>Annual Review of Neuroscience</source><volume>43</volume><fpage>249</fpage><lpage>275</lpage><pub-id pub-id-type="doi">10.1146/annurev-neuro-092619-094115</pub-id><pub-id pub-id-type="pmid">32640928</pub-id></element-citation></ref><ref id="bib92"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wainstein</surname><given-names>G</given-names></name><name><surname>Rojas-Líbano</surname><given-names>D</given-names></name><name><surname>Crossley</surname><given-names>NA</given-names></name><name><surname>Carrasco</surname><given-names>X</given-names></name><name><surname>Aboitiz</surname><given-names>F</given-names></name><name><surname>Ossandón</surname><given-names>T</given-names></name></person-group><year iso-8601-date="2017">2017</year><article-title>Pupil size tracks attentional performance in attention-deficit/hyperactivity disorder</article-title><source>Scientific Reports</source><volume>7</volume><elocation-id>8228</elocation-id><pub-id pub-id-type="doi">10.1038/s41598-017-08246-w</pub-id><pub-id pub-id-type="pmid">28811624</pub-id></element-citation></ref><ref id="bib93"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wainstein</surname><given-names>G</given-names></name><name><surname>Rojas-Líbano</surname><given-names>D</given-names></name><name><surname>Medel</surname><given-names>V</given-names></name><name><surname>Alnæs</surname><given-names>D</given-names></name><name><surname>Kolskår</surname><given-names>KK</given-names></name><name><surname>Endestad</surname><given-names>T</given-names></name><name><surname>Laeng</surname><given-names>B</given-names></name><name><surname>Ossandon</surname><given-names>T</given-names></name><name><surname>Crossley</surname><given-names>N</given-names></name><name><surname>Matar</surname><given-names>E</given-names></name><name><surname>Shine</surname><given-names>JM</given-names></name></person-group><year iso-8601-date="2021">2021</year><article-title>The ascending arousal system promotes optimal performance through mesoscale network integration in a visuospatial attentional task</article-title><source>Network Neuroscience</source><volume>5</volume><fpage>890</fpage><lpage>910</lpage><pub-id pub-id-type="doi">10.1162/netn_a_00205</pub-id><pub-id pub-id-type="pmid">35024535</pub-id></element-citation></ref><ref id="bib94"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wainstein</surname><given-names>G</given-names></name><name><surname>Müller</surname><given-names>EJ</given-names></name><name><surname>Taylor</surname><given-names>N</given-names></name><name><surname>Munn</surname><given-names>B</given-names></name><name><surname>Shine</surname><given-names>JM</given-names></name></person-group><year iso-8601-date="2022">2022</year><article-title>The role of the locus coeruleus in shaping adaptive cortical melodies</article-title><source>Trends in Cognitive Sciences</source><volume>26</volume><fpage>527</fpage><lpage>538</lpage><pub-id pub-id-type="doi">10.1016/j.tics.2022.03.006</pub-id></element-citation></ref><ref id="bib95"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>XJ</given-names></name></person-group><year iso-8601-date="2002">2002</year><article-title>Probabilistic decision making by slow reverberation in cortical circuits</article-title><source>Neuron</source><volume>36</volume><fpage>955</fpage><lpage>968</lpage><pub-id pub-id-type="doi">10.1016/s0896-6273(02)01092-9</pub-id><pub-id pub-id-type="pmid">12467598</pub-id></element-citation></ref><ref id="bib96"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Weilnhammer</surname><given-names>V</given-names></name><name><surname>Stuke</surname><given-names>H</given-names></name><name><surname>Hesselmann</surname><given-names>G</given-names></name><name><surname>Sterzer</surname><given-names>P</given-names></name><name><surname>Schmack</surname><given-names>K</given-names></name></person-group><year iso-8601-date="2017">2017</year><article-title>A predictive coding account of bistable perception - a model-based fMRI study</article-title><source>PLOS Computational Biology</source><volume>13</volume><elocation-id>e1005536</elocation-id><pub-id pub-id-type="doi">10.1371/journal.pcbi.1005536</pub-id><pub-id pub-id-type="pmid">28505152</pub-id></element-citation></ref><ref id="bib97"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Werbos</surname><given-names>PJ</given-names></name></person-group><year iso-8601-date="1990">1990</year><article-title>Backpropagation through time: what it does and how to do it</article-title><source>Proceedings of the IEEE</source><volume>78</volume><fpage>1550</fpage><lpage>1560</lpage><pub-id pub-id-type="doi">10.1109/5.58337</pub-id></element-citation></ref><ref id="bib98"><element-citation publication-type="software"><person-group person-group-type="author"><name><surname>Whyte</surname><given-names>C</given-names></name><name><surname>Wainstein</surname><given-names>G</given-names></name><name><surname>Shine</surname><given-names>M</given-names></name></person-group><year iso-8601-date="2025">2025</year><data-title>AmbiguousFigures</data-title><version designator="swh:1:rev:dea15598a833ff6fbfc71eb4968b4a249048cc4a">swh:1:rev:dea15598a833ff6fbfc71eb4968b4a249048cc4a</version><source>Software Heritage</source><ext-link ext-link-type="uri" xlink:href="https://archive.softwareheritage.org/swh:1:dir:d17bc559488ca5af5711e3cd3d7cb046725cbdf8;origin=https://github.com/ShineLabUSYD/AmbiguousFigures;visit=swh:1:snp:c711f4618649c4e5176551f1238ab7173422964c;anchor=swh:1:rev:dea15598a833ff6fbfc71eb4968b4a249048cc4a">https://archive.softwareheritage.org/swh:1:dir:d17bc559488ca5af5711e3cd3d7cb046725cbdf8;origin=https://github.com/ShineLabUSYD/AmbiguousFigures;visit=swh:1:snp:c711f4618649c4e5176551f1238ab7173422964c;anchor=swh:1:rev:dea15598a833ff6fbfc71eb4968b4a249048cc4a</ext-link></element-citation></ref><ref id="bib99"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wong</surname><given-names>K-F</given-names></name><name><surname>Wang</surname><given-names>X-J</given-names></name></person-group><year iso-8601-date="2006">2006</year><article-title>A recurrent network mechanism of time integration in perceptual decisions</article-title><source>The Journal of Neuroscience</source><volume>26</volume><fpage>1314</fpage><lpage>1328</lpage><pub-id pub-id-type="doi">10.1523/JNEUROSCI.3733-05.2006</pub-id><pub-id pub-id-type="pmid">16436619</pub-id></element-citation></ref><ref id="bib100"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname><given-names>GR</given-names></name><name><surname>Wang</surname><given-names>XJ</given-names></name></person-group><year iso-8601-date="2020">2020</year><article-title>Artificial neural networks for neuroscientists: a primer</article-title><source>Neuron</source><volume>107</volume><fpage>1048</fpage><lpage>1070</lpage><pub-id pub-id-type="doi">10.1016/j.neuron.2020.09.005</pub-id><pub-id pub-id-type="pmid">32970997</pub-id></element-citation></ref><ref id="bib101"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yarkoni</surname><given-names>T</given-names></name><name><surname>Poldrack</surname><given-names>RA</given-names></name><name><surname>Nichols</surname><given-names>TE</given-names></name><name><surname>Van Essen</surname><given-names>DC</given-names></name><name><surname>Wager</surname><given-names>TD</given-names></name></person-group><year iso-8601-date="2011">2011</year><article-title>Large-scale automated synthesis of human functional neuroimaging data</article-title><source>Nature Methods</source><volume>8</volume><fpage>665</fpage><lpage>670</lpage><pub-id pub-id-type="doi">10.1038/nmeth.1635</pub-id><pub-id pub-id-type="pmid">21706013</pub-id></element-citation></ref><ref id="bib102"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zerbi</surname><given-names>V</given-names></name><name><surname>Floriou-Servou</surname><given-names>A</given-names></name><name><surname>Markicevic</surname><given-names>M</given-names></name><name><surname>Vermeiren</surname><given-names>Y</given-names></name><name><surname>Sturman</surname><given-names>O</given-names></name><name><surname>Privitera</surname><given-names>M</given-names></name><name><surname>von Ziegler</surname><given-names>L</given-names></name><name><surname>Ferrari</surname><given-names>KD</given-names></name><name><surname>Weber</surname><given-names>B</given-names></name><name><surname>De Deyn</surname><given-names>PP</given-names></name><name><surname>Wenderoth</surname><given-names>N</given-names></name><name><surname>Bohacek</surname><given-names>J</given-names></name></person-group><year iso-8601-date="2019">2019</year><article-title>Rapid reconfiguration of the functional connectome after chemogenetic locus coeruleus activation</article-title><source>SSRN Electronic Journal</source><volume>1</volume><elocation-id>34983</elocation-id><pub-id pub-id-type="doi">10.2139/ssrn.3334983</pub-id></element-citation></ref></ref-list></back><sub-article article-type="editor-report" id="sa0"><front-stub><article-id pub-id-type="doi">10.7554/eLife.93191.4.sa0</article-id><title-group><article-title>eLife Assessment</article-title></title-group><contrib-group><contrib contrib-type="author"><name><surname>Donner</surname><given-names>Tobias H</given-names></name><role specific-use="editor">Reviewing Editor</role><aff><institution>University Medical Center Hamburg-Eppendorf</institution><country>Germany</country></aff></contrib></contrib-group><kwd-group kwd-group-type="evidence-strength"><kwd>Solid</kwd></kwd-group><kwd-group kwd-group-type="claim-importance"><kwd>Valuable</kwd></kwd-group></front-stub><body><p>This <bold>valuable</bold> article explores the idea that transient modulations of neural gain promote switches between distinct perceptual interpretations of ambiguous stimuli. The authors provide <bold>solid</bold> evidence for this idea by pupillometry (an indirect proxy of neuromodulatory activity), fMRI, neural network modelling, and dynamical systems analyses. The highly integrative nature of this approach is rare in the field.</p></body></sub-article><sub-article article-type="referee-report" id="sa1"><front-stub><article-id pub-id-type="doi">10.7554/eLife.93191.4.sa1</article-id><title-group><article-title>Reviewer #1 (Public review):</article-title></title-group><contrib-group><contrib contrib-type="author"><anonymous/><role specific-use="referee">Reviewer</role></contrib></contrib-group></front-stub><body><p>Summary:</p><p>This paper proposes a neural mechanism underlying the perception of ambiguous images: neuromodulation changes the gain of neural circuits promoting a switch between two possible percepts. Converging evidence for this is provided by indirect measurements of neuromodulatory activity and large-scale brain dynamics which are linked by a neural network model. However, both the data analysis as well as the computational modeling are incomplete and would benefit from a more rigorous approach.</p><p>This is a revised version of the manuscript which, in my view, is a considerable step forward compared to the original submission.</p><p>In particular, the authors now model phasic gain changes in the RNN, based on the network's uncertainty. This is original and much closer to what is suggested by the phasic pupil responses. They also show that switching is actually a network effect because switching times depend on network configuration (Fig 2). This resolves my main comments 1 and 2 about the model.</p><p>The mechanism, as I understand it, is different from what the authors described before in the RNN with tonic gain changes. As uncertainty increases, the network enters a regime in which the two excitatory populations start to oscillate. My intuition is that this oscillation arises from the feedback loop created by the new gain control mechanism. If my intuition is correct, I think it would be worth to explain this mechanism in the paper more explicitly.</p><p>Comments on revisions:</p><p>This is a second revision. I have no further comments. The authors have not answered the question that I had in the previous round (about the origin of oscillations in the RNN). I think this topic deserves to be explored in more detail but perhaps that is beyond the scope of the current paper.</p></body></sub-article><sub-article article-type="referee-report" id="sa2"><front-stub><article-id pub-id-type="doi">10.7554/eLife.93191.4.sa2</article-id><title-group><article-title>Reviewer #2 (Public review):</article-title></title-group><contrib-group><contrib contrib-type="author"><anonymous/><role specific-use="referee">Reviewer</role></contrib></contrib-group></front-stub><body><p>This paper tests the hypothesis that perceptual switches during the presentation of ambiguous stimuli are accompanied by changes in neuromodulation that alter neural gain and trigger abrupt changes in brain activity. To test this hypothesis, the study combines pupillometry, artificial recurrent network (RNN) analysis and fMRI recording. In particular, the study uses methods of energy landscape analysis inspired by physics, which is particularly interesting.</p><p>Strengths</p><p>- The authors should be commended for combining different methods (pupillometry, RNNs, fMRI) to test their hypothesis. This combination provides a mechanistic insight into perceptual switches in the brain and artificial neural networks.</p><p>- The study combines different viewpoints and fields of scientific literature, including neuroscience, psychology, physics, dynamical systems. In order to make this combination more accessible to the reader, the different aspects are presented in a pedagogical way to be accessible to all fields.</p><p>- This combination of methods and viewpoints is rarely done, so it is very useful.</p><p>- The authors introduce dynamic gain modulation in their recurrent neural network, which is novel. They devote a section of the paper to studying the dynamics, fixed points and convergence of this type of network.</p><p>Weaknesses</p><p>- The study may not be specific to perceptual switches. This is because the study relies on a paradigm in which participants report when they identify a switch in the item category. Therefore, it is unclear whether the effects reported in the paper are related to the perceptual switch itself, to attention, or to the detection of behaviourally relevant events. The authors are cautious and explicitly acknowledge this point in their study.</p><p>- The demonstration of the causal role of gain modulation in perceptual switches is partial. This causality is clearly demonstrated in the simulation work with the RNN. However, it is not fully demonstrated in the pupil analysis and the fMRI analysis. One reason is that this work is correlative (which is already very informative).</p><p>- Some effects may reflect the expectation of a perceptual switch rather than the perceptual switch itself. To mitigate this risk, the design of the fMRI task included catch trials, in which no switch occurs, to reduce the expectation of a switch. The pupil study, however, did not include such catch trials.</p><p>- The paper uses RNN-based modelling to provide mechanistic insight into the role of gain modulation in perceptual switches. However, the RNN solves a task that differs from that performed by human participants, which may limit the explanatory value of the model. The RNN is provided with two inputs characterising the sensory evidence supporting the first and last image category in the sequence (e.g. plane and shark). In contrast, observers in the task don't know in advance the identity of the last image at the beginning of the sequence. The brain first receives sensory evidence about the image category (e.g. plane) with which the sequence begins, which is very easy to recognise, then it sees a sequence of morphed images and has to discover what the final image category will be. To discover the final image category, the brain considers several possibilities for the second images (it is a shark?, a frog?, a bird?, etc.), rather than comparing the likelihood of just two categories. This search process among many alternatives and the perceptual switch in the task is therefore different from the competition between only two inputs in the RNN.</p><p>- Another aspect of the motivation for the RNN model remains unclear. The authors introduce dynamic gain modulation in the RNN, but it is not clear what the added value of dynamic gain modulation is. Both static (Fig. S1) and dynamic (Fig. 2F) gain modulation lead to the predicted effect: faster switching when the gain is larger.</p><p>- The authors are to be commended for addressing their research questions with multiple tools and approaches. There are links between the different parts of the study. The RNN and the pupil are linked by the notion of gain modulation, the RNN and the fMRI analysis are linked by the study of the energy landscape, the fMRI study and the pupil study are indirectly linked by previous work for this group showing that the peak in LC fMRI activity precedes a flattening of the energy landscape. These links are very interesting but could have been stronger and more complete.</p><p>Comments on revisions:</p><p>I thank the authors for their responses.</p><p>My review presents points that the authors themselves present as weaknesses or limitations. It also includes points that cannot be addressed in a revision (e.g. causality).</p><p>Regarding the fact that the RNN only considers two categories, whereas subjects consider more categories (because they don't know the final image), I have toned down my remark (removing &quot;markedly&quot; different, removing the fact that the hypothesis space is vast given that participants have some priors). I also removed the qualifier &quot;mechanistically&quot; different, because it can be understood in different ways. The point remains that the proposed model has 2 inputs, the corresponding network in the brain has &gt;2 inputs (because it considers more categories than the RNN), which is different, and which is the point of my remark. I think it may limit the value of the model, but I don't think it is not &quot;sensible&quot;.</p></body></sub-article><sub-article article-type="author-comment" id="sa3"><front-stub><article-id pub-id-type="doi">10.7554/eLife.93191.4.sa3</article-id><title-group><article-title>Author response</article-title></title-group><contrib-group><contrib contrib-type="author"><name><surname>Wainstein</surname><given-names>Gabriel</given-names></name><role specific-use="author">Author</role><aff><institution>University of Sydney</institution><addr-line><named-content content-type="city">Sydney</named-content></addr-line><country>Australia</country></aff></contrib><contrib contrib-type="author"><name><surname>Whyte</surname><given-names>Christopher</given-names></name><role specific-use="author">Author</role><aff><institution>University of Sydney</institution><addr-line><named-content content-type="city">Sydney</named-content></addr-line><country>Australia</country></aff></contrib><contrib contrib-type="author"><name><surname>Ehgoetz Martens</surname><given-names>Kaylena A</given-names></name><role specific-use="author">Author</role><aff><institution>University of Waterloo</institution><addr-line><named-content content-type="city">Waterloo</named-content></addr-line><country>Canada</country></aff></contrib><contrib contrib-type="author"><name><surname>Muller</surname><given-names>Eli</given-names></name><role specific-use="author">Author</role><aff><institution>University of Sydney</institution><addr-line><named-content content-type="city">Sydney</named-content></addr-line><country>Australia</country></aff></contrib><contrib contrib-type="author"><name><surname>Medel</surname><given-names>Vicente</given-names></name><role specific-use="author">Author</role><aff><institution>Adolfo Ibáñez University</institution><addr-line><named-content content-type="city">Santiago</named-content></addr-line><country>Chile</country></aff></contrib><contrib contrib-type="author"><name><surname>Anderson</surname><given-names>Britt</given-names></name><role specific-use="author">Author</role><aff><institution>University of Waterloo</institution><addr-line><named-content content-type="city">Waterloo</named-content></addr-line><country>Canada</country></aff></contrib><contrib contrib-type="author"><name><surname>Stöttinger</surname><given-names>Elisabeth</given-names></name><role specific-use="author">Author</role><aff><institution>Hochschule Fresenius</institution><addr-line><named-content content-type="city">Köln</named-content></addr-line><country>Germany</country></aff></contrib><contrib contrib-type="author"><name><surname>Danckert</surname><given-names>James</given-names></name><role specific-use="author">Author</role><aff><institution>University of Waterloo</institution><addr-line><named-content content-type="city">Waterloo</named-content></addr-line><country>Canada</country></aff></contrib><contrib contrib-type="author"><name><surname>Munn</surname><given-names>Brandon</given-names></name><role specific-use="author">Author</role><aff><institution>University of Sydney</institution><addr-line><named-content content-type="city">Sydney</named-content></addr-line><country>Australia</country></aff></contrib><contrib contrib-type="author"><name><surname>Shine</surname><given-names>James M</given-names></name><role specific-use="author">Author</role><aff><institution>University of Sydney</institution><addr-line><named-content content-type="city">Sydney</named-content></addr-line><country>Australia</country></aff></contrib></contrib-group></front-stub><body><p>The following is the authors’ response to the previous reviews</p><disp-quote content-type="editor-comment"><p><bold>Reviewer #1 (Public r</bold>eview):</p><p>The mechanism, as I understand it, is different from what the authors described before in the RNN with tonic gain changes. As uncertainty increases, the network enters a regime in which the two excitatory populations start to oscillate. My intuition is that this oscillation arises from the feedback loop created by the new gain control mechanism. If my intuition is correct, I think it would be worth to explain this mechanism in the paper more explicitly.</p></disp-quote><p>While interesting, this intuition is not correct. The oscillations are generated by the interaction between excitatory and inhibitory nodes in the network and occur in the model even with stationary gain. All of the plots in figure 3 exploring the dynamical regime of the network at different input x gain combinations (i.e., where the oscillatory regime is characterised) are simulations run with stationary gain.</p><p>To ensure that this intuition is more clearly presented in the manuscript, we have edited the description in the text.</p><p>P. 12: “Because of the large size of the network, we could not solve for the fixed points or study their stability analytically. Instead, we opted for a numerical approach and characterised the dynamical regime (i.e. the location and existence of approximate fixed-point attractors) across all combinations of (static) gain and visited by the network.”</p><disp-quote content-type="editor-comment"><p><bold>Reviewer #2 (Public review):</bold></p><p>- The demonstration of the causal role of gain modulation in perceptual switches is partial. This causality is clearly demonstrated in the simulation work with the RNN. However, it is not fully demonstrated in the pupil analysis and the fMRI analysis. One reason is that this work is correlative (which is already very informative). An analysis of the timing of the effect might have overcome this limitation. For example, in a previous study, the same group showed that fMRI activity in the LC region precedes changes in the energy landscape of fMRI dynamics, which is a step towards investigating causal links between gain modulation, changes in the energy landscape and perceptual switches.</p></disp-quote><p>Thank you for the suggestion, which we considered in detail. Unfortunately, the temporal and spatial resolution of the fMRI data collected for this study precluded the same analyses we’ve run in previous work, however this is an important question for future work.</p><disp-quote content-type="editor-comment"><p>- Some effects may reflect the expectation of a perceptual switch rather than the perceptual switch itself. To mitigate this risk, the design of the fMRI task included catch trials, in which no switch occurs, to reduce the expectation of a switch. The pupil study, however, did not include such catch trials.</p></disp-quote><p>We agree that this is a limitation of the current study, which we previously highlighted in the methods section.</p><disp-quote content-type="editor-comment"><p>- The paper uses RNN-based modelling to provide mechanistic insight into the role of gain modulation in perceptual switches. However, the RNN solves a task that differs markedly from that performed by human participants, which may limit the explanatory value of the model. The RNN is provided with two inputs characterising the sensory evidence supporting the first and last image category in the sequence (e.g. plane and shark). In contrast, observers in the task were naïve as to the identity of the last image at the beginning of the sequence. The brain first receives sensory evidence about the image category (e.g. plane) with which the sequence begins, which is very easy to recognise, then it sees a sequence of morphed images and has to discover what the final image category will be. To discover the final image category, the brain has to search a vast space of possible second images (it is a shark?, a frog?, a bird?, etc.), rather than comparing the likelihood of just two categories. This search process and the perceptual switch in the task appear to be mechanistically different from the competition between two inputs in the RNN.</p></disp-quote><p>We appreciate the critical analysis of the experimental paradigm but disagree with the reviewers conclusions for two keys reasons: (1) Participants prior exposure to the images, such that they could create an expectation about what stimulus category a particular image would transition into (i.e., the image could not switch into any possible category); and (2) even if the reviewers’ concern was founded, models of <italic>K</italic> winner-take-all decision making are structured identically irrespective of whether the options are 2 or <italic>K</italic> options all that changes is the simulated reaction times which depend linearly on the K (for an example model see Hugh Wilson’s textbook Spikes, Decisions, and Actions, 1999, p.89-91). For these reasons, we maintain that the RNN is a sensible representation of the behavioural task.</p><disp-quote content-type="editor-comment"><p>- Another aspect of the motivation for the RNN model remains unclear. The authors introduce dynamic gain modulation in the RNN, but it is not clear what the added value of dynamic gain modulation is. Both static (Fig. S1) and dynamic (Fig. 2F) gain modulation lead to the predicted effect: faster switching when the gain is larger.</p></disp-quote><p>While we agree that the effect is observable with both static and dynamic gain, the stronger construct validity associated with the dynamic approach, including a stronger link with the observed pupil dynamics and a rich literature associated with modelling the behavioural consequences of surprise/uncertainty led us to the conclusion that the dynamical approach was a better representation of our hypothesis.</p><disp-quote content-type="editor-comment"><p>- Fig 1C: I don't see a &quot;top grey bar&quot; indicating significance.</p></disp-quote><p>Thank you for catching this, the caption has been amended. The text was from an older version of the manuscript.</p><disp-quote content-type="editor-comment"><p>- p. 10, reference to fig 3F seems incorrect: there is Fig 3F upper and Fig 3F lower, and nothing on Fig 3 and its legend mention the lesion of units</p></disp-quote><p>This has been amended. We meant to refer to 2F.</p><disp-quote content-type="editor-comment"><p>- In the response letter you mention a MATLAB tutorial, but I could not find it.</p></disp-quote><p>This has been amended. Github repository can be found at <ext-link ext-link-type="uri" xlink:href="https://github.com/ShineLabUSYD/AmbiguousFigures">https://github.com/ShineLabUSYD/AmbiguousFigures</ext-link></p></body></sub-article></article>