<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Neural Circuits</journal-id>
<journal-title>Frontiers in Neural Circuits</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Neural Circuits</abbrev-journal-title>
<issn pub-type="epub">1662-5110</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fncir.2025.1615232</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Neuroscience</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Feedforward extraction of behaviorally significant information by neocortical columns</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author"><name><surname>Favorov</surname> <given-names>Oleg V.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1759628/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Kursun</surname> <given-names>Olcay</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2974317/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Lampe Joint Department of Biomedical Engineering, North Carolina State University (in collaboration with University of North Carolina at Chapel Hill)</institution>, <addr-line>Raleigh, NC</addr-line>, <country>United States</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Computer Science and Computer Information Systems, Auburn University at Montgomery</institution>, <addr-line>Montgomery, AL</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0002">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/7806/overview">Ju Lu</ext-link>, Lehigh University, United States</p>
</fn>
<fn fn-type="edited-by" id="fn0003">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2290/overview">Stephen D. Van Hooser</ext-link>, Brandeis University, United States</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2665284/overview">Yunyan Ding</ext-link>, University of California, Irvine, United States</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Olcay Kursun, <email>olcaykursun@gmail.com</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>07</day>
<month>10</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>19</volume>
<elocation-id>1615232</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>04</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>08</day>
<month>09</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Favorov and Kursun.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Favorov and Kursun</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Neurons throughout the neocortex exhibit selective sensitivity to particular features of sensory input patterns. According to the prevailing views, the cortical strategy is to choose features that exhibit a predictable relationship to their spatial and/or temporal context. Such contextually predictable features likely make explicit the causal factors operating in the environment and thus they are likely to have perceptual/behavioral utility. The known details of functional architecture of cortical columns suggest that cortical extraction of such features is a modular nonlinear operation, in which the input layer, layer 4, performs an initial nonlinear input transform generating proto-features, followed by their linear integration into output features by the basal dendrites of pyramidal cells in the upper layers. Tuning of pyramidal cells to contextually predictable features is guided by the contextual inputs their apical dendrites receive from other cortical columns via long-range horizontal or feedback connections. Our implementation of this strategy in a model of a prototypical V1 cortical column, trained on natural images, reveals the presence of a limited number of contextually predictable orthogonal basis features in the image patterns appearing in the column&#x2019;s receptive field. Upper-layer cells generate an overcomplete Hadamard-like representation of these basis features: i.e., each cell carries information about all basis features, but with each basis feature contributing either positively or negatively in the pattern unique to that cell. In tuning selectively to contextually predictable features, upper layers perform selective filtering of the information they receive from layer 4, emphasizing information about orderly aspects of the sensed environment and downplaying local, likely to be insignificant or distracting, information. 
Altogether, the upper-layer output preserves fine discrimination capabilities while acquiring novel higher-order categorization abilities to cluster together input patterns that are different but, in some way, environmentally related. We find that to be fully effective, our feature tuning operation requires collective participation of cells across 7 minicolumns, together making up a functionally defined 150&#x202F;&#x03BC;m diameter &#x201C;mesocolumn.&#x201D; Similarly to real V1 cortex, 80% of model upper-layer cells acquire complex-cell receptive field properties while 20% acquire simple-cell properties. Overall, the design of the model and its emergent properties are fully consistent with the known properties of cortical organization. Thus, in conclusion, our feature-extracting circuit might capture the core operation performed by cortical columns in their feedforward extraction of perceptually and behaviorally significant information.</p>
</abstract>
<kwd-group>
<kwd>visual cortex</kwd>
<kwd>layer 4</kwd>
<kwd>layer 3</kwd>
<kwd>complex cells</kwd>
<kwd>minicolumn</kwd>
<kwd>model</kwd>
<kwd>predictive coding</kwd>
</kwd-group>
<contract-num rid="cn1">2435093</contract-num>
<contract-sponsor id="cn1">National Science Foundation<named-content content-type="fundref-id">10.13039/100000001</named-content></contract-sponsor>
<contract-sponsor id="cn2">J. Scott McFadyen Fund for Excellence in Parkinson&#x2019;s Disease Research</contract-sponsor>
<counts>
<fig-count count="13"/>
<table-count count="0"/>
<equation-count count="26"/>
<ref-count count="91"/>
<page-count count="21"/>
<word-count count="18982"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>In artificial intelligence, to quote <xref ref-type="bibr" rid="ref69">Ritter (2003)</xref>, &#x201C;A first and very important step in many pattern recognition and information processing tasks is the identification or construction of a reasonably small set of important features in which the essential information for the task is concentrated.&#x201D; The concept of stimulus feature tuning is also fundamental to neuroscience. It is widely accepted that neurons throughout the cerebral cortex exhibit highly selective sensitivity to particular features of peripheral stimuli and such tuning defines neurons&#x2019; information representational identities (<xref ref-type="bibr" rid="ref23">DiCarlo and Cox, 2007</xref>). Across cortical areas, neurons tune to stimulus features that vary greatly in their complexity. Starting from the primary sensory cortical areas and up each stream of successive areas, neurons gradually increase their receptive field sizes, become more selective to spatiotemporal stimulus patterns in their receptive fields (RFs), and also develop selective invariances (<xref ref-type="bibr" rid="ref32">Felleman and Van Essen, 1991</xref>; <xref ref-type="bibr" rid="ref67">Riesenhuber and Poggio, 1999</xref>).</p>
<p>A generally supported <xref ref-type="bibr" rid="ref62">Mountcastle&#x2019;s (1978)</xref> conjecture is that such progressive elaboration of feature tuning properties is accomplished by recursive application of essentially the same computational operation, performed by a series of cortical columns on their afferent inputs (<xref ref-type="bibr" rid="ref66">Phillips and Singer, 1997</xref>). However, the nature of this hypothesized operation, as well as the nature of the extracted features, is poorly understood. Neurons acquire their mature feature-tuning properties to a large degree by learning from experience, using lower-level features provided by their afferent inputs to build higher-level ones. Technically, a feature is a mathematical transfer function over a set of afferent inputs to a neuron (or to a node in an artificial neural network). Each neuron has to select (learn) some useful transfer function. However, this can be a challenging task. In high-level cortical areas that are closely engaged in shaping the behavior, the neurons&#x2019; tuning to stimulus features can, in principle, be guided directly by their more or less obvious behavioral utility. But for early sensory areas, the identity of low-level stimulus features that would be behaviorally useful &#x2013; as building blocks enabling the construction of high-level behaviorally significant features &#x2013; and thus worth extracting is far from clear. Such low-level features might be too far removed from actual behavior for a criterion of &#x201C;behavioral usefulness&#x201D; to be of practical use in their selection, at least initially during early postnatal cortical development. Instead, selection of such features would have to rely on some local signs promising their eventual usefulness.</p>
<p>The prevailing consensus, which emerged in the 1990s, is that such local signs of tentative features&#x2019; potential usefulness can come from the spatial and/or temporal context in which these features occur (<xref ref-type="bibr" rid="ref3">Barlow, 1992</xref>; <xref ref-type="bibr" rid="ref6">Becker and Hinton, 1992</xref>; <xref ref-type="bibr" rid="ref5">Becker, 1996</xref>; <xref ref-type="bibr" rid="ref81">Stone, 1996</xref>; <xref ref-type="bibr" rid="ref19">de Sa and Ballard, 1998</xref>; <xref ref-type="bibr" rid="ref66">Phillips and Singer, 1997</xref>; <xref ref-type="bibr" rid="ref39">Hawkins and Blakeslee, 2004</xref>; <xref ref-type="bibr" rid="ref30">Favorov and Ryder, 2004</xref>). According to this idea, local but ultimately behaviorally useful features should be the ones that can be predictably related to other such features, either preceding or following them in time or taking place side-by-side with them. Thus, neurons should choose features for their ability to predict and be predictable from other such features. Predictive relations exist among features extracted from non-overlapping sensory inputs because they do reflect order present in the environment. Thus, contextually predictable features are signatures of causal factors operating in the individual&#x2019;s environment, which might be relevant to the individual&#x2019;s interactions with its environment and therefore worth tuning to (<xref ref-type="bibr" rid="ref66">Phillips and Singer, 1997</xref>; <xref ref-type="bibr" rid="ref72">Ryder and Favorov, 2001</xref>; <xref ref-type="bibr" rid="ref30">Favorov and Ryder, 2004</xref>; <xref ref-type="bibr" rid="ref71">Ryder, 2004</xref>).</p>
<p>While this proposal is straightforward at the conceptual level, its actual algorithmic and neural implementational details &#x2013; which ultimately establish its biological feasibility &#x2013; are lacking and need fleshing out. In Section 2 of this paper, we use the known details of cortical functional architecture as guiding constraints to formulate a biologically realistic, algorithmically explicit computational model for contextually guided feature tuning in cortical columns. This model allows us to devise a version of multi-view canonical correlation analysis to explicitly extract shared contextual information from neighboring cortical columns, estimate its dimensionality, and compute the principal axes (basis vectors) of the space of contextually predictable features of input patterns occurring in a cortical column&#x2019;s RF. In Section 3, we apply this methodology to natural images to reveal the information space of contextually predictable features available to a column in the primary visual area, V1. We train our cortical model in Section 3 on visual inputs obtained from natural images and demonstrate that the model&#x2019;s neurons are highly capable of tuning to contextually predictable nonlinear features despite using only Hebbian synaptic plasticity. The model neurons learn close to all theoretically available contextually predictable features, and these features are found to be similar to those of neurons in the cat V1.</p>
<p>The demonstrated feature tuning effectiveness and biological realism of the model suggest that it might capture the core operation performed by cortical columns in their feedforward extraction of perceptually and behaviorally significant information. In a related paper (<xref ref-type="bibr" rid="ref50">Kursun et al., 2024</xref>), we demonstrate that convolutional neural networks (CNN) trained using contextual guidance can perform better than deep CNN, which are trained using error-backpropagation, on visual and hyperspectral imaging tasks, tactile texture discrimination, or text classification.</p>
</sec>
<sec id="sec2">
<label>2</label>
<title>Theoretical model specification</title>
<sec id="sec3">
<label>2.1</label>
<title>Contextual guidance in cortical layer 3</title>
<p>Cerebral cortex is a complex dynamical system dominated by feedback circuits, but we limit our exploration to the feed-forward component of this system, which endows neurons with their identity-defining so-called &#x201C;classical&#x201D; RFs and feature-tuning properties. We further confine our exploration to the central pathway in the feed-forward elaboration of cortical neurons&#x2019; properties, which proceeds through a repeating sequence of two cortical layers. Cortical layer 4 (L4) is the principal initial recipient of the feed-forward afferent input to a cortical area. L4 converts that input into a new form and sends it, in particular, to layer 3 (L3) of the same cortical area for its feature-extraction operation. The product of that L3 operation is then sent to L4 of the next cortical area, where the same two-stage feature-extracting operation is repeated, but on a higher level, building on the advances made by the preceding cortical area (<xref ref-type="bibr" rid="ref70">Rockland and Pandya, 1979</xref>; <xref ref-type="bibr" rid="ref32">Felleman and Van Essen, 1991</xref>; <xref ref-type="bibr" rid="ref15">Callaway, 2004</xref>).</p>
<p>In addition to their afferent input from L4, L3 neurons receive extensive contextual input via long-range horizontal connections from surrounding columns up to several millimeters away from their resident column (<xref ref-type="bibr" rid="ref35">Gilbert and Wiesel, 1983</xref>; <xref ref-type="bibr" rid="ref22">DeFelipe et al., 1986</xref>; <xref ref-type="bibr" rid="ref57">Lund et al., 1993</xref>; <xref ref-type="bibr" rid="ref13">Burton and Fabri, 1995</xref>). These contextual inputs are expected to guide L3 neurons to the sources of mutual information in these two, afferent and contextual, input sets (<xref ref-type="bibr" rid="ref66">Phillips and Singer, 1997</xref>). Two principally different kinds of such sources are possible. First, the two input sets might have partially overlapping RFs; in other words, they might share some neurons along their afferent pathways in common. Such an <italic>internal</italic> source of mutual information in the two sets is trivial and has to be avoided. Second, the afferent and contextual input sets might be impacted by the same environmental agent. Such an <italic>external</italic> source of mutual information has the potential of being behaviorally significant and therefore worthy of recognition. One way to ensure that mutual information in the two input sets comes from external sources is to use inputs with non-overlapping RFs. Indeed, long-range horizontal connections come from far enough to have non-overlapping RFs but are close enough to reflect the same distal variables in the engaged environment.</p>
<p>The value of the feature (<italic>&#x03C6;</italic>) extracted by the <italic>i<sup>th</sup></italic> L3 cell is computed from the afferent inputs to its resident cortical column <italic>m</italic>, as in <xref ref-type="disp-formula" rid="EQ1">Equation 1</xref>:</p>
<disp-formula id="EQ1">
<label>(1)</label>
<mml:math id="M1">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mover accent="true">
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M2">
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is the chosen feature-specific transfer function, and <inline-formula>
<mml:math id="M3">
<mml:mover accent="true">
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> is a vector of activities of all the afferent axons innervating column <italic>m</italic>. According to the contextual guidance proposal, the function <inline-formula>
<mml:math id="M4">
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is chosen so as to maximize correlation of <inline-formula>
<mml:math id="M5">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> with the &#x201C;best&#x201D; function <inline-formula>
<mml:math id="M6">
<mml:msub>
<mml:mi>g</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> over features extracted in other, surrounding columns and delivered via long-range horizontal connections, as in <xref ref-type="disp-formula" rid="EQ2">Equation 2</xref>:</p>
<disp-formula id="EQ2">
<label>(2)</label>
<mml:math id="M7">
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo>arg</mml:mo>
<mml:munder>
<mml:mo>max</mml:mo>
<mml:msub>
<mml:mi>g</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
</mml:munder>
<mml:mspace width="0.33em"/>
<mml:mtext mathvariant="italic">corr</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
<mml:mo>;</mml:mo>
<mml:msub>
<mml:mi>g</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>&#x03C6;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mtext mathvariant="italic">context</mml:mtext>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p>where <italic>corr</italic> is Pearson&#x2019;s correlation coefficient, and <inline-formula>
<mml:math id="M8">
<mml:msub>
<mml:mover accent="true">
<mml:mi>&#x03C6;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mtext mathvariant="italic">context</mml:mtext>
</mml:msub>
<mml:mspace width="0.25em"/>
</mml:math>
</inline-formula>is a vector of all available L3 contextual features combined.</p>
<p>Since different neurons in a column should extract different features, we should elaborate the choice of the feature-extracting transfer function <inline-formula>
<mml:math id="M9">
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> for a single neuron <italic>i</italic> in column <italic>m</italic>: the choice is to maximize correlation of <inline-formula>
<mml:math id="M10">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> with the &#x201C;best&#x201D; function <inline-formula>
<mml:math id="M11">
<mml:msub>
<mml:mi>g</mml:mi>
<mml:mi mathvariant="italic">mi</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> over features in other columns, subject to the constraint that correlation of this feature with features computed by other neurons in the <italic>same</italic> layer in the <italic>same</italic> column should not be excessive.</p>
<p>It should be noted that features extracted by cortical neurons &#x2013; especially in high-level cortical areas &#x2013; are highly nonlinear functions of peripheral patterns of receptor activations. No recursive application of linear transform functions would be able on its own to produce such features. Cortical neurons must be able to use nonlinear transfer functions. However, experience-driven learning of nonlinear transfer functions in neural networks can be highly problematic, unless a kernel-based strategy is used. Kernel methods, popular in machine learning, offer a highly effective strategy for dealing with nonlinear problems by transforming the input space into a new &#x201C;feature&#x201D; space where a nonlinear problem becomes linear and thus more tractable with efficient linear techniques (<xref ref-type="bibr" rid="ref75">Sch&#x00F6;lkopf and Smola, 2002</xref>). According to <xref ref-type="bibr" rid="ref28">Favorov and Kursun (2011)</xref>, such a kernel-based function linearization strategy happens to be used in the neocortex in its principal input layer, layer 4. This insight suggests that cortical columns first perform a nonlinear function-linearization transform of their afferent inputs in L4 and then learn linear transform functions in L3.</p>
</sec>
<sec id="sec4">
<label>2.2</label>
<title>Layer 4 pluripotent function linearization</title>
<p>An important feature of L4 functional architecture is the presence of untuned feed-forward inhibition, which reflects the overall strength of the stimulus activating a local L4 network but is insensitive &#x2013; invariant &#x2013; to spatial details of the stimulus patterns (<xref ref-type="bibr" rid="ref51">Kyriazi et al., 1996</xref>; <xref ref-type="bibr" rid="ref10">Bruno and Simons, 2002</xref>; <xref ref-type="bibr" rid="ref84">Swadlow, 2003</xref>; <xref ref-type="bibr" rid="ref40">Hirsch et al., 2003</xref>; <xref ref-type="bibr" rid="ref83">Sun et al., 2006</xref>; <xref ref-type="bibr" rid="ref17">Cruikshank et al., 2007</xref>). <xref ref-type="bibr" rid="ref28">Favorov and Kursun (2011)</xref> showed that the presence of such untuned feed-forward inhibition converts a conventional neural network into a functional analog of Radial Basis Function (RBF) networks (<xref ref-type="bibr" rid="ref55">Lowe, 2003</xref>), which are well known for their universal function approximation and linearization capabilities (<xref ref-type="bibr" rid="ref64">Park and Sandberg, 1991</xref>; <xref ref-type="bibr" rid="ref47">Kurkov&#x00E1;, 2003</xref>). Input transforms performed by such networks automatically linearize a broad repertoire of nonlinear functions over the afferent inputs. This capacity for pluripotent function linearization suggests that L4 can contribute importantly to cortical feature extraction by performing such a transform of afferent inputs to a cortical column that makes it possible for neurons in the other layers of the column, including L3, to extract nonlinear features of afferent inputs using mostly linear operations.</p>
<p>A biologically realistic and highly effective pluripotent function linearizer has the following ingredients (<xref ref-type="disp-formula" rid="EQ3">Equation 3</xref>): (1) activity of each excitatory L4 cell is computed, in part, as a weighted sum of its afferent inputs, which are Hebbian; (2) lateral interconnections among L4 cells are used to diversify the afferent connectional patterns among L4 cells in a cortical column and give them a rich variety of RF properties; and (3) feed-forward inhibition makes L4 cells behave similarly to RBF units and is principally responsible for function linearization capabilities. Following <xref ref-type="bibr" rid="ref28">Favorov and Kursun (2011)</xref>, we describe L4 operation as:</p>
<disp-formula id="EQ3">
<label>(3)</label>
<mml:math id="M12">
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">[</mml:mo>
<mml:munder>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mi>j</mml:mi>
</mml:munder>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>&#x03BB;</mml:mi>
<mml:munder>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mi>k</mml:mi>
</mml:munder>
<mml:mo stretchy="true">(</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x03B8;</mml:mi>
<mml:msqrt>
<mml:mrow>
<mml:munder>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mi>j</mml:mi>
</mml:munder>
<mml:msubsup>
<mml:mi>a</mml:mi>
<mml:mi>j</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:msqrt>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
</mml:msup>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M13">
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mspace width="0.25em"/>
</mml:math>
</inline-formula>is the activity of L4 neuron <italic>i</italic>; <italic>a<sub>j</sub></italic> is the activity of afferent input neuron <italic>j</italic>; <italic>w<sub>i,j</sub></italic> is the weight, or efficacy, of the excitatory synaptic connection from afferent neuron <italic>j</italic> to L4 neuron <italic>i</italic>; <inline-formula>
<mml:math id="M14">
<mml:mi>&#x03BB;</mml:mi>
</mml:math>
</inline-formula> is a lateral connection scaling constant; <inline-formula>
<mml:math id="M15">
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mspace width="0.25em"/>
</mml:math>
</inline-formula>is the activity of a neighboring L4 neuron <italic>k</italic>; <inline-formula>
<mml:math id="M16">
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> is the correlation coefficient between activities of L4 neurons <italic>i</italic> and <italic>k</italic>; <italic>&#x03B8;</italic> is a feed-forward inhibition scaling constant; and [&#x00B7;]<sup>+</sup> indicates that if the quantity in the brackets is negative, the value is to be taken as zero.</p>
<p>In the presence of both feed-forward inhibition and plastic lateral connections, which are unique to L4 in that higher correlation in firings of the pre- and post-synaptic cells leads to a decrease &#x2013; rather than an increase &#x2013; in synaptic strength (<xref ref-type="bibr" rid="ref24">Egger et al., 1999</xref>; <xref ref-type="bibr" rid="ref73">S&#x00E1;ez and Friedlander, 2009</xref>), a modeled network of L4 neurons, trained on visual inputs, develops biologically accurate diversity of multi-subfield RFs and acquires orientation tuning matching in sharpness that of real L4 neurons, as well as a host of other real L4 functional properties (<xref ref-type="bibr" rid="ref28">Favorov and Kursun, 2011</xref>).</p>
<p>In the above L4 model, neurons accomplish their pluripotent function linearization by acting in local groups. To explain, consider a local group of L4 neurons that are innervated by a common set of afferent neurons. Together, such a set of <italic>N</italic> convergent afferent neurons can be viewed as defining an abstract <italic>N</italic>-dimensional afferent input state space, each dimension corresponding to one of the constituent afferent neurons. A targeted L4 neuron <italic>i</italic> takes a particular direction in this afferent space (defined by the vector of its afferent connection weights <inline-formula>
<mml:math id="M17">
<mml:msub>
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> in <xref ref-type="disp-formula" rid="EQ3">Equation 3</xref>) as its conic RBF center. Neighboring L4 neurons innervated by the same set of afferent neurons choose different RBF centers (i.e., different <inline-formula>
<mml:math id="M18">
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula>) in their common afferent space, influenced in their choices by lateral interactions with each other. Together, a local group of L4 neurons will spread their RBF centers evenly throughout their common afferent space so as to map it most efficiently, with more active regions of that space mapped at higher resolution (<xref ref-type="bibr" rid="ref20">Deco and Obradovic, 1995</xref>). A wide range of nonlinear functions defined over this space &#x2013; including transfer functions that can extract contextually predictable features &#x2013; can then be approximated by weighted sums of the activities of the mapping L4 neurons.</p>
<p>What is the size of such RBF-network-like local groups of L4 neurons that together can perform pluripotent function linearizations? Although it is limited, anatomical evidence based on typical sizes of afferent axon arborizations in L4 and the lateral spread of dendrites and axon collaterals of L4 cells within the confines of L4 suggests that such groups should be larger than a minicolumn (i.e., &#x003E;50&#x202F;&#x03BC;m in diameter) but smaller than a macrocolumn (i.e., &#x003C;500&#x202F;&#x03BC;m). We will refer to such intermediate-size function-linearizing columns in this paper as <italic>mesocolumns</italic>.</p>
<p>Structurally, minicolumns are the radially oriented cords of neuronal cell bodies evident in Nissl-stained sections of the cerebral cortex (<xref ref-type="bibr" rid="ref62">Mountcastle, 1978</xref>; <xref ref-type="bibr" rid="ref14">Buxhoeveden and Casanova, 2002</xref>). They are the narrowest (~50&#x202F;&#x03BC;m diameter) columnar aggregates of neurons in the neocortex (<xref ref-type="bibr" rid="ref25">Favorov and Diamond, 1990</xref>; <xref ref-type="bibr" rid="ref87">Tommerdahl et al., 1993</xref>) and thus can be viewed as the smallest building blocks of cortical columnar organization (<xref ref-type="bibr" rid="ref62">Mountcastle, 1978</xref>). Published estimates of L4 cell densities in visual and somatosensory cortical areas (<xref ref-type="bibr" rid="ref4">Beaulieu and Colonnier, 1983</xref>; <xref ref-type="bibr" rid="ref12">Budd, 2000</xref>; <xref ref-type="bibr" rid="ref58">Markram et al., 2015</xref>; <xref ref-type="bibr" rid="ref61">Meyer et al., 2010</xref>) suggest that a single minicolumn has between 30 and 60 excitatory L4 neurons. Such a number is clearly not enough for a functionally useful RBF mapping of a minicolumn&#x2019;s afferent space.</p>
<p>Minicolumns are packed together in the cortex in an essentially hexagonal pattern. From a geometric perspective, the next larger-size columnar entity to consider is a group of 7 minicolumns, one surrounded by 6 others. Such columns will be 3 minicolumns wide and thus ~150&#x202F;&#x03BC;m in diameter. They will have between 200 and 400 excitatory L4 neurons. In Section 3 we will show that such numbers of L4 neurons are sufficient for the purposes of contextually predictable feature extraction in L3. We propose that, based on the available evidence, such groupings of 7 minicolumns are the most plausible candidates for the role of function-linearizing mesocolumns (<xref ref-type="fig" rid="fig1">Figure 1</xref>). A group of 7 such mesocolumns, in turn, makes the next larger-size columnar entity ~450&#x202F;&#x03BC;m in diameter, corresponding in size to the well-known macrocolumns (<xref ref-type="bibr" rid="ref63">Mountcastle, 1997</xref>).</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Mesocolumn-based feature extraction in the neocortex. <bold>(A)</bold> Connectional diagram. <bold>(B)</bold> Minicolumnar composition and RF of a mesocolumn. <bold>(C)</bold> Mesocolumnar composition and RF of a macrocolumn. The smallest structural units of neocortical columnar organization are <italic>minicolumns</italic>, comprising neurons whose bodies line up in ~50&#x202F;&#x03BC;m diameter radially oriented stacks separated by radially oriented bundles of axons and apical dendrites. Neurons residing in neighboring minicolumns are not functionally isolated but make up larger-size functional aggregates. This paper explores the feature extracting capabilities of aggregates that span local groups of 7 minicolumns, referred to as <italic>mesocolumns</italic>. The L4 and L3 compartments of three such mesocolumns, taken from monkey somatosensory cortex, are shown in panel <bold>(A)</bold>, each revealing multiple vertical stacks of Nissl-stained neurons. Neighboring mesocolumns receive their input <inline-formula>
<mml:math id="M19">
<mml:mover accent="true">
<mml:mi>a</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> from partially overlapping sets of afferent neurons and thus from partially overlapping RFs. In panel <bold>(B)</bold>, a mesocolumn is shown schematically as a hexagonally packed group of 7 minicolumns (black filled circles). It is estimated to contain 200&#x2013;400 excitatory cells in each of its L4 and L3 compartments. In the primary visual cortex, a mesocolumn&#x2019;s RF in natural images would correspond to an approximately 16 pixel diameter circle (<xref ref-type="bibr" rid="ref28">Favorov and Kursun, 2011</xref>). L4 cells in a mesocolumn act together as a group in performing a pluripotent function-linearizing transform of their RF input patterns. Neurons in the L3 compartment of a mesocolumn receive their afferent input from L4 cells residing not only in their own but also in neighboring mesocolumns <bold>(A)</bold>. Such a larger group of 7 mesocolumns, feeding the central mesocolumn&#x2019;s L3 neurons, is shown in panel <bold>(C)</bold> schematically as an ~450&#x202F;&#x03BC;m diameter <italic>macrocolumn</italic>. Since RFs of L4 compartments of these 7 mesocolumns are partially shifted (as shown), the overall RF of a mesocolumn&#x2019;s L3 compartment is expanded to an approximately 21 pixel diameter circle. L3 neurons in a mesocolumn respond to diverse features of input patterns appearing in their mesocolumn&#x2019;s RF, together converting the mesocolumn&#x2019;s afferent input vector <inline-formula>
<mml:math id="M20">
<mml:mover accent="true">
<mml:mi>a</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> to the mesocolumn&#x2019;s output feature vector <inline-formula>
<mml:math id="M21">
<mml:mover accent="true">
<mml:mi>&#x03C6;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula>.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Diagram illustrating cortical columns. Panel A shows vertical structures labeled as macrocolumn and mesocolumn, with Layer 3 and Layer 4 indicated. Arrows represent signal direction from an afferent source. Panel B depicts a mesocolumn as a circle with smaller circles inside, alongside a receptive field plot. Panel C illustrates a macrocolumn consisting of multiple mesocolumns, with a complex receptive field plot. Scale bars indicate measurements in micrometers and pixels.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec5">
<label>2.3</label>
<title>Layer 3 extraction of contextually predictable features</title>
<p>The lateral spread of axonal projections of L4 cells in L3 and the lateral spread of basal dendrites of pyramidal cells in L3 indicate that L4 neurons send their output to L3 neurons not only in their own mesocolumn but also in the 6 surrounding mesocolumns (<xref ref-type="bibr" rid="ref56">Lubke et al., 2003</xref>; <xref ref-type="bibr" rid="ref18">da Costa and Martin, 2010</xref>). Consequently, the &#x201C;classical&#x201D; RFs and feature-tuning properties of L3 neurons in a given mesocolumn are, essentially, the product of weighted summation of output activities of L4 neurons of the same and 6 surrounding mesocolumns (<xref ref-type="fig" rid="fig1">Figure 1</xref>):</p>
<disp-formula id="EQ4">
<label>(4)</label>
<mml:math id="M22">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mn>7</mml:mn>
</mml:munderover>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>4</mml:mn>
<mml:mi mathvariant="italic">mc</mml:mi>
</mml:mrow>
</mml:msub>
</mml:munderover>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="italic">mj</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi mathvariant="italic">mj</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mspace width="0.33em"/>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M23">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mspace width="0.25em"/>
</mml:math>
</inline-formula>is the feature-expressing activity of L3 neuron <italic>i</italic> in the central mesocolumn; <italic>N<sub>L4mc</sub></italic> is the number of L4 cells in a mesocolumn; <inline-formula>
<mml:math id="M24">
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi mathvariant="italic">mj</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mspace width="0.25em"/>
</mml:math>
</inline-formula>is the activity of an L4 neuron <italic>j</italic> in mesocolumn <italic>m</italic>; and <italic>u<sub>i,mj</sub></italic> is the strength of their connection.</p>
<p>In L3, the afferent inputs from L4 target basal dendrites of pyramidal cells, whereas the contextual inputs from surrounding cortical territories target their apical dendrites (<xref ref-type="bibr" rid="ref35">Gilbert and Wiesel, 1983</xref>; <xref ref-type="bibr" rid="ref45">Kisvardy et al., 1986</xref>; <xref ref-type="bibr" rid="ref56">Lubke et al., 2003</xref>; <xref ref-type="bibr" rid="ref65">Petreanu et al., 2009</xref>). Synaptic inputs to basal dendrites are integrated in the soma, leading to spike generation in the initial axon segment. But the apical dendrite, including its terminal tuft extension in layer 1, has its own site of synaptic input integration and is able to generate its own spikes (<xref ref-type="bibr" rid="ref7">Bernander et al., 1994</xref>; <xref ref-type="bibr" rid="ref16">Cauller and Connors, 1994</xref>; <xref ref-type="bibr" rid="ref74">Schiller et al., 1997</xref>; <xref ref-type="bibr" rid="ref82">Stuart and Spruston, 1998</xref>; <xref ref-type="bibr" rid="ref53">Larkum et al., 1999</xref>, <xref ref-type="bibr" rid="ref52">2007</xref>). Output activity of the apical dendrite in the <italic>i<sup>th</sup></italic> L3 cell is, essentially, the product of weighted summation of output activities of L3 neurons of surrounding columns:</p>
<disp-formula id="EQ5">
<label>(5)</label>
<mml:math id="M25">
<mml:msub>
<mml:mi>A</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x221D;</mml:mo>
<mml:munder>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>C</mml:mi>
</mml:mrow>
</mml:munder>
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2022;</mml:mo>
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
</mml:math>
</disp-formula>
<p>where <italic>C</italic> is the set of all the L3 neurons in surrounding columns that contribute contextual input to cell <italic>i</italic>; <inline-formula>
<mml:math id="M26">
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> is the strength of connection to cell <italic>i</italic> from contextual cell <italic>c</italic>; and <inline-formula>
<mml:math id="M27">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is the basal dendrite output of cell <italic>c</italic> (<xref ref-type="disp-formula" rid="EQ4">Equation 4</xref>). With such separate contextual input integration, the apical dendrite can guide basal dendrites in their selection of afferent connectional patterns (and vice versa) so that they will maximize the covariance of the cell&#x2019;s apical and basal outputs <italic>A<sub>i</sub></italic> and <inline-formula>
<mml:math id="M28">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>, as was proposed and successfully demonstrated in a basic model by <xref ref-type="bibr" rid="ref46">Kording and Konig (2000)</xref>.</p>
<p>The number of excitatory cells in L3 is approximately the same as in L4 (<xref ref-type="bibr" rid="ref58">Markram et al., 2015</xref>; <xref ref-type="bibr" rid="ref61">Meyer et al., 2010</xref>), suggesting that the L3 compartment of a mesocolumn contains between 200 and 400 pyramidal neurons. Under mutual competitive pressure to diversify their RF tuning properties, similar to plastic local lateral connections among neighboring L4 cells driving them to select different features, these 200&#x2013;400 neurons in a mesocolumn will compete in their search for contextually predictable features. Together, they will find and tune to all the different contextually predictable features present in their shared afferent input from L4 (<xref ref-type="disp-formula" rid="EQ4">Equation 4</xref>).</p>
<p>In geometric terms, together the 1,400&#x2013;2,800&#x202F;L4 cells in 7 mesocolumns that provide afferent input to the L3 compartment of a central mesocolumn create that mesocolumn&#x2019;s high-dimensional <italic>state space</italic>. Since we are concerned with L3 features that are computed linearly in that state space (<xref ref-type="disp-formula" rid="EQ4">Equation 4</xref>), such features correspond to particular directions in the mesocolumn&#x2019;s L3 state space: for a given L3 neuron <italic>i</italic>, its afferent connectional vector <inline-formula>
<mml:math id="M29">
<mml:msub>
<mml:mover accent="true">
<mml:mi>u</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> determines that neuron&#x2019;s preferred direction in its mesocolumn&#x2019;s L3 state space and thus its preferred feature.</p>
<p>Any arbitrary direction in the L3 state space will express some feature of input patterns taking place in the mesocolumn&#x2019;s RF. However, most such arbitrarily chosen features will not be perceptually significant. Contextually predictable features occupy a lower-dimensional subspace of the L3 state space. The size and contents of this contextually predictable subspace have never been revealed before, even for the primary sensory cortical areas. In the next section (Section 2.4), we derive a computational algorithm for estimating the principal axes (basis vectors) of this subspace, and in Section 3 we apply this algorithm to natural images in an attempt to reveal the contextually predictable subspace of a mesocolumn in the primary visual area, V1. Also in Section 3 we investigate what features (i.e., directions in the mesocolumn&#x2019;s L3 state space) individual L3 cells will choose if they are modeled as comprising two dendritic compartments &#x2013; basal and apical, receiving Hebbian connections from L4 of its own macrocolumn and from L3 of surrounding macrocolumns, respectively &#x2013; and are trained on natural images. We show that such modeled L3 cells do indeed select features in the mesocolumn&#x2019;s contextually predictable subspace.</p>
</sec>
<sec id="sec6">
<label>2.4</label>
<title>Extraction of the contextually predictable feature subspace of a cortical mesocolumn</title>
<p>We begin by formalizing terminology to be used in the rest of this paper:</p>
<list list-type="bullet">
<list-item>
<p>The <italic>state space</italic> of a mesocolumn is created by 1,400&#x2013;2,800&#x202F;L4 cells that provide afferent input to its L3 compartment (<xref ref-type="disp-formula" rid="EQ4">Equation 4</xref>). Stimulus patterns activating that mesocolumn&#x2019;s RF are represented as points in the state space and can be characterized in an infinite number of ways by projecting these points onto any particular vector in the state space. Any such projection vector can be considered a &#x201C;feature,&#x201D; and the entire state space of a mesocolumn is the space of possible features, or the feature space. Thus, we can refer to a mesocolumn&#x2019;s state space as its <italic>feature space</italic> to emphasize its feature content.</p>
</list-item>
<list-item>
<p>We search for contextually predictable features because such features reflect orderly aspects of the environment. To emphasize their orderly nature, we will follow <xref ref-type="bibr" rid="ref41">Hotelling (1936)</xref> and call them <italic>canonical features</italic> (from the Greek word <italic>kanonikotita</italic>, &#x03BA;&#x03B1;&#x03BD;&#x03BF;&#x03BD;&#x03B9;&#x03BA;&#x03CC;&#x03C4;&#x03B7;&#x03C4;&#x03B1;, which means &#x201C;regularity,&#x201D; &#x201C;predictable recurrence&#x201D;). The contextually predictable subspace of a mesocolumn&#x2019;s state space, comprising all the canonical features, then is the <italic>canonical feature subspace</italic>.</p>
</list-item>
<list-item>
<p>Our explicit task is to extract the canonical feature subspace from the mesocolumn&#x2019;s state space by finding all of its principal axes (basis vectors). This set of orthogonal vectors in the state space, spanning the canonical feature subspace, will be called <italic>canonical variates</italic> (<xref ref-type="bibr" rid="ref41">Hotelling, 1936</xref>).</p>
</list-item>
</list>
<p>We formulate our approach based on the following considerations. We define the 1st axis of the canonical feature subspace (i.e., the 1st canonical variate) to be the basis vector with the maximal correlation with the contextual input, the second axis (i.e., the 2nd canonical variate) to be the basis vector with the second largest correlation with the contextual input, and so on until the last axis. In the cortex, different mesocolumns develop their own sets of afferent, lateral, and contextual connections based on their particular histories of sensory experiences. However, since neighboring mesocolumns will end up being exposed to and being shaped by the same regularities in their sensory experiences, any emergent differences among them will not be functionally significant. Thus, in deriving our algorithm, we can make an assumption that all the neighboring mesocolumns involved in contextual guidance will have the same matrices of L3 afferent [<italic>u<sub>i,mj</sub></italic>] and contextual <inline-formula>
<mml:math id="M30">
<mml:mo stretchy="true">[</mml:mo>
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">]</mml:mo>
</mml:math>
</inline-formula> connections (<xref ref-type="disp-formula" rid="EQ4 EQ5">Equations 4, 5</xref>) and also identical sets of canonical variates.</p>
<p>To quantify the correlation of a canonical variate with the contextual input, we use the mean of pairwise correlations of that variate in the central mesocolumn and the same variate in each of the neighboring mesocolumns that contribute the contextual input. If we label the direction of a canonical variate in the L3 state space as <inline-formula>
<mml:math id="M31">
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> (<italic>b</italic> stands for &#x201C;basis&#x201D;), then we define the contextual correlation of this variate as in <xref ref-type="disp-formula" rid="EQ6">Equation 6</xref>:</p>
<disp-formula id="EQ6">
<label>(6)</label>
<mml:math id="M32">
<mml:mi>r</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mfrac>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:munderover>
<mml:mtext>corr</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:msup>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:mo>&#x2022;</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:mo>&#x2022;</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:msub>
<mml:mi mathvariant="italic">aff</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p>where <italic>N<sub>m</sub></italic> is the number of mesocolumns contributing contextual input. <inline-formula>
<mml:math id="M33">
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math id="M34">
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:msub>
<mml:mi mathvariant="italic">aff</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msub>
<mml:mspace width="0.25em"/>
</mml:math>
</inline-formula>are the afferent inputs to the L3 compartment of the central (0<italic><sup>th</sup></italic>) mesocolumn and the <italic>m<sup>th</sup></italic> neighboring mesocolumn, respectively, from their flattened <inline-formula>
<mml:math id="M35">
<mml:mn>7</mml:mn>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>4</mml:mn>
<mml:mi mathvariant="italic">mc</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> dimensional vectors of the outputs of L4 neurons of the same and 6 immediately surrounding mesocolumns:</p>
<disp-formula id="EQ7">
<label>(7)</label>
<mml:math id="M36">
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">aff</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">[</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mn>0</mml:mn>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mn>1</mml:mn>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mn>6</mml:mn>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msubsup>
<mml:mspace width="0.25em"/>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
</mml:math>
</disp-formula>
<p>Our objective function for the <italic>i<sup>th</sup></italic> canonical variate is to find such a direction <inline-formula>
<mml:math id="M37">
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> in the L3 state space that will maximize its contextual correlation <inline-formula>
<mml:math id="M38">
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> (subject to the constraint that <inline-formula>
<mml:math id="M39">
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x22A5;</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> for all <inline-formula>
<mml:math id="M40">
<mml:mi>j</mml:mi>
<mml:mo>&#x003C;</mml:mo>
<mml:mi>i</mml:mi>
</mml:math>
</inline-formula>). Our objective function is designed to maximize the canonical correlation of the <italic>i<sup>th</sup></italic> component, concurrently ensuring orthogonality with all previously computed components. This methodology, which constructs orthogonal vectors sequentially, beginning with the first, systematically generates a series of orthogonal vectors. Each vector maximizes the contextual correlation subject to the orthogonality constraints imposed by its predecessors.</p>
<p>Continuing with our assumption that different mesocolumns in a contextually related cortical territory have the same internal connectivities, we also assume that all <italic>N<sub>m</sub></italic> mesocolumns in our model have the same means and covariance matrices of the afferent inputs to their L3 compartments:</p>
<disp-formula id="EQ8">
<label>(8)</label>
<mml:math id="M41">
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="normal">E</mml:mi>
<mml:mo stretchy="true">[</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">]</mml:mo>
<mml:mspace width="1.66em"/>
<mml:mspace width="0.25em"/>
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mtext>auto</mml:mtext>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="normal">E</mml:mi>
<mml:mo stretchy="true">[</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:mo stretchy="true">]</mml:mo>
</mml:math>
</disp-formula>
<p>Then, we can write our objective function as:</p>
<disp-formula id="EQ9">
<label>(9)</label>
<mml:math id="M42">
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:munder>
<mml:mrow>
<mml:mtext>argmax</mml:mtext>
<mml:mspace width="0.33em"/>
</mml:mrow>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:munder>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msubsup>
<mml:mfrac>
<mml:mrow>
<mml:mi mathvariant="normal">E</mml:mi>
<mml:mo stretchy="true">[</mml:mo>
<mml:msup>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:msub>
<mml:mi mathvariant="italic">aff</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">E</mml:mi>
<mml:mo stretchy="true">[</mml:mo>
<mml:msup>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mtext>auto</mml:mtext>
</mml:msub>
<mml:mspace width="0.33em"/>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:math>
</disp-formula>
<p>Thus, the objective function in Lagrangian formulation is given by:</p>
<disp-formula id="EQ10">
<label>(10)</label>
<mml:math id="M43">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:munder>
<mml:mrow>
<mml:mtext>argmax</mml:mtext>
<mml:mspace width="0.33em"/>
</mml:mrow>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:munder>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msubsup>
<mml:msup>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:mo>&#x00B7;</mml:mo>
<mml:mi mathvariant="normal">E</mml:mi>
<mml:mo stretchy="true">[</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:msub>
<mml:mi mathvariant="italic">aff</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:msub>
<mml:mi mathvariant="italic">aff</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x03BB;</mml:mi>
<mml:mo>&#x00B7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msup>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mtext>auto</mml:mtext>
</mml:msub>
<mml:mspace width="0.33em"/>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
</disp-formula>
<p>The optimization task specified in <xref ref-type="disp-formula" rid="EQ10">Equation 10</xref> is a well-structured generalized eigenproblem and can be efficiently solved using established numerical algorithms (<xref ref-type="bibr" rid="ref41">Hotelling, 1936</xref>; <xref ref-type="bibr" rid="ref38">Hardoon et al., 2004</xref>; <xref ref-type="bibr" rid="ref48">Kursun et al., 2011</xref>; <xref ref-type="bibr" rid="ref36">Golub and Van Loan, 2013</xref>; <xref ref-type="bibr" rid="ref1">Alpaydin, 2014</xref>), in which the eigenvector having the largest eigenvalue gives us the first canonical variate <inline-formula>
<mml:math id="M44">
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:math>
</inline-formula>, the eigenvector having the second largest eigenvalue gives us the second variate <inline-formula>
<mml:math id="M45">
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:math>
</inline-formula>, and so on:</p>
<disp-formula id="EQ11">
<label>(11)</label>
<mml:math id="M46">
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mtext>cross</mml:mtext>
</mml:msub>
<mml:mspace width="0.33em"/>
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mi>&#x03BB;</mml:mi>
<mml:mspace width="0.33em"/>
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mtext>auto</mml:mtext>
</mml:msub>
<mml:mspace width="0.33em"/>
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M47">
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mtext>cross</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula> is the cross-covariance matrix (<xref ref-type="bibr" rid="ref41">Hotelling, 1936</xref>; <xref ref-type="bibr" rid="ref48">Kursun et al., 2011</xref>):</p>
<disp-formula id="EQ12">
<label>(12)</label>
<mml:math id="M48">
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mtext>cross</mml:mtext>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="normal">E</mml:mi>
<mml:mo stretchy="true">[</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:msub>
<mml:mi mathvariant="italic">aff</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:msub>
<mml:mi mathvariant="italic">aff</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:mo stretchy="true">]</mml:mo>
</mml:math>
</disp-formula>
</sec>
</sec>
<sec id="sec7">
<label>3</label>
<title>Model simulations</title>
<p>For model simulations, we sought to emulate the primary visual cortical area (V1) and so applied our L4&#x2013;L3 feature-extracting model to natural images, setting the afferent inputs of the modeled mesocolumns to approximate thalamic inputs to V1 from the lateral geniculate nucleus. The aim of simulations was to develop contextually predictable features that can be expected to be found in a representative V1 mesocolumn. Visual input patterns and the L4 compartments of modeled mesocolumns were reproduced, with a few minor differences, from <xref ref-type="bibr" rid="ref28">Favorov and Kursun (2011)</xref> and that paper should be consulted for their complete descriptions.</p>
<sec id="sec8">
<label>3.1</label>
<title>Methods</title>
<sec id="sec9">
<label>3.1.1</label>
<title>Visual input patterns to the L4 compartment of a mesocolumn</title>
<p>Biologically realistic visual afferent inputs, delivered to L4 via the lateral geniculate nucleus (LGN), were simulated based on the retinal/LGN model of <xref ref-type="bibr" rid="ref80">Somers et al. (1995)</xref>. RFs of LGN neurons were modeled as a difference of the &#x201C;central&#x201D; and the &#x201C;surround&#x201D; two-dimensional Gaussians, with a common space constant <italic>&#x03C3;</italic> for both dimensions:</p>
<disp-formula id="EQ13">
<label>(13)</label>
<mml:math id="M49">
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mi mathvariant="italic">xy</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>/</mml:mo>
<mml:mn>2</mml:mn>
<mml:mi>&#x03C0;</mml:mi>
<mml:msubsup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mtext mathvariant="italic">center</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi>D</mml:mi>
<mml:mi mathvariant="italic">xy</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>/</mml:mo>
<mml:mn>2</mml:mn>
<mml:msubsup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mtext mathvariant="italic">center</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2212;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>/</mml:mo>
<mml:mn>2</mml:mn>
<mml:mi>&#x03C0;</mml:mi>
<mml:msubsup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mtext mathvariant="italic">surr</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi>D</mml:mi>
<mml:mi mathvariant="italic">xy</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>/</mml:mo>
<mml:mn>2</mml:mn>
<mml:msubsup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mtext mathvariant="italic">surr</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:msup>
</mml:math>
</disp-formula>
<p>where <italic>&#x03C3;<sub>center</sub></italic>&#x202F;=&#x202F;0.8833 and <italic>&#x03C3;<sub>surr</sub></italic>&#x202F;=&#x202F;2.6499 (<xref ref-type="fig" rid="fig2">Figure 2A</xref>). <italic>D<sub>xy</sub></italic> is the Euclidean distance between a pixel at the (<italic>x</italic>, <italic>y</italic>) location in the image and the (<italic>x</italic><sub>0</sub>, <italic>y</italic><sub>0</sub>) image location of the RF center. If <italic>D<sub>xy</sub></italic>&#x202F;&#x003E;&#x202F;8, <italic>R<sub>xy</sub></italic>&#x202F;=&#x202F;0 (i.e., the RF diameter is restricted to 16 pixels). Thus, the activity of an ON-center LGN neuron with the RF center at the (<italic>x</italic><sub>0</sub>, <italic>y</italic><sub>0</sub>) location in the image was computed as:</p>
<disp-formula id="EQ14">
<label>(14)</label>
<mml:math id="M50">
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mi mathvariant="italic">ON</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">[</mml:mo>
<mml:mn>0.1</mml:mn>
<mml:mo>+</mml:mo>
<mml:munder>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mi>y</mml:mi>
</mml:munder>
<mml:munder>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mi>x</mml:mi>
</mml:munder>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mi mathvariant="italic">xy</mml:mi>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi mathvariant="italic">xy</mml:mi>
</mml:msub>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
</mml:msup>
</mml:math>
</disp-formula>
<p>where <italic>I<sub>xy</sub></italic> is the grayscale intensity of the pixel at the (<italic>x</italic>, <italic>y</italic>) location in the image (0&#x202F;&#x2264;&#x202F;<italic>I<sub>xy</sub></italic>&#x202F;&#x2264;&#x202F;1). The activity of an OFF-center LGN neuron was computed as:</p>
<disp-formula id="EQ15">
<label>(15)</label>
<mml:math id="M51">
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mi mathvariant="italic">OFF</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">[</mml:mo>
<mml:mn>0.1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:munder>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mi>y</mml:mi>
</mml:munder>
<mml:munder>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mi>x</mml:mi>
</mml:munder>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mi mathvariant="italic">xy</mml:mi>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi mathvariant="italic">xy</mml:mi>
</mml:msub>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
</mml:msup>
</mml:math>
</disp-formula>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>LGN layer model. <bold>(A)</bold> RF profiles of ON-center and OFF-center model LGN cells. <bold>(B)</bold> The map of the RF centers (little white boxes) of the 91 ON-center cells of the LGN layer innervating a single mesocolumn. Note that RF centers are arranged in a hexagonal pattern. RF centers are shown superimposed on a 13&#x202F;&#x00D7;&#x202F;13-pixel field, in which each pixel is shown as a black-edged gray square. RF centers of the 91 OFF-center LGN cells match the RF centers of the ON-center cells. <bold>(C)</bold> Four exemplary 320&#x202F;&#x00D7;&#x202F;320-pixel natural images that were used to activate the LGN layer. Reproduced with permission from <xref ref-type="bibr" rid="ref28">Favorov and Kursun (2011)</xref>.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel A shows graphs of OFF-center and ON-center receptive fields with response peaks and troughs at zero pixels. Panel B displays a grid with a central pattern of white squares representing pixels. Panel C includes four images: vertical tree bark, a spotted animal resting, a leafy tree with sunlight, and a structure with a sloped roof and fence.</alt-text>
</graphic>
</fig>
<p>Each mesocolumn in the model was set to receive its afferent input from 91 LGN neurons with retinotopically arranged ON-center RFs and 91 neurons with retinotopically arranged OFF-center RFs (<xref ref-type="fig" rid="fig2">Figure 2B</xref>). RF centers of ON-center LGN neurons were arranged in a hexagonal pattern, spaced one pixel apart, and RF centers of OFF-center LGN neurons coincided with the RF centers of the ON-center LGN neurons. Together, these 182 LGN neurons created a hexagonally shaped viewing window onto visual images (<xref ref-type="fig" rid="fig2">Figure 2B</xref>).</p>
<p>In this study, the visual inputs to the LGN layer were drawn from a set of 100 grayscale photographs (320&#x202F;&#x00D7;&#x202F;320 pixels) selected from the IAPR TC-12 benchmark dataset (<xref ref-type="bibr" rid="ref37">Grubinger et al., 2006</xref>), containing texture-rich natural images of surfaces, grass, bushes, landscapes, human and animal figures, and the <xref ref-type="bibr" rid="ref9">Brodatz (1966)</xref> dataset of textures (<xref ref-type="fig" rid="fig2">Figure 2C</xref>). Since this is a relatively small set of images, selected for their detail-rich spatial contextual information, an additional much larger and more diverse image dataset was also used to confirm the model findings made on the IAPR TC-12 dataset. This was the widely used <italic>Common Objects in Context</italic> (COCO) dataset of images of complex everyday scenes containing common objects in their natural context (<xref ref-type="bibr" rid="ref54">Lin et al., 2015</xref>). In particular, we used 5,000 images of the 2017 validation set.<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref> The photographs were not preprocessed, except for contrast enhancement using histogram equalization. To generate a particular visual input pattern, the LGN viewing window was placed over a particular location in one of the photographs. The intensities of the pixels within the viewing window were then convolved with the RF profiles of the LGN neurons (<xref ref-type="disp-formula" rid="EQ13 EQ14 EQ15">Equations 13&#x2013;15</xref>). All computational procedures were implemented using <xref ref-type="bibr" rid="ref60">MATLAB (2023)</xref>.</p>
</sec>
<sec id="sec10">
<label>3.1.2</label>
<title>Output of the L4 compartment of a mesocolumn</title>
<p>The L4 compartment of each mesocolumn was modeled as a group of <italic>N<sub>L4mc</sub></italic> neurons of the type described above by <xref ref-type="disp-formula" rid="EQ3">Equation 3</xref>. The temporal behavior of each neuron, modeled as a leaky integrator, is described by the following differential equation:</p>
<disp-formula id="EQ16">
<label>(16)</label>
<mml:math id="M52">
<mml:mi>&#x03C4;</mml:mi>
<mml:mfrac>
<mml:mi>d</mml:mi>
<mml:mi mathvariant="italic">dt</mml:mi>
</mml:mfrac>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x03B8;</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">[</mml:mo>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mn>182</mml:mn>
</mml:munderover>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x03B8;</mml:mi>
<mml:msqrt>
<mml:mrow>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mn>182</mml:mn>
</mml:munderover>
<mml:msubsup>
<mml:mi>a</mml:mi>
<mml:mi>j</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:msqrt>
<mml:mo>+</mml:mo>
<mml:mi>&#x03BB;</mml:mi>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>k</mml:mi>
<mml:mo>&#x2260;</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>4</mml:mn>
<mml:mi mathvariant="italic">mc</mml:mi>
</mml:mrow>
</mml:msub>
</mml:munderover>
<mml:msub>
<mml:mi>z</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
</mml:msup>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M53">
<mml:mi>&#x03C4;</mml:mi>
</mml:math>
</inline-formula> is a time constant; <inline-formula>
<mml:math id="M54">
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math id="M55">
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> are the output activities of L4 neurons <italic>i</italic> and <italic>k</italic> in the computed mesocolumn, respectively; <italic>a<sub>j</sub></italic> is the activity of the <italic>j</italic><sup>th</sup> among the 182 LGN neurons innervating the computed mesocolumn; <italic>w<sub>i,j</sub></italic> is the strength of the afferent connection from LGN neuron <italic>j</italic> to L4 neuron <italic>i</italic>; <italic>z<sub>i,k</sub></italic> is the strength of the connection to L4 neuron <italic>i</italic> from L4 neuron <italic>k</italic> residing in the same mesocolumn; <italic>&#x03B8;</italic> and <inline-formula>
<mml:math id="M56">
<mml:mi>&#x03BB;</mml:mi>
</mml:math>
</inline-formula> are feed-forward and lateral connection scaling constants, respectively. This differential equation was solved numerically using Euler updates with a step size <inline-formula>
<mml:math id="M57">
<mml:mi>&#x0394;</mml:mi>
</mml:math>
</inline-formula><italic>t</italic>&#x202F;=&#x202F;1&#x202F;ms. Explicitly, the Euler update for an equation <inline-formula>
<mml:math id="M58">
<mml:mi>&#x03C4;</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>d</mml:mi>
<mml:mo>/</mml:mo>
<mml:mi mathvariant="italic">dt</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>g</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> is <inline-formula>
<mml:math id="M59">
<mml:mi>x</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi mathvariant="italic">&#x0394;t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2248;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="italic">&#x0394;t</mml:mi>
<mml:mo>/</mml:mo>
<mml:mi>&#x03C4;</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="italic">&#x0394;t</mml:mi>
<mml:mo>/</mml:mo>
<mml:mi>&#x03C4;</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:mi>g</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>. Time constant <inline-formula>
<mml:math id="M60">
<mml:mi>&#x03C4;</mml:mi>
</mml:math>
</inline-formula> was set to 4&#x202F;ms, <italic>&#x03B8;</italic>&#x202F;=&#x202F;0.65 and <inline-formula>
<mml:math id="M61">
<mml:mi>&#x03BB;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>3</mml:mn>
</mml:math>
</inline-formula>. The response of the L4 network to a given afferent input pattern was computed in 20 time steps.</p>
</sec>
<sec id="sec11">
<label>3.1.3</label>
<title>Hebbian development of afferent and lateral connections in the L4 compartment of a mesocolumn</title>
<p>The complete set of instructions and explanations offered in <xref ref-type="bibr" rid="ref28">Favorov and Kursun (2011)</xref> should be followed in growing L4 connections. Partially repeated here, those connections were driven to their final state by modifying them iteratively over 20 update steps. At each step, the L4 compartment of a mesocolumn was stimulated with 1,000 visual input patterns, which were produced by placing the LGN viewing window in random locations in any of the 100 database images. Output activities of the 182 LGN cells and <italic>N<sub>L4mc</sub></italic> L4 cells in response to these 1,000 visual patterns were used to compute correlation coefficients between all pairs of LGN&#x2013;L4 and L4&#x2013;L4 neurons, and those correlations were used to update the afferent and lateral connections.</p>
<p>At update step <italic>s</italic>, the strength of the afferent connection from LGN cell <italic>k</italic> to L4 cell <italic>i</italic> was updated based positively on correlation <inline-formula>
<mml:math id="M62">
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> of their outputs during step <italic>s</italic>, as given in <xref ref-type="disp-formula" rid="EQ17">Equations 17</xref>, <xref ref-type="disp-formula" rid="EQ18">18</xref>:</p>
<disp-formula id="EQ17">
<label>(17)</label>
<mml:math id="M63">
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">[</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
</mml:msup>
<mml:mo>/</mml:mo>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mn>182</mml:mn>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">[</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">ij</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
</mml:msup>
</mml:mrow>
</mml:msqrt>
</mml:math>
</disp-formula>
<p>where:</p>
<disp-formula id="EQ18">
<label>(18)</label>
<mml:math id="M64">
<mml:msub>
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mi mathvariant="italic">aff</mml:mi>
</mml:msub>
<mml:mspace width="0.33em"/>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mi mathvariant="italic">aff</mml:mi>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p>The weight of the lateral connection between L4 cells <italic>i</italic> and <italic>k</italic> was updated based negatively (according to <xref ref-type="bibr" rid="ref24">Egger et al., 1999</xref>; <xref ref-type="bibr" rid="ref73">S&#x00E1;ez and Friedlander, 2009</xref>) on correlation <inline-formula>
<mml:math id="M65">
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> of their outputs during step <italic>s</italic>, as in <xref ref-type="disp-formula" rid="EQ19">Equation 19</xref>:</p>
<disp-formula id="EQ19">
<label>(19)</label>
<mml:math id="M66">
<mml:msub>
<mml:mi>z</mml:mi>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mi mathvariant="italic">lat</mml:mi>
</mml:msub>
<mml:mspace width="0.33em"/>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>z</mml:mi>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mi mathvariant="italic">lat</mml:mi>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mi mathvariant="italic">ik</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p>Adjustment rate constants <inline-formula>
<mml:math id="M67">
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mi mathvariant="italic">aff</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>&#x202F;=&#x202F;0.01 and <inline-formula>
<mml:math id="M68">
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mi mathvariant="italic">lat</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>&#x202F;=&#x202F;0.1 produced the fastest convergence of connection strengths to stable values.</p>
</sec>
<sec id="sec12">
<label>3.1.4</label>
<title>Afferent and contextual inputs to the L3 compartment of a mesocolumn</title>
<p>The L3 compartment of a mesocolumn in the model was set to receive afferent input from its own L4 compartment as well as from L4 compartments of six immediately adjacent mesocolumns (<xref ref-type="disp-formula" rid="EQ4">Equation 4</xref>). The LGN viewing windows of these six surrounding mesocolumns are shifted by 3 pixels relative to the LGN window of the central mesocolumn in six evenly spaced directions (<xref ref-type="fig" rid="fig1">Figure 1C</xref>). Consequently, the viewing window of the L3 compartment of a mesocolumn (which we consider to be its classic RF) is increased to 21 pixels.</p>
<p>In the real cortex, L4 compartments of different mesocolumns develop their own sets of LGN and lateral connections based on their visual experiences. However, since visual experiences of 7 neighboring mesocolumns are essentially the same, any emergent connectional differences among them will not be functionally significant. This allows us to greatly reduce the computational effort in developing the model&#x2019;s L4 connectivity by developing LGN and lateral connections of just one mesocolumn and then using these patterns of connections (i.e., the [<italic>w<sub>ij</sub></italic>] and [<italic>z<sub>ik</sub></italic>] matrices in <xref ref-type="disp-formula" rid="EQ16">Equation 16</xref>) in all the mesocolumns making up the model.</p>
<p>Our definition of the mesocolumn in Section 2.2 as a local group of 7 minicolumns, L4 cells of which together perform pluripotent function linearization transform of their shared afferent input, leads us to treat mesocolumns in this modeling effort as discrete entities packed in the cortex as a honeycomb-like mosaic. We also treat macrocolumns as discrete entities comprising 7 mesocolumns (<xref ref-type="fig" rid="fig3">Figure 3</xref>). However, this might be an oversimplification. While discrete macrocolumns do exist &#x2013; at least in the somatosensory cortex (<xref ref-type="bibr" rid="ref25">Favorov and Diamond, 1990</xref>; <xref ref-type="bibr" rid="ref31">Favorov et al., 2015</xref>) &#x2013; experimental evidence of discrete mesocolumnar structures in L4 is lacking. It is possible that discrete mesocolumns, while appealing in their conceptual simplicity, are not necessary, and L4 function linearization transform can be successfully performed by a field of partially overlapping mesocolumns (making a mesocolumn a functional, rather than structural, entity). We will leave exploration of this possibility for future studies.</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Afferent and contextual inputs to the model mesocolumn&#x2019;s L3 compartment. <bold>(A)</bold> The central macrocolumn (blue shaded) surrounded by two concentric rings of 6 and 12 macrocolumns (gray shaded) carrying contextual information. In the cortex, these rings would be &#x223C;0.5 and &#x223C;1.0&#x202F;mm away from the central macrocolumn. In the model simulations, image-response activities were computed for L4 cells in all 7 mesocolumns in each of the 19 macrocolumns but, to reduce the amount of computation, responses of L3 canonical variates were computed only for the central mesocolumn in each macrocolumn. They were used as the contextual input to the L3 cells in the central macrocolumn&#x2019;s central mesocolumn (red shaded). <bold>(B)</bold> RF outlines of the central and 12 outermost surrounding macrocolumns, showing very limited overlap. RFs of the inner and outer rings are shifted by 9 and 18 pixels, respectively, relative to the RF of the central macrocolumn.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Two diagrams labeled A and B. Diagram A depicts a circular pattern representing a cortical field with nested circles of dots, some highlighted in blue and red at the center. Diagram B shows overlapping circles illustrating a visual field with axes labeled in pixels ranging from -30 to 30.</alt-text>
</graphic>
</fig>
<p>Thus, for model simulations, the afferent input to the L3 compartment of the central mesocolumn is a flattened <inline-formula>
<mml:math id="M69">
<mml:mn>7</mml:mn>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>4</mml:mn>
<mml:mi mathvariant="italic">mc</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> dimensional vector of the outputs of L4 neurons of the same and 6 surrounding mesocolumns (<xref ref-type="disp-formula" rid="EQ7">Equation 7</xref>). The contextual input to the L3 compartment of the central mesocolumn in the model was set to come from L3 compartments of two concentric rings of distant mesocolumns: the inner ring of 6 mesocolumns and the outer ring of 12 mesocolumns (<xref ref-type="fig" rid="fig3">Figure 3A</xref>). RFs of the outer ring mesocolumns are shifted by 18 pixels relative to the RF of the central/recipient mesocolumn (<xref ref-type="fig" rid="fig3">Figure 3B</xref>). RFs of the inner ring mesocolumns are shifted by half of this distance; i.e., by 9 pixels.</p>
</sec>
<sec id="sec13">
<label>3.1.5</label>
<title>Algorithmic extraction of canonical variates</title>
<p>Canonical variates are the principal axes of the canonical feature subspace. To find their directions <inline-formula>
<mml:math id="M70">
<mml:mo stretchy="true">(</mml:mo>
<mml:mspace width="0.25em"/>
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> in the L3 state space (<xref ref-type="disp-formula" rid="EQ9 EQ10 EQ11">Equations 9&#x2013;11</xref>), the modeled field of L3 compartments of 19 mesocolumns, each receiving afferent input from L4 compartments of its own and 6 surrounding mesocolumns (<xref ref-type="fig" rid="fig3">Figure 3</xref>), was stimulated with 5,000 visual input patterns, which were obtained by placing the LGN viewing window in random locations in any of the 100 database images. For each visual pattern, the afferent input to the L3 compartment of each of the 19 mesocolumns in the field <inline-formula>
<mml:math id="M71">
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:msub>
<mml:mi mathvariant="italic">aff</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> was written as a flattened vector of output activities of cells in L4 compartments of its own and its 6 surrounding mesocolumns (<xref ref-type="disp-formula" rid="EQ7">Equation 7</xref>). <inline-formula>
<mml:math id="M72">
<mml:msub>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> vectors of the first 20 canonical variates were extracted from the 5,000 sets of afferent input vectors of the central and 18 surrounding mesocolumns <inline-formula>
<mml:math id="M73">
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2026;</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>18</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> according to <xref ref-type="disp-formula" rid="EQ8 EQ11 EQ12">Equations 8, 11, 12</xref>. Using <inline-formula>
<mml:math id="M74">
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> vectors, magnitudes of canonical variates of L3 afferent input patterns can be computed as:</p>
<disp-formula id="EQ20">
<label>(20)</label>
<mml:math id="M75">
<mml:msub>
<mml:mi>&#x03A6;</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>b</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
<mml:mi>T</mml:mi>
</mml:msubsup>
<mml:mo>&#x00B7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:msub>
<mml:mi mathvariant="italic">aff</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03BC;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M76">
<mml:msub>
<mml:mi>&#x03A6;</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> is the projection of the L3 afferent input vector of the <italic>m<sup>th</sup></italic> mesocolumn onto the <italic>i<sup>th</sup></italic> canonical variate.</p>
</sec>
<sec id="sec14">
<label>3.1.6</label>
<title>Hebbian tuning of L3 cells to canonical features</title>
<p>The central thesis of this paper is that pyramidal neurons in L3 should tune to contextually predictable, <italic>canonical</italic>, features, and they accomplish it by adjusting the weights of L4 connections to their basal dendrites under guidance from their apical dendrites, which receive contextual inputs from the surrounding cortical territory (Section 2.3). To explore what features might be thus selected by L3 cells in a V1 mesocolumn, we gave the L3 compartment of the central mesocolumn the same number of cells as in its L4 compartment (i.e., <italic>N<sub>L3mc</sub></italic>&#x202F;=&#x202F;<italic>N<sub>L4mc</sub></italic>) and trained their L4 input connections using an approach adapted from <xref ref-type="bibr" rid="ref46">Kording and Konig (2000)</xref>. For contextual guidance, we used canonical variates in the surrounding 18 mesocolumns (black shaded mesocolumns in <xref ref-type="fig" rid="fig3">Figure 3A</xref>).</p>
<p>Thus, the LGN viewing window was placed in 5,000 random locations in the 100 database images, and for each image location we computed afferent input vectors to L3 compartments of the central and 18 surrounding mesocolumns <inline-formula>
<mml:math id="M77">
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2026;</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi mathvariant="italic">af</mml:mi>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>18</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> as well as the responses of canonical variates <inline-formula>
<mml:math id="M78">
<mml:msub>
<mml:mi>&#x03A6;</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> to these input vectors (<xref ref-type="disp-formula" rid="EQ20">Equation 20</xref>). These responses were autoscaled to zero mean and unit variance.</p>
<p>The feature-expressing basal outputs of L3 cells in the central mesocolumn in response to images were computed according to <xref ref-type="disp-formula" rid="EQ4">Equation 4</xref> while the contextual inputs to the apical dendrites of the same L3 cells were computed as:</p>
<disp-formula id="EQ21">
<label>(21)</label>
<mml:math id="M79">
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mn>18</mml:mn>
</mml:munderover>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mn>20</mml:mn>
</mml:munderover>
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>m</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>&#x03A6;</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</disp-formula>
<p>where <italic>I<sub>i</sub></italic> is the net contextual input to the apical dendrite of the <italic>i<sup>th</sup></italic> L3 cell, <inline-formula>
<mml:math id="M80">
<mml:msub>
<mml:mi>&#x03A6;</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> is the response of the <italic>j<sup>th</sup></italic> canonical variate in the <italic>m<sup>th</sup></italic> surrounding mesocolumn, and <inline-formula>
<mml:math id="M81">
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>m</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> is the strength of their connection. Both basal outputs of L3 cells and net inputs to their apical dendrites were autoscaled to zero mean and unit variance.</p>
<p>The L3 network has to have a mechanism for diversifying feature tuning properties of cells residing in the same mesocolumn. The presence of such a mechanism is indicated by the fact that in the real cortex, while neighboring neurons do share some of their RF and feature tuning properties in common, when all of these properties are considered <italic>in toto</italic>, neighboring neurons are very distinct and are highly decorrelated in their responses to the full repertoire of natural stimuli (<xref ref-type="bibr" rid="ref26">Favorov and Kelly, 1996a</xref>,<xref ref-type="bibr" rid="ref27">b</xref>; <xref ref-type="bibr" rid="ref90">Vinje and Gallant, 2000</xref>). The nature of this diversifying mechanism has not been established yet, but it must involve individual L3 cells in a mesocolumn influencing (likely &#x201C;pushing&#x201D; via lateral inhibition subserved by double-bouquet (<xref ref-type="bibr" rid="ref21">DeFelipe et al., 2006</xref>) and/or Martinotti cells (<xref ref-type="bibr" rid="ref77">Silberberg and Markram, 2007</xref>)) each other to select features different from their own. In the absence of an established mechanism, we chose to achieve its effect by using the same diversifying mechanism we (<xref ref-type="bibr" rid="ref28">Favorov and Kursun, 2011</xref>) proposed to operate in L4.</p>
<p>Thus, to promote tuning of L3 cells in the mesocolumn to different canonical features, the contextual inputs to their apical dendrites were modified by the basal outputs of all the other L3 cells in the mesocolumn, as well as by the output of the mesocolumn&#x2019;s L3 feed-forward inhibitory cell. That is, the output of the apical dendrite of the <italic>i<sup>th</sup></italic> L3 cell in the mesocolumn was computed as in <xref ref-type="disp-formula" rid="EQ22">Equation 22</xref>:</p>
<disp-formula id="EQ22">
<label>(22)</label>
<mml:math id="M82">
<mml:msub>
<mml:mi>A</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:msub>
<mml:mi mathvariant="italic">FF</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mi mathvariant="italic">FF</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03BB;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>k</mml:mi>
<mml:mo>&#x2260;</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
<mml:mi mathvariant="italic">mc</mml:mi>
</mml:mrow>
</mml:msub>
</mml:munderover>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:msub>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M83">
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math id="M84">
<mml:msub>
<mml:mi>&#x03BB;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> are feed-forward and lateral scaling constants; <inline-formula>
<mml:math id="M85">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is the basal output of the <italic>k<sup>th</sup></italic> L3 cell and <inline-formula>
<mml:math id="M86">
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:msub>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> is the correlation between <inline-formula>
<mml:math id="M87">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math id="M88">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> over the training set of images; <italic>F<sub>FF</sub></italic> is the output of the L3 feed-forward cell and <inline-formula>
<mml:math id="M89">
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:msub>
<mml:mi mathvariant="italic">FF</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:msub>
</mml:math>
</inline-formula> is the correlation between <inline-formula>
<mml:math id="M90">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> and <italic>F<sub>FF</sub></italic>. <italic>F<sub>FF</sub></italic> was computed as the sum of outputs of all L4 cells in the central macrocolumn. It was autoscaled to zero mean and unit variance over the training set of images. The values of <inline-formula>
<mml:math id="M91">
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math id="M92">
<mml:msub>
<mml:mi>&#x03BB;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> scaling constants were tested systematically for their feature diversification effect on L3 cells by measuring cross-correlations between basal outputs of different L3 cells in the mesocolumn. Gradually increasing the values of these constants leads to a gradual reduction of cross-correlations, from very high values to eventually very low ones, which indicates that different L3 cells have tuned to different features. Based on this empirical search, the optimal settings of <inline-formula>
<mml:math id="M93">
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>0.01</mml:mn>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math id="M94">
<mml:msub>
<mml:mi>&#x03BB;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>0.03</mml:mn>
</mml:math>
</inline-formula> were chosen, because under them L3 cells tune to the most diverse set of canonical features.</p>
<p>Hebbian connections of the basal and apical dendrites of L3 cells were developed gradually by modifying them iteratively over 1,000 update steps. At each update step, the modeled field of 19 macrocolumns was stimulated with 5,000 visual input patterns, which were obtained by placing the LGN viewing window in random locations in any of the 100 database images. Output activities of L4 and L3 cells and canonical variates in response to these 5,000 visual patterns were used to compute correlation coefficients of L3 cells with L4 cells and with canonical variates, and those correlations were used to update the afferent and contextual L3 connections.</p>
<p>At update step <italic>s</italic>, the strength of the afferent connection from the <italic>j<sup>th</sup></italic> L4 cell to the basal dendrite of the <italic>i<sup>th</sup></italic> L3 cell was updated based on correlation of the L4 cell with the apical output, <inline-formula>
<mml:math id="M95">
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mtext mathvariant="italic">corr</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:msub>
<mml:mn>4</mml:mn>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>A</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>, during 5,000 step <italic>s</italic> trials, as given in <xref ref-type="disp-formula" rid="EQ23">Equations 23</xref>, <xref ref-type="disp-formula" rid="EQ24">24</xref>:</p>
<disp-formula id="EQ23">
<label>(23)</label>
<mml:math id="M96">
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>u</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>/</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>7</mml:mn>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>4</mml:mn>
<mml:mi mathvariant="italic">mc</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>u</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
</mml:msqrt>
</mml:math>
</disp-formula>
<p>where:</p>
<disp-formula id="EQ24">
<label>(24)</label>
<mml:math id="M97">
<mml:msub>
<mml:mover accent="true">
<mml:mi>u</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:mo>sgn</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo>&#x2223;</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2223;</mml:mo>
</mml:mrow>
<mml:mn>0.5</mml:mn>
</mml:msup>
</mml:math>
</disp-formula>
<p>The strength of the contextual connection from the <italic>j<sup>th</sup></italic> canonical variate to the apical dendrite of the <italic>i<sup>th</sup></italic> L3 cell was updated based on correlation of the variate with the basal output, <inline-formula>
<mml:math id="M98">
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mtext mathvariant="italic">corr</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>&#x03A6;</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>, during 5,000 step <italic>s</italic> trials, as given in <xref ref-type="disp-formula" rid="EQ25">Equations 25</xref>, <xref ref-type="disp-formula" rid="EQ26">26</xref>:</p>
<disp-formula id="EQ25">
<label>(25)</label>
<mml:math id="M99">
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>v</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>/</mml:mo>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mn>360</mml:mn>
</mml:munderover>
<mml:mo>&#x2223;</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>v</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2223;</mml:mo>
</mml:math>
</disp-formula>
<p>where:</p>
<disp-formula id="EQ26">
<label>(26)</label>
<mml:math id="M100">
<mml:msub>
<mml:mover accent="true">
<mml:mi>v</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x00B7;</mml:mo>
<mml:mo>sgn</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x00B7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo>&#x2223;</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2223;</mml:mo>
</mml:mrow>
<mml:mn>0.5</mml:mn>
</mml:msup>
</mml:math>
</disp-formula>
<p>Adjustment rate constant <italic>&#x03B7;<sub>L3</sub></italic>&#x202F;=&#x202F;0.01 produced the fastest convergence of connection strengths to stable values.</p>
</sec>
<sec id="sec15">
<label>3.1.7</label>
<title>No-context L3 model</title>
<p>As an alternative to our contextually guided model of L3 feature tuning, we also tested a no-context model, in which the apical dendrite of each L3 cell was given exactly the same afferent input as its basal dendrite; i.e., instead of using <xref ref-type="disp-formula" rid="EQ21">Equation 21</xref> to compute <italic>I<sub>i</sub></italic>, we used <inline-formula>
<mml:math id="M101">
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>.</mml:mo>
</mml:math>
</inline-formula> That is, instead of receiving contextual input from surrounding columns, apical dendrites received their input from L4 cells of their own macrocolumn. Features developed by L3 cells in this essentially generic self-organizing neural network offer us a benchmark against which to judge the benefits of using contextual guidance in feature selection.</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="sec16">
<label>4</label>
<title>Results</title>
<sec id="sec17">
<label>4.1</label>
<title>Layer 3 canonical variates</title>
<p>According to our proposed division of tasks between L4 and L3 &#x2013; with the L4 mesocolumnar network linearizing feature-extracting functions that will be computed by L3 cells &#x2013; the first step in estimating L3 canonical variates is to develop RF and functional properties of cells in the L4 compartment of mesocolumns. This is done by repeatedly exposing L4 cells to images and adjusting the weights of their Hebbian input and intrinsic connections, gradually driving them into stable connectional patterns. The emergent functional RF properties of the model L4 cells, which come to closely resemble those of simple cells in cat V1, are comprehensively described in <xref ref-type="bibr" rid="ref28">Favorov and Kursun (2011)</xref>, and for brevity we omit their description here.</p>
<p>On their own, the trained L4 cells have very low pairwise contextual correlations with L4 cells in surrounding macrocolumns. This is shown in <xref ref-type="fig" rid="fig4">Figure 4A</xref> by plotting the distribution of maximal correlations of coincident activities of individual L4 cells in the central macrocolumn and L4 cells in the first and second rings of surrounding macrocolumns. However, our expectation is that optimally chosen weighted sums of multiple L4 cells will have much higher contextual correlations with surrounding macrocolumns. In Section 2.4 we introduced a particular algorithm for finding such optimal weighted sums, giving us the axes of the canonical feature subspace, i.e., canonical variates. We apply this algorithm to the outputs of L4 cells in the modeled field of 19 macrocolumns to obtain canonical variates. We test the strength of their contextual correlations by introducing a third ring of 12 mesocolumns, chosen to be at such a distance from the central mesocolumn that any mutual information they might have in their RFs will have to come from the environmental sources rather than from sharing any pixels in common. To compute their contextual correlations, we used responses <italic>&#x03A6;</italic> (<xref ref-type="disp-formula" rid="EQ20">Equation 20</xref>) of the canonical variates in the central and these 12 distant surrounding mesocolumns to 1,000 image patches taken at random in the 100 dataset images. For each canonical variate, its contextual correlation is expressed by the Pearson correlation coefficient computed between the 1,000 responses of that variate in the central mesocolumn and the 1,000 averages of responses of that variate in the 12 distant mesocolumns. The magnitudes of the computed contextual correlations are plotted in <xref ref-type="fig" rid="fig4">Figure 4B</xref> (white bars) for the first 20 canonical variates. 
The first 7 variates have particularly high correlations (<italic>r</italic><sup>2</sup>&#x202F;&#x2265;&#x202F;0.1). Correlations of the 8th to 15th variates, although low, are nevertheless statistically significant (at &#x03B1;&#x202F;=&#x202F;0.05 with Bonferroni correction), suggesting that even these canonical variates might reflect some causally significant factors in the environment.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Contextual correlations between the central and surrounding macrocolumns. <bold>(A)</bold> Contextual correlations among cells in the input layer, L4. Plotted is the histogram of the highest correlation of stimulus-evoked responses that each L4 cell in the central macrocolumn had with L4 cells in the 2 rings of surrounding macrocolumns, revealing that at the level of L4, individual cells in neighboring macrocolumns were essentially uncorrelated. Each mesocolumn had 150 L4 cells. <bold>(B)</bold> Contextual correlations between the first 20 canonical variates of the central mesocolumn and the surrounding mesocolumns with nonoverlapping RFs. For each canonical variate, correlation was computed between its value in the central mesocolumn and the mean of its values in the surrounding mesocolumns. Training of L4 cells and extraction of canonical variates to find their contextual correlations was repeated 10 times, using different randomly chosen sets of training image patches taken from the 100 images of the IARP TC-12 and Brodatz datasets. Shown in the plot are squared correlation averages and their SEM (white bars), indicating that macrocolumnar RFs possess up to 15 canonical variates with contextually significant information. Also shown in the plot are squared correlation averages and their SEM of canonical variates extracted from LGN afferent inputs to macrocolumns (black bars), indicating that only the first LGN-based variate has significant contextual information. <bold>(C)</bold> Contextual correlations between the first 40 canonical variates extracted from the 5,000 images of the COCO dataset (black bars). Shown in the plot are squared correlation averages and their SEM (<italic>n</italic>&#x202F;=&#x202F;10). For comparison, also plotted superimposed are the first 40 canonical variates extracted from the 100 images of the IARP &#x0026; Brodatz datasets (white bars), revealing close similarity between them. 
<bold>(D)</bold> Canonical Correlation Analysis (CCA) of overlap between canonical feature subspaces extracted by the first 15 canonical variates in the IARP &#x0026; Brodatz vs. COCO datasets (details in the main text). Plotted are squared canonical correlations of the 15 CCA variates, averaged over 10 repetitions of the CCA.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Four bar charts labeled A, B, C, and D display different correlation coefficients. Chart A shows the distribution of maximal correlation coefficients squared, with most values under 0.2 and the highest percentage around 40%. Chart B and C illustrate the average correlation coefficient squared across canonical variates, with values decreasing as variates increase, peaking near the first few variates. Chart D shows average canonical correlation squared for CCA variates, starting high near 1 and decreasing steadily, with variate number 1 being the highest.</alt-text>
</graphic>
</fig>
<p>To demonstrate the necessity of the L4 function-linearization operation for maximizing contextual correlations, we also developed canonical variates directly from the LGN afferent inputs to the L4 compartments of the central and 6 surrounding mesocolumns (together constituting a macrocolumn) rather than using L4 outputs of these 7 mesocolumns. Unlike the L4-based variates, all but the first of the LGN-based variates showed no statistically significant contextual correlations (black bars in <xref ref-type="fig" rid="fig4">Figure 4B</xref>).</p>
<p>To test the generalizable nature of the canonical variates extracted from the 100 IARP TC-12 images, canonical variates were also extracted from the 5,000 COCO images. The magnitudes of their contextual correlations, shown for the first 40 variates, are plotted as black bars in <xref ref-type="fig" rid="fig4">Figure 4C</xref>, superimposed on the first 40 canonical variates extracted from IARP images (plotted as white bars). As <xref ref-type="fig" rid="fig4">Figure 4C</xref> shows, although they come from different sources, magnitudes of the two sets of canonical variates are very similar, with the first 15 variates having statistically significant contextual correlations. But how similar are the features extracted from the two image sources? As basis vectors, the first 15 contextually predictable canonical variates enclose the canonical feature subspace of the mesocolumn&#x2019;s entire feature space (as defined in Section 2.4). To determine how much the IARP and COCO canonical feature subspaces overlap, we performed Canonical Correlation Analysis (CCA; <xref ref-type="bibr" rid="ref41">Hotelling, 1936</xref>), in which we treated the first 15 IARP and first 15 COCO canonical variates as 2 sets of input variables and used 5,000 training image patches, taken at random from the COCO dataset, to compute their loadings. Next, we used these loadings to compute 15 canonical correlations of the two sets of variables over a different set of randomly picked 1,000 COCO image patches. If the two feature subspaces, enclosed by the 15 IARP and 15 COCO canonical variates, match closely, the 15 canonical correlations would all be close to 1. On the other hand, if the two subspaces do not overlap at all, the 15 canonical correlations would all be close to zero. 
The actual computed correlations are plotted in <xref ref-type="fig" rid="fig4">Figure 4D</xref>, revealing that the first 6 CCA variates had very high correlations, whereas the last 5 CCA variates had very low correlations. Thus, we can conclude that canonical feature subspaces extracted from the IARP and COCO datasets mostly overlap, albeit not completely.</p>
<p>Going back to <xref ref-type="fig" rid="fig4">Figure 4B</xref>, as it shows, only the first canonical variate does not depend on L4 function-linearization preprocessing. The reason is that it reflects the overall magnitude of activity evoked in the macrocolumn&#x2019;s L4 compartment (<xref ref-type="fig" rid="fig5">Figure 5A</xref>) and thus the overall stimulation intensity of the macrocolumn&#x2019;s RF. Since the other canonical variates depend on L4 function-linearization preprocessing, they must be tuned to various structural features of the image patterns occurring in the mesocolumn&#x2019;s RF. What these features are, either in our model canonical variates or in real L3 neurons, is not obvious but some insight is traditionally gained in V1 studies by characterizing responses of V1 neurons to moving grating images of various orientations and spatial frequencies. <xref ref-type="fig" rid="fig5">Figure 5B</xref> shows orientation and positional tuning of the statistically significant first 15 canonical variates, revealing that variates 8 through 11 are sensitive to both orientation and position while others are sensitive to grating orientation but not its position in the RF (translational invariance), thus falling into the categories of the <italic>simple</italic> and <italic>complex</italic> cells, respectively (<xref ref-type="bibr" rid="ref42">Hubel and Wiesel, 1962</xref>). With real V1 neurons exhibiting diversity in the degrees of their orientation and grating phase tuning, the standard metric used to place any given V1 cell on the simple vs. complex cell spectrum is the F1/F0 ratio, which is the ratio of the 1st and 0th Fourier harmonics of a neuron&#x2019;s activity during stimulation of its RF with an optimal sinewave moving grating (<xref ref-type="bibr" rid="ref79">Skottun et al., 1991</xref>; <xref ref-type="bibr" rid="ref68">Ringach et al., 2002</xref>). 
V1 cells with F1/F0&#x202F;&#x003E;&#x202F;1 are classified as simple and cells with F1/F0&#x202F;&#x003C;&#x202F;1 are classified as complex. <xref ref-type="fig" rid="fig5">Figure 5C</xref> shows F1/F0 scores of the statistically significant canonical variates 2&#x2013;15, showing that 70 and 30% of variates fall into the complex cell and simple cell categories, respectively.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Feature tuning of canonical variates. <bold>(A)</bold> Tuning of the 1st canonical variate to the overall intensity of RF stimulation. The variate&#x2019;s response magnitude is plotted as a function of the average of the stimulus-evoked activities of all the L4 cells in the macrocolumn, showing linear dependency. <bold>(B)</bold> Tuning of the first 15 canonical variates to the orientation and spatial phase of sinewave grating images. <bold>(C)</bold> F1/F0 scores of canonical variates 2&#x2013;15, showing clear separation of these variates into the simple and complex cell classes.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g005.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel A shows a scatter plot of the first variate response against the mean response of FL4 cells, indicating a positive correlation. Panel B consists of histograms for 15 canonical variates, showing response patterns across grating orientations and cycle phases in degrees. Panel C displays a bar chart of F1/F0 ratios for canonical variates, distinguishing between simple and complex types.</alt-text>
</graphic>
</fig>
<p>In principle, function-linearization capabilities of mesocolumns&#x2019; L4 compartment depend on the number of cells they employ (<xref ref-type="bibr" rid="ref28">Favorov and Kursun, 2011</xref>): the larger the number of L4 cells in a mesocolumn, the broader the repertoire of nonlinear functions it can linearize. This is shown in <xref ref-type="fig" rid="fig6">Figure 6</xref>, in which the total contextual correlation of the first 20 canonical variates, computed as the sum of squared contextual correlations of individual variates (<xref ref-type="bibr" rid="ref91">Watanabe, 1960</xref>), is plotted as a function of the number of cells in each mesocolumn&#x2019;s L4 compartment. Significantly, there is little further gain in total correlation after the number of L4 cells in mesocolumns is increased beyond 150&#x2013;200, which suggests that they linearize all the contextually predictable features available for extraction in the mesocolumn&#x2019;s RF.</p>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption>
<p>The dependence of the amount of contextually predictable information extracted by canonical variates on the number of L4 cells in the mesocolumn (<italic>N<sub>L4mc</sub></italic>). The amount of contextual information extracted by the first 20 canonical variates was estimated by their total contextual correlation, which was computed as the sum of squared (with sign preserved) correlations of the 20 variates in the central mesocolumn and their averages among the 12 surrounding mesocolumns with abutting RFs. Total correlation was computed 10 times, each time using different randomly chosen sets of image patches to train a particular number of L4 cells per mesocolumn and to extract canonical variates. Plotted are the means and standard deviations of the total correlation estimated for the number of L4 cells per mesocolumn ranging from 1 to 240. The plot suggests that having around 150 L4 cells per mesocolumn might be enough to extract most of the contextually predictable information in mesocolumns&#x2019; RFs.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g006.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Graph depicting the relationship between the number of L4 cells per mesocolumn and total contextual correlation. The x-axis shows L4 cells ranging from 0 to 250, and the y-axis shows correlation from 0 to 6. The plotted data points, with error bars, show a positive, nonlinear increase in correlation as the number of cells increases.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec18">
<label>4.2</label>
<title>Canonical features of L3 cells</title>
<p>L3 cells are expected to be driven by their apical dendrites to tune to contextually predictable &#x2013; <italic>canonical</italic>, according to our terminology &#x2013; features. Such features occupy a particular subspace in the mesocolumn&#x2019;s state/feature space, and the extracted canonical variates give us the principal axes of this canonical feature subspace. In choosing their features, L3 cells should be attracted to the canonical variates according to their contextual predictability. We explored this feature-selecting mechanism in our extended field of 19 macrocolumns (<xref ref-type="fig" rid="fig3">Figure 3A</xref>) by providing the L3 compartment of the central mesocolumn (red-shaded in <xref ref-type="fig" rid="fig3">Figure 3A</xref>) with 150 cells, each modeled as a pair of basal and apical dendrites. In each L3 cell, its basal dendrite was given afferent input from 1,050 L4 cells of its own and 6 immediately adjacent mesocolumns (150&#x202F;L4 cells per mesocolumn), which together make up a macrocolumn (blue-shaded in <xref ref-type="fig" rid="fig3">Figure 3A</xref>). The vector of the weights of these L4 connections to the cell&#x2019;s basal dendrite (<inline-formula>
<mml:math id="M102">
<mml:mover accent="true">
<mml:mi>u</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> in <xref ref-type="disp-formula" rid="EQ4">Equation 4</xref>) determines that dendrite&#x2019;s preferred direction in the mesocolumn&#x2019;s L3 state space and thus that cell&#x2019;s preferred feature. The apical dendrite of each L3 cell was given contextual input from the 18 more distant mesocolumns (black-shaded in <xref ref-type="fig" rid="fig3">Figure 3A</xref>) in the form of their 15 statistically significant canonical variates (for further details, see Methods section 3.1.6). The apical dendrite learns to produce output that best matches the output of the basal dendrite and vice versa.</p>
<p>Feature selectivities of L3 cells were developed by repeatedly exposing the model to randomly picked dataset images and adjusting the weights of the Hebbian basal and apical connections of L3 cells, gradually driving them into stable connectional patterns (<xref ref-type="fig" rid="fig7">Figure 7</xref>). After such training, the apical and basal dendrites of L3 cells developed prominent correlations in their responses to image patches (<xref ref-type="fig" rid="fig8">Figure 8A</xref>), demonstrating that all 150 L3 cells succeeded in tuning to contextually predictable features. Furthermore, <xref ref-type="fig" rid="fig8">Figure 8B</xref> shows that cross-correlations between basal outputs of different L3 cells residing in the same mesocolumn are low, indicating that these cells tuned to diverse canonical features.</p>
<fig position="float" id="fig7">
<label>Figure 7</label>
<caption>
<p>Time-course of L3 cells&#x2019; development of feature selectivities. Hebbian connections of the basal and apical dendrites of L3 cells were developed by modifying them iteratively over 1,000 steps based on pre- and post-synaptic activity correlations computed in response to 5,000 visual input patterns. To see how quickly the cells converge to their final connectional patterns, responses of each cell to a particular set of test input patterns were obtained after completion of 1,000 connection updates, and these responses were correlated with responses to the same test set obtained after each connection update prior to the final one, thus using the correlation coefficient to express the similarity of the cell&#x2019;s tuning at each update step to its final tuning. The plot shows superimposed the progressions of these correlation coefficients of all 150 L3 cells, from the first update to the last, revealing fast convergence to the final state without any meandering around.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g007.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Line graph showing the correlation with the final state on the y-axis versus the number of L3 Hebbian learning updates on the x-axis. The correlation starts near zero and sharply increases, plateauing close to one as updates increase towards 1000.</alt-text>
</graphic>
</fig>
<fig position="float" id="fig8">
<label>Figure 8</label>
<caption>
<p>Successful tuning of L3 cells to contextually predictable features. <bold>(A)</bold> Uniformly high correlation (squared) of outputs of the apical and basal dendrites of the 150 cells in the mesocolumn&#x2019;s L3 compartment. <bold>(B)</bold> Distribution of pairwise correlations (squared, keeping the sign) of outputs of basal dendrites of all 150 L3 cells, revealing their low similarity. <bold>(C)</bold> Basal dendrite correlations (squared, keeping the sign) of all L3 cells with each of the first 15 canonical variates (horizontal tick marks), showing that each L3 cell acquired gradually declining sensitivity to each of the first 11 variates. <bold>(D)</bold> Average magnitude of correlations (squared) of canonical variates with outputs of the 150 L4 cells in the mesocolumn (black bars) and outputs of basal dendrites of the 150 L3 cells (white bars), revealing complete insensitivity of L4 cells to canonical variates. Also plotted are the average correlations of canonical variates with 150 L3 cells in the no-context L3 model (gray bars). Development of feature selectivities of L3 cells was repeated 10 times, each time starting by assigning initial connection weights to L4 cells at random and training them on a different randomly selected sequence of image patches, then extracting canonical variates using another randomly selected set of image patches, followed by the same in L3. The bars in the plot show the means and SEM of the average correlations determined in the 10 runs. In all runs, L3 cells developed similar feature selectivities.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g008.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Four graphs showing statistical data: A. Bar graph of apical-basal correlation squared for L3 cells, ranging mostly between 0.4 and 0.6. B. Histogram of L3 basal-basal correlation squared, centered around zero with a peak at 0%. C. Scatter plot of correlation squared values against canonical variates one to fifteen, showing a diverse range of values. D. Bar graph of average correlation squared over canonical variates, with a decreasing trend. Each graph illustrates correlations relevant to L3 cells.</alt-text>
</graphic>
</fig>
<p><xref ref-type="fig" rid="fig8">Figure 8C</xref> provides some insight into the nature of the features chosen by the 150 L3 cells. It plots correlations of the basal dendrite of each L3 cell in the central mesocolumn with each of the first 15 canonical variates computed for that mesocolumn. The plot shows that each L3 cell developed either positive or negative sensitivity to each of the first 11 canonical variates, declining gradually from the first to the last variate. Combined with information in <xref ref-type="fig" rid="fig8">Figure 8B</xref>, this indicates that L3 cells picked different mixes of positive and negative sensitivities to the 11 variates. If we view the canonical feature space defined by the first 11 variates as an 11-dimensional hypercube, <xref ref-type="fig" rid="fig8">Figures 8B</xref>,<xref ref-type="fig" rid="fig8">C</xref> indicate that L3 cells picked different corners of this hypercube. Unlike L3 cells, L4 cells do not have any preferential sensitivity to the canonical variates (compare white- and black-shaded bars in <xref ref-type="fig" rid="fig8">Figure 8D</xref>). The prominent preferential sensitivity of L3 cells is the product of L3 self-organization. As our no-context L3 model shows, L3 self-organization without contextual guidance from surrounding columns also can to some degree enhance cells&#x2019; sensitivity to canonical variates (compare black- and gray-shaded bars in <xref ref-type="fig" rid="fig8">Figure 8D</xref>), but much less than under contextual guidance.</p>
<p>When evaluated by their responses to moving images of sinewave gratings, 80% of L3 cells fall in the complex-cell category, whereas 20% of L3 cells fall in the simple-cell category (<xref ref-type="fig" rid="fig9">Figure 9A</xref>). This suggests that as a group, L3 cells in a mesocolumn should be able to represent both the orientation and position of grating images in their output activity vector <inline-formula>
<mml:math id="M103">
<mml:mover accent="true">
<mml:mi>&#x03C6;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> (<xref ref-type="disp-formula" rid="EQ4">Equation 4</xref>). To show how well they can do it, we expose the RF of the central mesocolumn to a grating pattern of randomly selected orientation, spatial frequency, and position in the RF, and compute the <inline-formula>
<mml:math id="M104">
<mml:msub>
<mml:mover accent="true">
<mml:mi>&#x03C6;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:math>
</inline-formula> response it evokes in the 150 L3 cells in the central mesocolumn. We then rotate the grating pattern by a randomly chosen angle <italic>&#x03B1;</italic>, compute the new <inline-formula>
<mml:math id="M105">
<mml:msub>
<mml:mover accent="true">
<mml:mi>&#x03C6;</mml:mi>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
<mml:mi>&#x03B1;</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> response of L3 cells, and measure the angle between the two L3 output vectors <inline-formula>
<mml:math id="M106">
<mml:mover accent="true">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math id="M107">
<mml:mover accent="true">
<mml:msub>
<mml:mi>&#x03C6;</mml:mi>
<mml:mi>&#x03B1;</mml:mi>
</mml:msub>
<mml:mo stretchy="true">&#x2192;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula>. <xref ref-type="fig" rid="fig9">Figure 9B</xref> plots the average L3 angle as a function of the angle between the two gratings (gray curve). For a comparison, we also plot the average angle computed for the output vectors of the 150 L4 cells in the central mesocolumn (black curve). In <xref ref-type="fig" rid="fig9">Figure 9C</xref>, instead of rotating, we translate the grating pattern by a randomly chosen fraction (phase) of the grating&#x2019;s period, compute the new response of L4 and L3 cells, and measure the angle between the two L3 output vectors and between the two L4 output vectors. <xref ref-type="fig" rid="fig9">Figure 9C</xref> plots the average L3 (gray) and L4 (black) angles as a function of the phase shift between the two gratings. The plots show that both L4 and L3 output vectors can discriminate even small differences in gratings&#x2019; orientation or position in the RF. It is interesting to note that even at the maximal orientation (90&#x00B0;) or spatial phase (180&#x00B0;) differences between two gratings, L3 output vectors show less than maximal (90&#x00B0;) separation, reflecting the fact that other than for their orientation or phase, the two gratings are the same.</p>
<fig position="float" id="fig9">
<label>Figure 9</label>
<caption>
<p>Responses of L3 cells to grating patterns. <bold>(A)</bold> F1/F0 scores of the 150 cells in the mesocolumn&#x2019;s L3 compartment, spanning the range from clearly simple-cell (&#x003E; 1) to clearly complex-cell (&#x003C;1) categories. This distribution of ratios resembles that found in the upper layers in the real V1 cortex (<xref ref-type="fig" rid="fig1">Figure 1A</xref>; <xref ref-type="bibr" rid="ref44">Kim and Freeman, 2016</xref>). <bold>(B)</bold> Discrimination of the grating orientations by the output vector of the 150 cells in the mesocolumn&#x2019;s L4 compartment (black curve) and the 150 cells in the mesocolumn&#x2019;s L3 compartment (gray curve). The average angle between two L4 or L3 output vectors is plotted as a function of the angle between orientations of the two compared gratings. <bold>(C)</bold> Discrimination of the grating placements by the output vector of the 150 cells in the mesocolumn&#x2019;s L4 compartment (black curve) and the 150 cells in the mesocolumn&#x2019;s L3 compartment (gray curve). The average angle between two L4 or L3 output vectors is plotted as a function of the phase shift of the two compared gratings. Vertical bars are standard deviations.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g009.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel A shows a histogram of the F1/F0 ratio, depicting the percentage of L3 cells. Panel B is a line graph showing the angle between cortical vectors versus grating orientations, comparing L3 and L4 layers. Panel C displays a similar graph for grating cycle phase differences. L4 shows a larger angle range compared to L3 in both B and C. Error bars are present in all graphs.</alt-text>
</graphic>
</fig>
<p><xref ref-type="fig" rid="fig10">Figure 10</xref> demonstrates the importance of contextual guidance for the development of biologically realistic feature properties in L3 cells. To test orientation tuning of L4 and L3 cells in the model, each cell was stimulated with moving grating patterns of the optimal spatial frequency and the full 180&#x00B0; range of orientations. The tightness of the cell&#x2019;s orientation tuning was expressed by the standard half-width at half-height (HWHH) of the orientation tuning curve. <xref ref-type="fig" rid="fig10">Figure 10</xref> plots the F1/F0 ratio determined for each cell against its HWHH. The model&#x2019;s L4 cells are shown as blue circles, L3 cells as red dots, and L3 cells of the no-context model as green dots, revealing that all L4 cells are most tightly tuned to orientation (average HWHH&#x202F;=&#x202F;18&#x00B0;, matching real cat V1) and belong to the simple-cell category, L3 cells are also well-tuned to orientation and have a biologically accurate proportion of simple- and complex-cell categories, whereas L3 cells in the no-context model fail to develop translational invariance and have poor orientation tuning.</p>
<fig position="float" id="fig10">
<label>Figure 10</label>
<caption>
<p>Importance of contextual guidance for the development of biologically realistic feature properties in L3 cells. Plotted against each other are the F1/F0 ratio and half-width at half-height (HWHH) of orientation tuning of the model&#x2019;s L4 cells (blue circles) and contextually guided L3 cells (red dots), as well as L3 cells of the no-context model (green dots), showing that L4 cells and contextually guided L3 cells acquire biologically correct orientation tuning and translational invariance properties, whereas in the absence of contextual guidance L3 cells fail to do so.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g010.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Scatter plot showing orientation tuning half-width at half-height (HWHH) versus F1/F0 ratio. Points are color-coded: red for complex cells, blue for simple cells, and green for another type. Complex cells cluster on the left with lower F1/F0 ratios, while simple cells appear on the right with higher ratios.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec19">
<label>4.3</label>
<title>L3 emergent properties</title>
<p>In the real cortex, long-range horizontal connections link cortical columns separated by up to several millimeters in a cortical area. They preferentially link cortical sites that share similar functional properties but have non-overlapping RFs (<xref ref-type="bibr" rid="ref35">Gilbert and Wiesel, 1983</xref>; <xref ref-type="bibr" rid="ref22">DeFelipe et al., 1986</xref>; <xref ref-type="bibr" rid="ref57">Lund et al., 1993</xref>; <xref ref-type="bibr" rid="ref13">Burton and Fabri, 1995</xref>; <xref ref-type="bibr" rid="ref8">Bosking et al., 1997</xref>). The fact that input patterns encountered by mesocolumns in their RFs possess contextually predictable features makes it possible for such long-range horizontal connections to establish Hebbian links between distant cortical columns even though they have non-overlapping RFs. When L3 cells tune to contextually predictable features, they become correlated with similar L3 cells in surrounding columns in their stimulation-evoked activities. <xref ref-type="fig" rid="fig11">Figure 11</xref> shows the magnitude of such correlations between L3 cells in the central mesocolumn and functionally identical L3 cells in the first and second ring of surrounding mesocolumns. For a comparison, <xref ref-type="fig" rid="fig11">Figure 11</xref> also shows that even in the first ring of mesocolumns, functionally identical L4 cells have very low correlations, which means that they would not be able to establish lateral Hebbian connections.</p>
<fig position="float" id="fig11">
<label>Figure 11</label>
<caption>
<p>Correlations of cells in the central and surrounding macrocolumns in response to natural images. Plotted are distributions of magnitudes of correlation between functionally identical L4 and L3 cells in the central vs. the 1st and 2nd rings of surrounding macrocolumns. Substantial correlations at the level of L3 offer a substrate for growing Hebbian short- and long-range horizontal connections.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g011.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Graph showing the fraction of cell pairs versus the absolute correlation coefficient. It includes three peaks labeled L4 1st ring, L3 2nd ring, and L3 1st ring, peaking at different coefficients. The y-axis ranges from 0 to 30 percent, and the x-axis ranges from 0 to 1.</alt-text>
</graphic>
</fig>
<p>Canonical features learned by L3 cells characterize input patterns in many different ways that reflect the orderly aspects of the sensed outside world. This makes it possible for different input patterns, which are in some way objectively related, to be preferentially clustered in the L3 output space. We demonstrate this clustering tendency on an example of 4 different 512&#x202F;&#x00D7;&#x202F;512 pixel texture images shown in <xref ref-type="fig" rid="fig12">Figure 12A</xref>. We exposed the field of 19 mesocolumns to 500 randomly picked locations in each of the 4 texture images, and for each location we averaged the responses of L3 cells tuned to the same feature across 19 mesocolumns, resulting in a 150-dimensional feature vector representation of the imaged texture field. We next did Principal Component Analysis (PCA) on the 500&#x202F;&#x00D7;&#x202F;4 feature vectors. In <xref ref-type="fig" rid="fig12">Figure 12B</xref>, we plot the computed scores of the first 3 principal components, color-coding them according to the texture images from which they originated. This 3-D plot reveals that L3 responses to the 4 different textures occupy non-overlapping regions in the principal components space. For a comparison, <xref ref-type="fig" rid="fig12">Figure 12C</xref> shows the same plot for responses of thalamic LGN cells, which provided the input to the 19 cortical mesocolumns. As expected, LGN responses to the 4 different textures show no sign of preferential clustering.</p>
<fig position="float" id="fig12">
<label>Figure 12</label>
<caption>
<p>Separate clustering of different textures in the L3 output space but not in the L4 input space. <bold>(A)</bold> Four texture images used for demonstration. The viewing window of the central and 2 rings of macrocolumns (<xref ref-type="fig" rid="fig3">Figure 3B</xref>) was placed at 500 random locations in each of these images to obtain responses of all their L3 cells, yielding a 150-dimensional activity vector for each location. These vectors were converted to principal component scores by performing PCA on the 2,000 vectors. <bold>(B)</bold> 3D plot of the scores of the first 3 principal components, color-coding each L3 activity vector by the frame color of its source texture image. L3 vectors coming from the same texture image cluster separately from other vectors, reflecting prominent visual differences among the 4 textures. <bold>(C)</bold> 3D scores plot of the afferent input vectors from LGN layer to L4, revealing that these activity vectors are all mixed together.</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g012.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel A displays four grayscale texture patterns with different border colors: red, black, green, and blue. Panel B is a 3D scatter plot labeled "L3" with dots in red, blue, green, and black. Panel C shows another 3D scatter plot labeled "LGN" with similar color-coded dots, indicating data clustering.</alt-text>
</graphic>
</fig>
<p>We expressed the similarity of L3 output vectors evoked in response to different randomly picked locations in the same texture image by computing correlations between pairs of such vectors. <xref ref-type="fig" rid="fig13">Figure 13</xref> plots average correlations (squared, keeping the sign) for each of the 13 texture images in the <xref ref-type="bibr" rid="ref9">Brodatz (1966)</xref> database. Also plotted are average correlations computed for the L4 response vectors and vectors of 15 significant canonical variates. As the plot shows, unlike L4 vectors, both L3 cell and canonical variate vectors evoked by different views of the same texture show substantial similarity. Also noticeable is that L3 cells consistently show greater similarity than canonical variates (compare red and green bars), demonstrating the advantages of the overcomplete representation of the mesocolumn&#x2019;s 15-D canonical feature space by 150 L3 cells.</p>
<fig position="float" id="fig13">
<label>Figure 13</label>
<caption>
<p>Similarity of output activity patterns evoked in L3, but not in L4, by different locations in the same texture image, reflecting their shared higher-order statistics. Responses of L4 and L3 cells in 19 mesocolumns, as well as their canonical variates, were obtained for 200 randomly placed locations in each of the 13 texture images in the Brodatz database, similar to <xref ref-type="fig" rid="fig12">Figure 12</xref>. Response profiles obtained from each texture image were cross-correlated, and the average and standard deviation of these correlations were plotted separately for L4 (blue bars), canonical variates (green bars), and L3 (red bars) responses, showing that L4 responses had little, if any, similarity (the average correlation across the 13 images&#x202F;=&#x202F;0.03), whereas L3 responses were more similar than canonical variate responses (13-image averages of 0.43 and 0.25, respectively).</p>
</caption>
<graphic xlink:href="fncir-19-1615232-g013.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Bar graph showing average correlation squared for textures one to thirteen. Blue (L4), green (variates), and red (L3) bars represent different variables. Red bars are generally higher, indicating stronger correlations for L3.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="sec20">
<label>5</label>
<title>Discussion</title>
<sec id="sec21">
<label>5.1</label>
<title>Model accomplishments</title>
<p>The results of our cortical model simulations support the biological plausibility of the proposed mechanism of cortical feature tuning and offer new insights into the nature of information extraction by neocortical networks. While the potential usefulness of contextual guidance for feature tuning has long been recognized (see Introduction), so far it has only been explored at an abstract level or using greatly reduced &#x201C;toy&#x201D; models. In this paper we explore actual biological means by which neocortex tunes its neurons to contextually predictable features. Such means are likely to be the backbone of functional organization of cortical columns.</p>
<p>The starting point in our biologically grounded exploration was the consideration that the tuned features have to be nonlinear. Our proposed two-stage solution is that, similar to artificial neural networks, feature tuning relies on hidden layer-like preprocessing, performed by the afferent input layer L4. That is, a local group of L4 neurons together perform a nonlinear transform of their thalamic inputs, which is akin to a basic RBF transform. Such a transform accomplishes pluripotent function linearization, thus allowing L3 cells in the second stage to extract their features by simple linear summation of their L4 inputs.</p>
<p>Simplifying the task of feature tuning to that of linear operation over the L4 transform allowed us to determine &#x2013; using an objective-function optimizing algorithm derived in Section 2.4 &#x2013; that an RF of a representative V1 cortical column is likely to possess around 15 independent contextually predictable features, which we called canonical variates (<xref ref-type="fig" rid="fig4">Figure 4B</xref>). Furthermore, we determined that the transform-performing group of L4 cells will need at least 150 members in order to maximize the contextual predictability of all the canonical variates in its RF (<xref ref-type="fig" rid="fig6">Figure 6</xref>). Such a number is much greater than the 30&#x2013;60 excitatory cells found in the L4 compartment of a single 0.05&#x202F;mm-diameter cortical minicolumn (which is the narrowest columnar entity in the neocortex), but much smaller than the total number of excitatory L4 cells in the 0.5&#x202F;mm-diameter macrocolumn. This finding leads us to propose a new class of cortical columns, the 0.15&#x202F;mm-diameter mesocolumn. It is estimated to comprise a local group of 7 minicolumns, all innervated by the same bundle of afferent axons, and to have 200&#x2013;400&#x202F;L4 excitatory cells, which together perform the pluripotent function linearizing transform of the mesocolumn&#x2019;s afferent input.</p>
<p>Moving to the second stage of cortical feature extraction, which takes place in the upper layers, both anatomical evidence and model studies indicate that an L3 pyramidal cell extracts its feature from the L4 input it receives from not just its own mesocolumn, but from a macrocolumn-size group of 7 mesocolumns. Anatomical segregation of the ascending L4 inputs to the basal dendrites and the long-range horizontal inputs to the apical dendrites of L3 pyramidal cells, combined with their separate spike-generating synaptic input integrating centers, allows basal and apical dendrites to have separate &#x2013; classical and extra-classical &#x2013; RFs and develop RF properties that will maximize covariance of the cell&#x2019;s apical and basal outputs (<xref ref-type="bibr" rid="ref46">Kording and Konig, 2000</xref>; <xref ref-type="bibr" rid="ref43">Kay and Phillips, 2011</xref>). Our model simulations, based on Hebbian plasticity of apical and basal synapses, show that contextual inputs to the apical dendrites readily drive basal dendrites to select contextually predictable (i.e., canonical) features in their classical RFs. Similarly to real V1 cortex, 80% of model L3 cells acquire complex-cell RF properties while 20% acquire simple-cell properties (<xref ref-type="bibr" rid="ref34">Gilbert, 1977</xref>; <xref ref-type="bibr" rid="ref44">Kim and Freeman, 2016</xref>). Overall, the design of the model and its emergent properties are fully consistent with the known properties of cortical organization.</p>
<p>If cells in the mesocolumn&#x2019;s L3 compartment did not push each other to select different features, they would all tune exclusively to the first &#x2013; most predictable and thus most attractive &#x2013; canonical variate. However, diversification pressures drive L3 cells to choose the second best solution. Rather than tuning to one or a mix of a few of the canonical variates, all L3 cells in the mesocolumn become sensitive to all of the first 11 variates. This sensitivity declines gradually from the 1st to the 11th variate in all cells (<xref ref-type="fig" rid="fig8">Figure 8C</xref>). For each variate, all L3 cells develop approximately the same correlation with it but they differ in the sign of that correlation. Thus, each L3 cell carries the maximal information it can about all of the first 11 variates (rather than emphasizing a subset of variates), with each variate contributing either positively or negatively in the pattern unique to that cell. As a result, L3 can be considered as approximating a Hadamard-like domain transform of the first 11 canonical variates, decomposing them into a set of constituent functions (canonical features) over all variates. The L3 transform differs from the Hadamard transform in that its transform functions are not orthogonal, and their number (200&#x2013;400) greatly exceeds the number of variates (11). That is, L3 generates an overcomplete representation of canonical variates.</p>
<p>Considered geometrically, diversification pressures among cells in the mesocolumn&#x2019;s L3 compartment drive them to choose different preferred directions in the mesocolumn&#x2019;s canonical feature subspace. If we view the canonical feature space defined by the first 11 variates as an 11-dimensional hypercube, we find that L3 cells pick different corners of this hypercube. Such a hypercube will have 2048 corners to choose from. It is intriguing that while 200&#x2013;400&#x202F;L3 cells in a mesocolumn will not be able to pick all these corners, the larger columnar entity comprising a group of 7 mesocolumns &#x2013; together making up a macrocolumn and sharing L4 input &#x2013; will have just the right number of L3 cells for such a task.</p>
<p>As pointed out in the Introduction, the orderly &#x2013; as evidenced by their contextual predictability &#x2013; nature of canonical features reflects the orderly structures in the environment. In tuning selectively to canonical features, L3 performs selective filtering of the information it receives from L4, emphasizing information about orderly aspects of the sensed environment and downplaying local, likely to be insignificant or distracting, information. Despite selective filtering and overcomplete representation of the canonical feature subspace, L3 output preserves excellent discrimination capabilities (<xref ref-type="fig" rid="fig9">Figure 9</xref>) while acquiring novel categorization/abstraction ability to preferentially cluster in the L3 output space different input patterns that are in some way objectively related (<xref ref-type="fig" rid="fig12">Figure 12</xref>). Furthermore, reduced sensitivity of L3 output to distracting irrelevant details should help the L4 in the next cortical area to minimize the Curse of Dimensionality and to succeed in the next round of pluripotent function linearization, and for the next L3 to find higher-order canonical features.</p>
</sec>
<sec id="sec22">
<label>5.2</label>
<title>The model&#x2019;s antecedents</title>
<p>The general idea of using spatiotemporal coherence to discover useful regularities in inputs was introduced by <xref ref-type="bibr" rid="ref6">Becker and Hinton (1992)</xref> and later elaborated by <xref ref-type="bibr" rid="ref5">Becker (1996)</xref>. Their IMAX learning procedure discovers regularities in multiview inputs by maximizing mutual information between outputs of two nonlinear multilayer network modules that receive nonoverlapping, but spatially or temporally related, input samples, thus tuning to higher-order input features reflecting common distal causes in the external world. Details of IMAX design, however, make it unsuitable for implementation in the cerebral cortex (<xref ref-type="bibr" rid="ref5">Becker, 1996</xref>). <xref ref-type="bibr" rid="ref66">Phillips and Singer (1997)</xref> suggested a way of making computation of mutual information biologically more plausible, and it is one of the cornerstones of their Coherent Infomax theory. They consider abstract local processors, loosely analogous to unspecified local cortical circuits, that receive both the afferent input from their RFs and lateral (contextual field) input from other such local processors. The contextual field input guides local processors to tune to those stimulus features in their RFs that are predictably related to the context in which they occur. According to Coherent Infomax, contextual inputs can be used not only to guide learning but, importantly, also modulate short-term processing of sensory information. <xref ref-type="bibr" rid="ref66">Phillips and Singer (1997)</xref> derived a particular mechanism for how contextually-guided learning might be accomplished. Unfortunately, that mechanism is limited in its practical utility due to its inability to search for nonlinear correlations. 
In a later development of the theory, <xref ref-type="bibr" rid="ref43">Kay and Phillips (2011)</xref> showed that Coherent Infomax is consistent with a particular Bayesian interpretation for the contextual guidance of learning and processing and suggested learning rules that are more computationally feasible within systems composed of very many local processors.</p>
<p>Rather than invoking abstract local processors, <xref ref-type="bibr" rid="ref46">Kording and Konig (2000)</xref> proposed that contextual guidance of feature tuning is implemented in individual pyramidal neurons, in which the apical dendrite acts &#x2013; in addition to the soma &#x2013; as a second site of integration capable of generating action potentials. Synaptic inputs to the soma site, coming from the cell&#x2019;s RF, mainly determine the output activity of the post-synaptic neuron. Contextual inputs to the apical site gate synaptic plasticity. This separation makes it possible for contextual information to avoid confounding the effects of processing and learning. In &#x201C;toy&#x201D; simulations of such 2-site neurons receiving nonoverlapping but correlated inputs to their somata while sending their &#x201C;teaching&#x201D; outputs to each other&#x2019;s apical site, cells learned to represent only the coherent part of the input, which would be expected to be relevant to the processing at higher stages. Kording and Konig termed their design Relevant Infomax.</p>
<p>To explain how 2-site pyramidal neurons might be able to tune to nonlinear features in their inputs, the challenge which was not addressed by the Kording and Konig model, <xref ref-type="bibr" rid="ref30">Favorov and Ryder (2004)</xref> proposed that since dendritic trees are fundamentally nonlinear integrators, they might be able to operate functionally as error backpropagating multilayer perceptrons (MLP). In their SINBAD (acronym for <italic>Set of INteracting BAckpropagating Dendrites</italic>) neuron model (<xref ref-type="bibr" rid="ref72">Ryder and Favorov, 2001</xref>), the apical dendrite in each pyramidal cell functions as one MLP and the basal dendrites function as the second MLP, using each other&#x2019;s output activities as their reciprocal backpropagating teaching signals. While SINBAD cells are very powerful in discovering high-order nonlinear regularities hidden in multiview sensory inputs, effectively approximating Gebelein&#x2019;s maximal correlation (<xref ref-type="bibr" rid="ref49">Kursun and Favorov, 2010</xref>), it has become clear that they are not biologically feasible because, while action potentials do backpropagate from the initial axon segment up the apical dendrite, their experimentally observed amplitude modulation is not consistent with what would be required in the error signal. Furthermore, this design depends on a complete separation of the inputs to the apical and basal dendrites, which is not observed in the real cortex. Instead, a much more biologically appealing solution for the necessity of tuning cells to nonlinear features is to make use of pluripotent function linearization in L4 (<xref ref-type="bibr" rid="ref28">Favorov and Kursun, 2011</xref>), followed by linear learning in L3, as is explored in this paper.</p>
</sec>
<sec id="sec23">
<label>5.3</label>
<title>Model limitations</title>
<p>The model of contextual guidance of feature selection explored in this paper is not complete. In addition to spatial context, which was investigated here, contextual guidance can come from temporal context in which orderly features occur, as well as from higher-level understanding of the overall situation. In this paper, we only used static images and thus confined ourselves to spatial features of orderly structures, leaving temporal features of orderly processes for later studies. We anticipate that studies of feature acquisition under temporal contextual guidance and feedback from higher-level cortical areas will make it necessary to expand our current L4-L3 model by adding deep layers and layer 2, resulting in a cortical column model incorporating all cortical layers.</p>
<p>The biological realism of neurons modeled in this paper is not complete. Unlike real neurons, which have binary outputs and are either excitatory or inhibitory, but not both, the modeled cells have outputs that are continuous variables in a negative&#x2013;positive range and have connections that in the process of learning can change their sign. Adding this degree of biological realism to the model will be insightful, but we do not expect it to negate the lessons learned using the current model. Also, some of the mathematical techniques used in the model, such as normalization of the connection weights in <xref ref-type="disp-formula" rid="EQ17 EQ23 EQ25">Equations 17, 23, 25</xref>, might only approximate the true homeostatic mechanisms in the cortex (e.g., <xref ref-type="bibr" rid="ref88">Turrigiano et al., 1998</xref>) and should be investigated further.</p>
<p>Sensory cortical columns are engaged not only in feature extraction and sensory information transmission to higher cortical areas, but also in other tasks, such as across-column binding by selective spike synchronization (<xref ref-type="bibr" rid="ref89">Uhlhaas et al., 2009</xref>; <xref ref-type="bibr" rid="ref78">Singer and Lazar, 2016</xref>), dynamic contrast enhancement and focused attention (<xref ref-type="bibr" rid="ref76">Schummers et al., 2005</xref>; <xref ref-type="bibr" rid="ref86">Tommerdahl et al., 2010</xref>; <xref ref-type="bibr" rid="ref85">Tallon-Baudry, 2012</xref>), predictive computation (<xref ref-type="bibr" rid="ref11">Bubic et al., 2010</xref>; <xref ref-type="bibr" rid="ref29">Favorov et al., 2015</xref>; <xref ref-type="bibr" rid="ref59">Marvan and Phillips, 2024</xref>; <xref ref-type="bibr" rid="ref33">George et al., 2025</xref>), etc. Correspondingly, output of real pyramidal cells in L3 is determined not only by synaptic integration of L4 inputs by the basal dendrites, as was done in the current paper, but also by local excitatory and inhibitory inputs, input from the apical dendrite, and other sources (<xref ref-type="bibr" rid="ref2">Angelucci and Bressloff, 2006</xref>). Our current model lacks all this machinery since its sole purpose was to investigate mechanisms determining classical RF and feature tuning properties of cortical neurons. However, assuming that our proposed mesocolumn-based mechanism of 2-stage feature extraction is biologically realistic, our current model provides a starting point, constraints, and guidance in building a progressively more comprehensive model of cortical functional organization.</p>
</sec>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec24">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article; further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="sec25">
<title>Author contributions</title>
<p>OF: Validation, Conceptualization, Investigation, Visualization, Resources, Data curation, Software, Formal analysis, Project administration, Supervision, Writing &#x2013; review &#x0026; editing, Methodology, Writing &#x2013; original draft. OK: Data curation, Project administration, Resources, Validation, Formal analysis, Methodology, Visualization, Funding acquisition, Conceptualization, Investigation, Writing &#x2013; review &#x0026; editing, Software, Supervision, Writing &#x2013; original draft.</p>
</sec>
<sec sec-type="funding-information" id="sec26">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work was supported by National Science Foundation grant 2435093 and the J. Scott McFadyen Fund for Excellence in Parkinson&#x2019;s Disease Research.</p>
</sec>
<ack>
<p>We thank Drs. Richard Murrow and Tim Challener for valuable discussions and comments on the manuscript.</p>
</ack>
<sec sec-type="COI-statement" id="sec27">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec28">
<title>Generative AI statement</title>
<p>The authors declare that no Gen AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec29">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<fn-group>
<fn id="fn0001"><p><sup>1</sup><ext-link xlink:href="http://images.cocodataset.org/zips/val2017.zip" ext-link-type="uri">http://images.cocodataset.org/zips/val2017.zip</ext-link></p></fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Alpaydin</surname> <given-names>E.</given-names></name></person-group> (<year>2014</year>). <source>Introduction to machine learning, third edition</source>. <publisher-loc>Cambridge</publisher-loc>: <publisher-name>The MIT Press</publisher-name>.</citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Angelucci</surname> <given-names>A.</given-names></name> <name><surname>Bressloff</surname> <given-names>P. C.</given-names></name></person-group> (<year>2006</year>). <article-title>Contribution of feedforward, lateral and feedback connections to the classical receptive field center and extra-classical receptive field surround of primate V1 neurons</article-title>. <source>Prog. Brain Res.</source> <volume>154</volume>, <fpage>93</fpage>&#x2013;<lpage>120</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0079-6123(06)54005-1</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Barlow</surname> <given-names>H. B.</given-names></name></person-group> (<year>1992</year>). &#x201C;<article-title>The biological role of neocortex</article-title>&#x201D; in <source>Information processing in the cortex</source>. eds. <person-group person-group-type="editor"><name><surname>Aertsen</surname> <given-names>A.</given-names></name> <name><surname>Braitenberg</surname> <given-names>V.</given-names></name></person-group> (<publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>53</fpage>&#x2013;<lpage>80</lpage>.</citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beaulieu</surname> <given-names>C.</given-names></name> <name><surname>Colonnier</surname> <given-names>M.</given-names></name></person-group> (<year>1983</year>). <article-title>The number of neurons in the different laminae of the binocular and monocular regions of area 17 in the cat</article-title>. <source>J. Comp. Neurol.</source> <volume>217</volume>, <fpage>337</fpage>&#x2013;<lpage>344</lpage>. doi: <pub-id pub-id-type="doi">10.1002/cne.902170308</pub-id>, PMID: <pub-id pub-id-type="pmid">6411777</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Becker</surname> <given-names>S.</given-names></name></person-group> (<year>1996</year>). <article-title>Mutual information maximization: models of cortical self-organization</article-title>. <source>Network</source> <volume>7</volume>, <fpage>7</fpage>&#x2013;<lpage>31</lpage>. doi: <pub-id pub-id-type="doi">10.1080/0954898X.1996.11978653</pub-id>, PMID: <pub-id pub-id-type="pmid">29480142</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Becker</surname> <given-names>S.</given-names></name> <name><surname>Hinton</surname> <given-names>G. E.</given-names></name></person-group> (<year>1992</year>). <article-title>Self-organizing neural network that discovers surfaces in random-dot stereograms</article-title>. <source>Nature</source> <volume>355</volume>, <fpage>161</fpage>&#x2013;<lpage>163</lpage>. doi: <pub-id pub-id-type="doi">10.1038/355161a0</pub-id>, PMID: <pub-id pub-id-type="pmid">1729650</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bernander</surname> <given-names>O.</given-names></name> <name><surname>Koch</surname> <given-names>C.</given-names></name> <name><surname>Douglas</surname> <given-names>R. J.</given-names></name></person-group> (<year>1994</year>). <article-title>Amplification and linearization of distal synaptic input to cortical pyramidal cells</article-title>. <source>J. Neurophysiol.</source> <volume>72</volume>, <fpage>2743</fpage>&#x2013;<lpage>2753</lpage>. doi: <pub-id pub-id-type="doi">10.1152/jn.1994.72.6.2743</pub-id>, PMID: <pub-id pub-id-type="pmid">7897486</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bosking</surname> <given-names>W. H.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Schofield</surname> <given-names>B.</given-names></name> <name><surname>Fitzpatrick</surname> <given-names>D.</given-names></name></person-group> (<year>1997</year>). <article-title>Orientation selectivity and arrangement of horizontal connections in tree shrew striate cortex</article-title>. <source>J. Neurosci.</source> <volume>17</volume>, <fpage>2112</fpage>&#x2013;<lpage>2127</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.17-06-02112.1997</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Brodatz</surname> <given-names>P.</given-names></name></person-group> (<year>1966</year>). <source>Textures: A photographic album for artists and designers</source>. <publisher-loc>New York</publisher-loc>: <publisher-name>Dover Publications</publisher-name>.</citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bruno</surname> <given-names>R. M.</given-names></name> <name><surname>Simons</surname> <given-names>D. J.</given-names></name></person-group> (<year>2002</year>). <article-title>Feedforward mechanisms of excitatory and inhibitory cortical receptive fields</article-title>. <source>J. Neurosci.</source> <volume>22</volume>, <fpage>10966</fpage>&#x2013;<lpage>10975</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.22-24-10966.2002</pub-id>, PMID: <pub-id pub-id-type="pmid">12486192</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bubic</surname> <given-names>A.</given-names></name> <name><surname>von Cramon</surname> <given-names>D. Y.</given-names></name> <name><surname>Schubotz</surname> <given-names>R. I.</given-names></name></person-group> (<year>2010</year>). <article-title>Prediction, cognition and the brain</article-title>. <source>Front. Hum. Neurosci.</source> <volume>4</volume>:<fpage>25</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fnhum.2010.00025</pub-id>, PMID: <pub-id pub-id-type="pmid">20631856</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Budd</surname> <given-names>J. M. L.</given-names></name></person-group> (<year>2000</year>). <article-title>Inhibitory basket cell synaptic input to layer IV simple cells in cat striate visual cortex (area 17): a quantitative analysis of connectivity</article-title>. <source>Vis. Neurosci.</source> <volume>17</volume>, <fpage>331</fpage>&#x2013;<lpage>343</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S095252380017302X</pub-id>, PMID: <pub-id pub-id-type="pmid">10910102</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Burton</surname> <given-names>H.</given-names></name> <name><surname>Fabri</surname> <given-names>M.</given-names></name></person-group> (<year>1995</year>). <article-title>Ipsilateral intracortical connections of physiologically defined cutaneous representations in areas 3b and 1 of macaque monkeys: projections in the vicinity of the central sulcus</article-title>. <source>J. Comp. Neurol.</source> <volume>355</volume>, <fpage>508</fpage>&#x2013;<lpage>538</lpage>. doi: <pub-id pub-id-type="doi">10.1002/cne.903550404</pub-id>, PMID: <pub-id pub-id-type="pmid">7636029</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Buxhoeveden</surname> <given-names>D. P.</given-names></name> <name><surname>Casanova</surname> <given-names>M. F.</given-names></name></person-group> (<year>2002</year>). <article-title>The minicolumn hypothesis in neuroscience</article-title>. <source>Brain</source> <volume>125</volume>, <fpage>935</fpage>&#x2013;<lpage>951</lpage>. doi: <pub-id pub-id-type="doi">10.1093/brain/awf110</pub-id>, PMID: <pub-id pub-id-type="pmid">11960884</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Callaway</surname> <given-names>E. M.</given-names></name></person-group> (<year>2004</year>). <article-title>Feedforward, feedback and inhibitory connections in primate visual cortex</article-title>. <source>Neural Netw.</source> <volume>17</volume>, <fpage>625</fpage>&#x2013;<lpage>632</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neunet.2004.04.004</pub-id>, PMID: <pub-id pub-id-type="pmid">15288888</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cauller</surname> <given-names>L. J.</given-names></name> <name><surname>Connors</surname> <given-names>B. W.</given-names></name></person-group> (<year>1994</year>). <article-title>Synaptic physiology of horizontal afferents to layer I in slices of rat SI neocortex</article-title>. <source>J. Neurosci.</source> <volume>14</volume>, <fpage>751</fpage>&#x2013;<lpage>762</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.14-02-00751.1994</pub-id>, PMID: <pub-id pub-id-type="pmid">7905516</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cruikshank</surname> <given-names>S. J.</given-names></name> <name><surname>Lewis</surname> <given-names>T. J.</given-names></name> <name><surname>Connors</surname> <given-names>B. W.</given-names></name></person-group> (<year>2007</year>). <article-title>Synaptic basis for intense thalamocortical activation of feedforward inhibitory cells in neocortex</article-title>. <source>Nat. Neurosci.</source> <volume>10</volume>, <fpage>462</fpage>&#x2013;<lpage>468</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nn1861</pub-id>, PMID: <pub-id pub-id-type="pmid">17334362</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Da Costa</surname> <given-names>N. M.</given-names></name> <name><surname>Martin</surname> <given-names>K. A.</given-names></name></person-group> (<year>2010</year>). <article-title>Whose cortical column would that be?</article-title> <source>Front. Neuroanat.</source> <volume>4</volume>:<fpage>16</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fnana.2010.00016</pub-id>, PMID: <pub-id pub-id-type="pmid">20640245</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>de Sa</surname> <given-names>V.</given-names></name> <name><surname>Ballard</surname> <given-names>D. H.</given-names></name></person-group> (<year>1998</year>). <article-title>Category learning through multimodality sensing</article-title>. <source>Neural Comput.</source> <volume>10</volume>, <fpage>1097</fpage>&#x2013;<lpage>1117</lpage>. doi: <pub-id pub-id-type="doi">10.1162/089976698300017368</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Deco</surname> <given-names>G.</given-names></name> <name><surname>Obradovic</surname> <given-names>D.</given-names></name></person-group> (<year>1995</year>). <article-title>Decorrelated Hebbian learning for clustering and function approximation</article-title>. <source>Neural Comput.</source> <volume>7</volume>, <fpage>338</fpage>&#x2013;<lpage>348</lpage>. doi: <pub-id pub-id-type="doi">10.1162/neco.1995.7.2.338</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>DeFelipe</surname> <given-names>J.</given-names></name> <name><surname>Ballesteros-Yanez</surname> <given-names>I.</given-names></name> <name><surname>Inda</surname> <given-names>M. C.</given-names></name> <name><surname>Munoz</surname> <given-names>A.</given-names></name></person-group> (<year>2006</year>). <article-title>Double-bouquet cells in the monkey and human cerebral cortex with special reference to areas 17 and 18</article-title>. <source>Prog. Brain Res.</source> <volume>154</volume>, <fpage>15</fpage>&#x2013;<lpage>32</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0079-6123(06)54002-6</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>DeFelipe</surname> <given-names>J.</given-names></name> <name><surname>Conley</surname> <given-names>M.</given-names></name> <name><surname>Jones</surname> <given-names>E. G.</given-names></name></person-group> (<year>1986</year>). <article-title>Long-range focal collateralization of axons arising from corticocortical cells in monkey sensory-motor cortex</article-title>. <source>J. Neurosci.</source> <volume>6</volume>, <fpage>3749</fpage>&#x2013;<lpage>3766</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.06-12-03749.1986</pub-id>, PMID: <pub-id pub-id-type="pmid">2432205</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>DiCarlo</surname> <given-names>J. J.</given-names></name> <name><surname>Cox</surname> <given-names>D. D.</given-names></name></person-group> (<year>2007</year>). <article-title>Untangling invariant object recognition</article-title>. <source>Trends Cogn. Sci.</source> <volume>11</volume>, <fpage>333</fpage>&#x2013;<lpage>341</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tics.2007.06.010</pub-id>, PMID: <pub-id pub-id-type="pmid">17631409</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Egger</surname> <given-names>V.</given-names></name> <name><surname>Feldmeyer</surname> <given-names>D.</given-names></name> <name><surname>Sakmann</surname> <given-names>B.</given-names></name></person-group> (<year>1999</year>). <article-title>Coincidence detection and changes of synaptic efficacy in spiny stellate neurons in rat barrel cortex</article-title>. <source>Nat. Neurosci.</source> <volume>2</volume>, <fpage>1098</fpage>&#x2013;<lpage>1105</lpage>. doi: <pub-id pub-id-type="doi">10.1038/16026</pub-id>, PMID: <pub-id pub-id-type="pmid">10570487</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Favorov</surname> <given-names>O. V.</given-names></name> <name><surname>Diamond</surname> <given-names>M. E.</given-names></name></person-group> (<year>1990</year>). <article-title>Demonstration of discrete place-defined columns&#x2014;segregates&#x2014;in the cat SI</article-title>. <source>J. Comp. Neurol.</source> <volume>298</volume>, <fpage>97</fpage>&#x2013;<lpage>112</lpage>. doi: <pub-id pub-id-type="doi">10.1002/cne.902980108</pub-id>, PMID: <pub-id pub-id-type="pmid">2212100</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Favorov</surname> <given-names>O. V.</given-names></name> <name><surname>Kelly</surname> <given-names>D. G.</given-names></name></person-group> (<year>1996a</year>). &#x201C;<article-title>Local receptive field diversity within cortical neuronal populations</article-title>&#x201D; in <source>Somesthesis and the neurobiology of the somatosensory cortex</source>. eds. <person-group person-group-type="editor"><name><surname>Franzen</surname> <given-names>O.</given-names></name> <name><surname>Johansson</surname> <given-names>R.</given-names></name> <name><surname>Terenius</surname> <given-names>L.</given-names></name></person-group> (<publisher-loc>Basel</publisher-loc>: <publisher-name>Birkhauser Verlag AB</publisher-name>), <fpage>395</fpage>&#x2013;<lpage>408</lpage>.</citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Favorov</surname> <given-names>O. V.</given-names></name> <name><surname>Kelly</surname> <given-names>D. G.</given-names></name></person-group> (<year>1996b</year>). <article-title>Stimulus&#x2013;response diversity in local neuronal populations of the cerebral cortex</article-title>. <source>Neuroreport</source> <volume>7</volume>, <fpage>2293</fpage>&#x2013;<lpage>2301</lpage>. doi: <pub-id pub-id-type="doi">10.1097/00001756-199610020-00006</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Favorov</surname> <given-names>O. V.</given-names></name> <name><surname>Kursun</surname> <given-names>O.</given-names></name></person-group> (<year>2011</year>). <article-title>Neocortical layer 4 as a pluripotent function linearizer</article-title>. <source>J. Neurophysiol.</source> <volume>105</volume>, <fpage>1342</fpage>&#x2013;<lpage>1360</lpage>. doi: <pub-id pub-id-type="doi">10.1152/jn.00708.2010</pub-id>, PMID: <pub-id pub-id-type="pmid">21248059</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Favorov</surname> <given-names>O. V.</given-names></name> <name><surname>Nilaweera</surname> <given-names>W. U.</given-names></name> <name><surname>Miasnikov</surname> <given-names>A. A.</given-names></name> <name><surname>Beloozerova</surname> <given-names>I. N.</given-names></name></person-group> (<year>2015</year>). <article-title>Activity of somatosensory-responsive neurons in high subdivisions of SI cortex during locomotion</article-title>. <source>J. Neurosci.</source> <volume>35</volume>, <fpage>7763</fpage>&#x2013;<lpage>7776</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.3545-14.2015</pub-id>, PMID: <pub-id pub-id-type="pmid">25995465</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Favorov</surname> <given-names>O. V.</given-names></name> <name><surname>Ryder</surname> <given-names>D.</given-names></name></person-group> (<year>2004</year>). <article-title>SINBAD: a neocortical mechanism for discovering environmental variables and regularities hidden in sensory input</article-title>. <source>Biol. Cybern.</source> <volume>90</volume>, <fpage>191</fpage>&#x2013;<lpage>202</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00422-004-0464-8</pub-id>, PMID: <pub-id pub-id-type="pmid">15052482</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Favorov</surname> <given-names>O. V.</given-names></name> <name><surname>Whitsel</surname> <given-names>B. L.</given-names></name> <name><surname>Tommerdahl</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). &#x201C;<article-title>Discrete, place-defined macrocolumns in somatosensory cortex: lessons for modular organization of the cerebral cortex</article-title>&#x201D; in <source>Recent advances on the modular organization of the cortex</source>. eds. <person-group person-group-type="editor"><name><surname>Casanova</surname> <given-names>M. F.</given-names></name> <name><surname>Opris</surname> <given-names>I.</given-names></name></person-group> (<publisher-loc>New York</publisher-loc>: <publisher-name>Springer Science+Business Media Dordrecht</publisher-name>), <fpage>143</fpage>&#x2013;<lpage>156</lpage>.</citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Felleman</surname> <given-names>D. J.</given-names></name> <name><surname>Van Essen</surname> <given-names>D. C.</given-names></name></person-group> (<year>1991</year>). <article-title>Distributed hierarchical processing in the primate cerebral cortex</article-title>. <source>Cereb. Cortex</source> <volume>1</volume>, <fpage>1</fpage>&#x2013;<lpage>47</lpage>. doi: <pub-id pub-id-type="doi">10.1093/cercor/1.1.1-a</pub-id>, PMID: <pub-id pub-id-type="pmid">1822724</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>George</surname> <given-names>D.</given-names></name> <name><surname>Lazaro-Gredilla</surname> <given-names>M.</given-names></name> <name><surname>Lehrach</surname> <given-names>W.</given-names></name> <name><surname>Dedieu</surname> <given-names>A.</given-names></name> <name><surname>Zhou</surname> <given-names>G.</given-names></name> <name><surname>Marino</surname> <given-names>J.</given-names></name></person-group> (<year>2025</year>). <article-title>A detailed theory of thalamic and cortical microcircuits for predictive visual inference</article-title>. <source>Sci. Adv.</source> <volume>11</volume>:<fpage>eadr6698</fpage>. doi: <pub-id pub-id-type="doi">10.1126/sciadv.adr6698</pub-id>, PMID: <pub-id pub-id-type="pmid">39908384</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gilbert</surname> <given-names>C. D.</given-names></name></person-group> (<year>1977</year>). <article-title>Laminar differences in receptive field properties of cells in cat primary visual cortex</article-title>. <source>J. Physiol.</source> <volume>268</volume>, <fpage>391</fpage>&#x2013;<lpage>421</lpage>. doi: <pub-id pub-id-type="doi">10.1113/jphysiol.1977.sp011863</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gilbert</surname> <given-names>C. D.</given-names></name> <name><surname>Wiesel</surname> <given-names>T. N.</given-names></name></person-group> (<year>1983</year>). <article-title>Clustered intrinsic connections in cat visual cortex</article-title>. <source>J. Neurosci.</source> <volume>3</volume>, <fpage>1116</fpage>&#x2013;<lpage>1133</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.03-05-01116.1983</pub-id>, PMID: <pub-id pub-id-type="pmid">6188819</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Golub</surname> <given-names>G. H.</given-names></name> <name><surname>Van Loan</surname> <given-names>C. F.</given-names></name></person-group> (<year>2013</year>). <source>Matrix computations</source>. <edition>4th</edition> Edn. <publisher-loc>Baltimore, MD</publisher-loc>: <publisher-name>Johns Hopkins University Press</publisher-name>.</citation></ref>
<ref id="ref37"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Grubinger</surname> <given-names>M.</given-names></name> <name><surname>Clough</surname> <given-names>P.</given-names></name> <name><surname>M&#x00FC;ller</surname> <given-names>H.</given-names></name> <name><surname>Deselaers</surname> <given-names>T.</given-names></name></person-group> (<year>2006</year>) <article-title>The IAPR TC-12 benchmark: a new evaluation resource for visual information systems</article-title>. <conf-name>Proceedings of the OntoImage 2006 Language Resources for Content-Based Image Retrieval. Genoa, Italy</conf-name>. <volume>5</volume>, p. <fpage>10</fpage>. Available online at: <ext-link xlink:href="https://www.mathworks.com/help/deeplearning/ug/data-sets-for-deep-learning.html" ext-link-type="uri">https://www.mathworks.com/help/deeplearning/ug/data-sets-for-deep-learning.html</ext-link> (Accessed September 16, 2025).</citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hardoon</surname> <given-names>D.</given-names></name> <name><surname>Szedmak</surname> <given-names>S.</given-names></name> <name><surname>Shawe-Taylor</surname> <given-names>J.</given-names></name></person-group> (<year>2004</year>). <article-title>Canonical correlation analysis: an overview with application to learning methods</article-title>. <source>Neural Comput.</source> <volume>16</volume>, <fpage>2639</fpage>&#x2013;<lpage>2664</lpage>. doi: <pub-id pub-id-type="doi">10.1162/0899766042321814</pub-id>, PMID: <pub-id pub-id-type="pmid">15516276</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Hawkins</surname> <given-names>J.</given-names></name> <name><surname>Blakeslee</surname> <given-names>S.</given-names></name></person-group> (<year>2004</year>). <source>On Intelligence</source>. <publisher-loc>New York</publisher-loc>: <publisher-name>Owl Books</publisher-name>.</citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hirsch</surname> <given-names>J. A.</given-names></name> <name><surname>Martinez</surname> <given-names>L. M.</given-names></name> <name><surname>Pillai</surname> <given-names>C.</given-names></name> <name><surname>Alonso</surname> <given-names>J. M.</given-names></name> <name><surname>Wang</surname> <given-names>Q.</given-names></name> <name><surname>Sommer</surname> <given-names>F. T.</given-names></name></person-group> (<year>2003</year>). <article-title>Functionally distinct inhibitory neurons at the first stage of visual cortical processing</article-title>. <source>Nat. Neurosci.</source> <volume>6</volume>, <fpage>1300</fpage>&#x2013;<lpage>1308</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nn1152</pub-id>, PMID: <pub-id pub-id-type="pmid">14625553</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hotelling</surname> <given-names>H.</given-names></name></person-group> (<year>1936</year>). <article-title>Relations between two sets of variates</article-title>. <source>Biometrika</source> <volume>28</volume>, <fpage>321</fpage>&#x2013;<lpage>377</lpage>. doi: <pub-id pub-id-type="doi">10.1093/biomet/28.3-4.321</pub-id>, PMID: <pub-id pub-id-type="pmid">36970824</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hubel</surname> <given-names>D. H.</given-names></name> <name><surname>Wiesel</surname> <given-names>T. N.</given-names></name></person-group> (<year>1962</year>). <article-title>Receptive fields, binocular interactions and functional architecture in the cat&#x2019;s visual cortex</article-title>. <source>J. Physiol.</source> <volume>160</volume>, <fpage>106</fpage>&#x2013;<lpage>154</lpage>. doi: <pub-id pub-id-type="doi">10.1113/jphysiol.1962.sp006837</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kay</surname> <given-names>J. W.</given-names></name> <name><surname>Phillips</surname> <given-names>W. A.</given-names></name></person-group> (<year>2011</year>). <article-title>Coherent Infomax as a computational goal for neural systems</article-title>. <source>Bull. Math. Biol.</source> <volume>73</volume>, <fpage>344</fpage>&#x2013;<lpage>372</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11538-010-9564-x</pub-id>, PMID: <pub-id pub-id-type="pmid">20821064</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>T.</given-names></name> <name><surname>Freeman</surname> <given-names>R. D.</given-names></name></person-group> (<year>2016</year>). <article-title>Direction selectivity of neurons in visual cortex is non-linear and laminar dependent</article-title>. <source>Eur. J. Neurosci.</source> <volume>43</volume>, <fpage>1389</fpage>&#x2013;<lpage>1399</lpage>. doi: <pub-id pub-id-type="doi">10.1111/ejn.13223</pub-id></citation></ref>
<ref id="ref45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kisvarday</surname> <given-names>Z. F.</given-names></name> <name><surname>Martin</surname> <given-names>K. A. C.</given-names></name> <name><surname>Freund</surname> <given-names>T. F.</given-names></name> <name><surname>Magloczky</surname> <given-names>Z.</given-names></name> <name><surname>Whitteridge</surname> <given-names>D.</given-names></name> <name><surname>Somogyi</surname> <given-names>P.</given-names></name></person-group> (<year>1986</year>). <article-title>Synaptic targets of HRP-filled layer III pyramidal cells in the cat striate cortex</article-title>. <source>Exp. Brain Res.</source> <volume>64</volume>, <fpage>541</fpage>&#x2013;<lpage>552</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF00340492</pub-id></citation></ref>
<ref id="ref46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kording</surname> <given-names>K. P.</given-names></name> <name><surname>Konig</surname> <given-names>P.</given-names></name></person-group> (<year>2000</year>). <article-title>Learning with two sites of synaptic integration</article-title>. <source>Netw. Comput. Neural Syst.</source> <volume>11</volume>, <fpage>25</fpage>&#x2013;<lpage>39</lpage>. doi: <pub-id pub-id-type="doi">10.1088/0954-898X_11_1_302</pub-id></citation></ref>
<ref id="ref47"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Kurkov&#x00E1;</surname> <given-names>V.</given-names></name></person-group> (<year>2003</year>). &#x201C;<article-title>Universal approximators</article-title>&#x201D; in <source>The handbook of brain theory and neural networks</source>. ed. <person-group person-group-type="editor"><name><surname>Arbib</surname> <given-names>M. A.</given-names></name></person-group>. <edition>2nd</edition> ed (<publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT Press</publisher-name>), <fpage>1180</fpage>&#x2013;<lpage>1183</lpage>.</citation></ref>
<ref id="ref48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kursun</surname> <given-names>O.</given-names></name> <name><surname>Alpaydin</surname> <given-names>E.</given-names></name> <name><surname>Favorov</surname> <given-names>O. V.</given-names></name></person-group> (<year>2011</year>). <article-title>Canonical correlation analysis using within-class coupling</article-title>. <source>Pattern Recogn. Lett.</source> <volume>32</volume>, <fpage>134</fpage>&#x2013;<lpage>144</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.patrec.2010.09.025</pub-id></citation></ref>
<ref id="ref49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kursun</surname> <given-names>O.</given-names></name> <name><surname>Favorov</surname> <given-names>O. V.</given-names></name></person-group> (<year>2010</year>). <article-title>Feature selection and extraction using an unsupervised biologically-suggested approximation to Gebelein&#x2019;s maximal correlation</article-title>. <source>Int. J. Pattern Recognit. Artif. Intell.</source> <volume>24</volume>, <fpage>337</fpage>&#x2013;<lpage>358</lpage>. doi: <pub-id pub-id-type="doi">10.1142/S0218001410008007</pub-id></citation></ref>
<ref id="ref50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kursun</surname> <given-names>O.</given-names></name> <name><surname>Patooghy</surname> <given-names>A.</given-names></name> <name><surname>Poursani</surname> <given-names>P.</given-names></name> <name><surname>Favorov</surname> <given-names>O. V.</given-names></name></person-group> (<year>2024</year>). <article-title>CG-CNN: self-supervised feature extraction through contextual guidance and transfer learning</article-title>. <source>IEEE Access</source> <volume>12</volume>, <fpage>155851</fpage>&#x2013;<lpage>155866</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ACCESS.2024.3484663</pub-id></citation></ref>
<ref id="ref51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kyriazi</surname> <given-names>H.</given-names></name> <name><surname>Carvell</surname> <given-names>G. E.</given-names></name> <name><surname>Brumberg</surname> <given-names>J. C.</given-names></name> <name><surname>Simons</surname> <given-names>D. J.</given-names></name></person-group> (<year>1996</year>). <article-title>Quantitative effects of GABA and bicuculline methiodide on receptive field properties of neurons in real and simulated whisker barrels</article-title>. <source>J. Neurophysiol.</source> <volume>75</volume>, <fpage>547</fpage>&#x2013;<lpage>560</lpage>. doi: <pub-id pub-id-type="doi">10.1152/jn.1996.75.2.547</pub-id>, PMID: <pub-id pub-id-type="pmid">8714634</pub-id></citation></ref>
<ref id="ref52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Larkum</surname> <given-names>M. E.</given-names></name> <name><surname>Waters</surname> <given-names>J.</given-names></name> <name><surname>Sakmann</surname> <given-names>B.</given-names></name> <name><surname>Helmchen</surname> <given-names>F.</given-names></name></person-group> (<year>2007</year>). <article-title>Dendritic spikes in apical dendrites of neocortical layer 2/3 pyramidal neurons</article-title>. <source>J. Neurosci.</source> <volume>27</volume>, <fpage>8999</fpage>&#x2013;<lpage>9008</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.1717-07.2007</pub-id>, PMID: <pub-id pub-id-type="pmid">17715337</pub-id></citation></ref>
<ref id="ref53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Larkum</surname> <given-names>M. E.</given-names></name> <name><surname>Zhu</surname> <given-names>J. J.</given-names></name> <name><surname>Sakmann</surname> <given-names>B.</given-names></name></person-group> (<year>1999</year>). <article-title>A new cellular mechanism for coupling inputs arriving at different cortical layers</article-title>. <source>Nature</source> <volume>398</volume>, <fpage>338</fpage>&#x2013;<lpage>341</lpage>. doi: <pub-id pub-id-type="doi">10.1038/18686</pub-id>, PMID: <pub-id pub-id-type="pmid">10192334</pub-id></citation></ref>
<ref id="ref54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>T. Y.</given-names></name> <name><surname>Maire</surname> <given-names>M.</given-names></name> <name><surname>Belongie</surname> <given-names>S.</given-names></name> <name><surname>Bourdev</surname> <given-names>L.</given-names></name> <name><surname>Girshick</surname> <given-names>R.</given-names></name> <name><surname>Hays</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Microsoft COCO: common objects in context</article-title>. <source>arXiv</source>:<fpage>1405.0312v3</fpage>. doi: <pub-id pub-id-type="doi">10.48550/arXiv.1405.0312</pub-id></citation></ref>
<ref id="ref55"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Lowe</surname> <given-names>D.</given-names></name></person-group> (<year>2003</year>). &#x201C;<article-title>Radial basis function networks</article-title>&#x201D; in <source>The handbook of brain theory and neural networks</source>. ed. <person-group person-group-type="editor"><name><surname>Arbib</surname> <given-names>M. A.</given-names></name></person-group>. <edition>2nd</edition> ed (<publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT Press</publisher-name>), <fpage>937</fpage>&#x2013;<lpage>940</lpage>.</citation></ref>
<ref id="ref56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lubke</surname> <given-names>J.</given-names></name> <name><surname>Roth</surname> <given-names>A.</given-names></name> <name><surname>Feldmeyer</surname> <given-names>D.</given-names></name> <name><surname>Sakmann</surname> <given-names>B.</given-names></name></person-group> (<year>2003</year>). <article-title>Morphometric analysis of the columnar innervation domain of neurons connecting layer 4 and layer 2/3 of juvenile rat barrel cortex</article-title>. <source>Cereb. Cortex</source> <volume>13</volume>, <fpage>1051</fpage>&#x2013;<lpage>1063</lpage>. doi: <pub-id pub-id-type="doi">10.1093/cercor/13.10.1051</pub-id>, PMID: <pub-id pub-id-type="pmid">12967922</pub-id></citation></ref>
<ref id="ref57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lund</surname> <given-names>J. S.</given-names></name> <name><surname>Yoshioka</surname> <given-names>T.</given-names></name> <name><surname>Levitt</surname> <given-names>J. B.</given-names></name></person-group> (<year>1993</year>). <article-title>Comparison of intrinsic connectivity in different areas of macaque monkey cerebral cortex</article-title>. <source>Cereb. Cortex</source> <volume>3</volume>, <fpage>148</fpage>&#x2013;<lpage>162</lpage>. doi: <pub-id pub-id-type="doi">10.1093/cercor/3.2.148</pub-id>, PMID: <pub-id pub-id-type="pmid">8490320</pub-id></citation></ref>
<ref id="ref58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Markram</surname> <given-names>H.</given-names></name> <name><surname>Muller</surname> <given-names>E.</given-names></name> <name><surname>Ramaswamy</surname> <given-names>S.</given-names></name> <name><surname>Reimann</surname> <given-names>M. W.</given-names></name> <name><surname>Abdellah</surname> <given-names>M.</given-names></name> <name><surname>Sanchez</surname> <given-names>C. A.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Reconstruction and simulation of neocortical microcircuitry</article-title>. <source>Cell</source> <volume>163</volume>, <fpage>456</fpage>&#x2013;<lpage>492</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2015.09.029</pub-id>, PMID: <pub-id pub-id-type="pmid">26451489</pub-id></citation></ref>
<ref id="ref59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Marvan</surname> <given-names>T.</given-names></name> <name><surname>Phillips</surname> <given-names>W. A.</given-names></name></person-group> (<year>2024</year>). <article-title>Cellular mechanisms of cooperative context-sensitive predictive inference</article-title>. <source>Curr. Res. Neurobiol.</source> <volume>6</volume>:<fpage>100129</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.crneur.2024.100129</pub-id>, PMID: <pub-id pub-id-type="pmid">38665363</pub-id></citation></ref>
<ref id="ref60"><citation citation-type="other"><person-group person-group-type="author"><collab id="coll1">MATLAB</collab></person-group> (<year>2023</year>) <source>Version R2023a. The MathWorks, Inc</source>. Available online at: <ext-link xlink:href="https://www.mathworks.com/" ext-link-type="uri">https://www.mathworks.com/</ext-link> (Accessed September 16, 2025).</citation></ref>
<ref id="ref61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meyer</surname> <given-names>H. S.</given-names></name> <name><surname>Wimmer</surname> <given-names>V. C.</given-names></name> <name><surname>Oberlaender</surname> <given-names>M.</given-names></name> <name><surname>de Kock</surname> <given-names>C. P. J.</given-names></name> <name><surname>Sakmann</surname> <given-names>B.</given-names></name> <name><surname>Helmstaedter</surname> <given-names>M.</given-names></name></person-group> (<year>2010</year>). <article-title>Number and laminar distribution of neurons in a thalamocortical projection column of rat vibrissal cortex</article-title>. <source>Cereb. Cortex</source> <volume>20</volume>, <fpage>2277</fpage>&#x2013;<lpage>2286</lpage>. doi: <pub-id pub-id-type="doi">10.1093/cercor/bhq067</pub-id>, PMID: <pub-id pub-id-type="pmid">20534784</pub-id></citation></ref>
<ref id="ref62"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Mountcastle</surname> <given-names>V. B.</given-names></name></person-group> (<year>1978</year>). &#x201C;<article-title>An organizing principle for cerebral function: the unit module and the distributed system</article-title>&#x201D; in <source>The mindful brain</source>. eds. <person-group person-group-type="editor"><name><surname>Edelman</surname> <given-names>G. M.</given-names></name> <name><surname>Mountcastle</surname> <given-names>V. B.</given-names></name></person-group> (<publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT Press</publisher-name>), <fpage>7</fpage>&#x2013;<lpage>50</lpage>.</citation></ref>
<ref id="ref63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mountcastle</surname> <given-names>V. B.</given-names></name></person-group> (<year>1997</year>). <article-title>The columnar organization of the neocortex</article-title>. <source>Brain</source> <volume>120</volume>, <fpage>701</fpage>&#x2013;<lpage>722</lpage>. doi: <pub-id pub-id-type="doi">10.1093/brain/120.4.701</pub-id>, PMID: <pub-id pub-id-type="pmid">9153131</pub-id></citation></ref>
<ref id="ref64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Park</surname> <given-names>J.</given-names></name> <name><surname>Sandberg</surname> <given-names>I. W.</given-names></name></person-group> (<year>1991</year>). <article-title>Universal approximation using radial-basis-function networks</article-title>. <source>Neural Comput.</source> <volume>3</volume>, <fpage>246</fpage>&#x2013;<lpage>257</lpage>. doi: <pub-id pub-id-type="doi">10.1162/neco.1991.3.2.246</pub-id>, PMID: <pub-id pub-id-type="pmid">31167308</pub-id></citation></ref>
<ref id="ref65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Petreanu</surname> <given-names>L.</given-names></name> <name><surname>Mao</surname> <given-names>T.</given-names></name> <name><surname>Sternson</surname> <given-names>S. M.</given-names></name> <name><surname>Svoboda</surname> <given-names>K.</given-names></name></person-group> (<year>2009</year>). <article-title>The subcellular organization of neocortical excitatory connections</article-title>. <source>Nature</source> <volume>457</volume>, <fpage>1142</fpage>&#x2013;<lpage>1145</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nature07709</pub-id>, PMID: <pub-id pub-id-type="pmid">19151697</pub-id></citation></ref>
<ref id="ref66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Phillips</surname> <given-names>W. A.</given-names></name> <name><surname>Singer</surname> <given-names>W.</given-names></name></person-group> (<year>1997</year>). <article-title>In search of common foundations for cortical computation</article-title>. <source>Behav. Brain Sci.</source> <volume>20</volume>, <fpage>657</fpage>&#x2013;<lpage>683</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S0140525X9700160X</pub-id>, PMID: <pub-id pub-id-type="pmid">10097008</pub-id></citation></ref>
<ref id="ref67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Riesenhuber</surname> <given-names>M.</given-names></name> <name><surname>Poggio</surname> <given-names>T.</given-names></name></person-group> (<year>1999</year>). <article-title>Hierarchical models of object recognition in cortex</article-title>. <source>Nat. Neurosci.</source> <volume>2</volume>, <fpage>1019</fpage>&#x2013;<lpage>1025</lpage>. doi: <pub-id pub-id-type="doi">10.1038/14819</pub-id>, PMID: <pub-id pub-id-type="pmid">10526343</pub-id></citation></ref>
<ref id="ref68"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ringach</surname> <given-names>D. L.</given-names></name> <name><surname>Shapley</surname> <given-names>R. M.</given-names></name> <name><surname>Hawken</surname> <given-names>M. J.</given-names></name></person-group> (<year>2002</year>). <article-title>Orientation selectivity in macaque V1: diversity and laminar dependence</article-title>. <source>J. Neurosci.</source> <volume>22</volume>, <fpage>5639</fpage>&#x2013;<lpage>5651</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.22-13-05639.2002</pub-id>, PMID: <pub-id pub-id-type="pmid">12097515</pub-id></citation></ref>
<ref id="ref69"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Ritter</surname> <given-names>H.</given-names></name></person-group> (<year>2003</year>). &#x201C;<article-title>Self-organizing feature maps</article-title>&#x201D; in <source>The handbook of brain theory and neural networks</source>. ed. <person-group person-group-type="editor"><name><surname>Arbib</surname> <given-names>M. A.</given-names></name></person-group>. <edition>2nd</edition> ed (<publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT Press</publisher-name>), <fpage>1005</fpage>&#x2013;<lpage>1010</lpage>.</citation></ref>
<ref id="ref70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rockland</surname> <given-names>K. S.</given-names></name> <name><surname>Pandya</surname> <given-names>D. N.</given-names></name></person-group> (<year>1979</year>). <article-title>Laminar origins and terminations of cortical connections of the occipital lobe in the rhesus monkey</article-title>. <source>Brain Res.</source> <volume>179</volume>, <fpage>3</fpage>&#x2013;<lpage>20</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0006-8993(79)90485-2</pub-id>, PMID: <pub-id pub-id-type="pmid">116716</pub-id></citation></ref>
<ref id="ref71"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ryder</surname> <given-names>D.</given-names></name></person-group> (<year>2004</year>). <article-title>Sinbad neurosemantics: a theory of mental representation</article-title>. <source>Mind Lang.</source> <volume>19</volume>, <fpage>211</fpage>&#x2013;<lpage>240</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1468-0017.2004.00255.x</pub-id></citation></ref>
<ref id="ref72"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ryder</surname> <given-names>D.</given-names></name> <name><surname>Favorov</surname> <given-names>O. V.</given-names></name></person-group> (<year>2001</year>). <article-title>The new associationism: a neural explanation for the predictive powers of cerebral cortex</article-title>. <source>Brain Mind</source> <volume>2</volume>, <fpage>161</fpage>&#x2013;<lpage>194</lpage>. doi: <pub-id pub-id-type="doi">10.1023/A:1012296506279</pub-id></citation></ref>
<ref id="ref73"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>S&#x00E1;ez</surname> <given-names>I.</given-names></name> <name><surname>Friedlander</surname> <given-names>M. J.</given-names></name></person-group> (<year>2009</year>). <article-title>Plasticity between neuronal pairs in layer 4 of visual cortex varies with synapse state</article-title>. <source>J. Neurosci.</source> <volume>29</volume>, <fpage>15286</fpage>&#x2013;<lpage>15298</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.2980-09.2009</pub-id>, PMID: <pub-id pub-id-type="pmid">19955381</pub-id></citation></ref>
<ref id="ref74"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schiller</surname> <given-names>J.</given-names></name> <name><surname>Schiller</surname> <given-names>Y.</given-names></name> <name><surname>Stuart</surname> <given-names>G.</given-names></name> <name><surname>Sakmann</surname> <given-names>B.</given-names></name></person-group> (<year>1997</year>). <article-title>Calcium action potentials restricted to distal apical dendrites of rat neocortical pyramidal neurons</article-title>. <source>J. Physiol.</source> <volume>505</volume>, <fpage>605</fpage>&#x2013;<lpage>616</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1469-7793.1997.605ba.x</pub-id>, PMID: <pub-id pub-id-type="pmid">9457639</pub-id></citation></ref>
<ref id="ref75"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Sch&#x00F6;lkopf</surname> <given-names>B.</given-names></name> <name><surname>Smola</surname> <given-names>A. J.</given-names></name></person-group> (<year>2002</year>). <source>Learning with kernels</source>. <publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT Press</publisher-name>.</citation></ref>
<ref id="ref76"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schummers</surname> <given-names>J.</given-names></name> <name><surname>Sharma</surname> <given-names>J.</given-names></name> <name><surname>Sur</surname> <given-names>M.</given-names></name></person-group> (<year>2005</year>). <article-title>Bottom-up and top-down dynamics in visual cortex</article-title>. <source>Prog. Brain Res.</source> <volume>149</volume>, <fpage>65</fpage>&#x2013;<lpage>81</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0079-6123(05)49006-8</pub-id>, PMID: <pub-id pub-id-type="pmid">16226577</pub-id></citation></ref>
<ref id="ref77"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Silberberg</surname> <given-names>G.</given-names></name> <name><surname>Markram</surname> <given-names>H.</given-names></name></person-group> (<year>2007</year>). <article-title>Disynaptic inhibition between neocortical pyramidal cells mediated by Martinotti cells</article-title>. <source>Neuron</source> <volume>53</volume>, <fpage>735</fpage>&#x2013;<lpage>746</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neuron.2007.02.012</pub-id>, PMID: <pub-id pub-id-type="pmid">17329212</pub-id></citation></ref>
<ref id="ref78"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singer</surname> <given-names>W.</given-names></name> <name><surname>Lazar</surname> <given-names>A.</given-names></name></person-group> (<year>2016</year>). <article-title>Does the cerebral cortex exploit high-dimensional, non-linear dynamics for information processing?</article-title> <source>Front. Comput. Neurosci.</source> <volume>10</volume>:<fpage>99</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fncom.2016.00099</pub-id>, PMID: <pub-id pub-id-type="pmid">27713697</pub-id></citation></ref>
<ref id="ref79"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Skottun</surname> <given-names>B. C.</given-names></name> <name><surname>DeValois</surname> <given-names>R. L.</given-names></name> <name><surname>Grosof</surname> <given-names>D. H.</given-names></name> <name><surname>Movshon</surname> <given-names>J. A.</given-names></name> <name><surname>Albrecht</surname> <given-names>D. G.</given-names></name> <name><surname>Bonds</surname> <given-names>A. B.</given-names></name></person-group> (<year>1991</year>). <article-title>Classifying simple and complex cells on the basis of response modulation</article-title>. <source>Vis. Res.</source> <volume>31</volume>, <fpage>1079</fpage>&#x2013;<lpage>1086</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0042-6989(91)90033-2</pub-id></citation></ref>
<ref id="ref80"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Somers</surname> <given-names>D. C.</given-names></name> <name><surname>Nelson</surname> <given-names>S. B.</given-names></name> <name><surname>Sur</surname> <given-names>M.</given-names></name></person-group> (<year>1995</year>). <article-title>An emergent model of orientation selectivity in cat visual cortical simple cells</article-title>. <source>J. Neurosci.</source> <volume>15</volume>, <fpage>5448</fpage>&#x2013;<lpage>5465</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.15-08-05448.1995</pub-id>, PMID: <pub-id pub-id-type="pmid">7643194</pub-id></citation></ref>
<ref id="ref81"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stone</surname> <given-names>J. V.</given-names></name></person-group> (<year>1996</year>). <article-title>Learning perceptually salient visual parameters using spatiotemporal smoothness constraints</article-title>. <source>Neural Comput.</source> <volume>8</volume>, <fpage>1463</fpage>&#x2013;<lpage>1492</lpage>. doi: <pub-id pub-id-type="doi">10.1162/neco.1996.8.7.1463</pub-id>, PMID: <pub-id pub-id-type="pmid">8823943</pub-id></citation></ref>
<ref id="ref82"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stuart</surname> <given-names>G. J.</given-names></name> <name><surname>Spruston</surname> <given-names>N.</given-names></name></person-group> (<year>1998</year>). <article-title>Determinants of voltage attenuation in neocortical pyramidal neuron dendrites</article-title>. <source>J. Neurosci.</source> <volume>18</volume>, <fpage>3501</fpage>&#x2013;<lpage>3510</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.18-10-03501.1998</pub-id>, PMID: <pub-id pub-id-type="pmid">9570781</pub-id></citation></ref>
<ref id="ref83"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>Q. Q.</given-names></name> <name><surname>Huguenard</surname> <given-names>J. R.</given-names></name> <name><surname>Prince</surname> <given-names>D. A.</given-names></name></person-group> (<year>2006</year>). <article-title>Barrel cortex microcircuits: thalamocortical feedforward inhibition in spiny stellate cells is mediated by a small number of fast-spiking interneurons</article-title>. <source>J. Neurosci.</source> <volume>26</volume>, <fpage>1219</fpage>&#x2013;<lpage>1230</lpage>. doi: <pub-id pub-id-type="doi">10.1523/JNEUROSCI.4727-04.2006</pub-id>, PMID: <pub-id pub-id-type="pmid">16436609</pub-id></citation></ref>
<ref id="ref84"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Swadlow</surname> <given-names>H. A.</given-names></name></person-group> (<year>2003</year>). <article-title>Fast-spiking interneurons and feedforward inhibition in awake sensory neocortex</article-title>. <source>Cereb. Cortex</source> <volume>13</volume>, <fpage>25</fpage>&#x2013;<lpage>32</lpage>. doi: <pub-id pub-id-type="doi">10.1093/cercor/13.1.25</pub-id></citation></ref>
<ref id="ref85"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tallon-Baudry</surname> <given-names>C.</given-names></name></person-group> (<year>2012</year>). <article-title>On neural mechanisms subserving consciousness and attention</article-title>. <source>Front. Psychol.</source> <volume>2</volume>:<fpage>397</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyg.2011.00397</pub-id></citation></ref>
<ref id="ref86"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tommerdahl</surname> <given-names>M.</given-names></name> <name><surname>Favorov</surname> <given-names>O. V.</given-names></name> <name><surname>Whitsel</surname> <given-names>B. L.</given-names></name></person-group> (<year>2010</year>). <article-title>Dynamic representations of the somatosensory cortex</article-title>. <source>Neurosci. Biobehav. Rev.</source> <volume>34</volume>, <fpage>160</fpage>&#x2013;<lpage>170</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neubiorev.2009.08.009</pub-id>, PMID: <pub-id pub-id-type="pmid">19732790</pub-id></citation></ref>
<ref id="ref87"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tommerdahl</surname> <given-names>M.</given-names></name> <name><surname>Favorov</surname> <given-names>O. V.</given-names></name> <name><surname>Whitsel</surname> <given-names>B. L.</given-names></name> <name><surname>Nakhle</surname> <given-names>B.</given-names></name> <name><surname>Gonchar</surname> <given-names>Y. A.</given-names></name></person-group> (<year>1993</year>). <article-title>Minicolumnar activation patterns in cat and monkey SI cortex</article-title>. <source>Cereb. Cortex</source> <volume>3</volume>, <fpage>399</fpage>&#x2013;<lpage>411</lpage>. doi: <pub-id pub-id-type="doi">10.1093/cercor/3.5.399</pub-id>, PMID: <pub-id pub-id-type="pmid">8260808</pub-id></citation></ref>
<ref id="ref88"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Turrigiano</surname> <given-names>G. G.</given-names></name> <name><surname>Leslie</surname> <given-names>K. R.</given-names></name> <name><surname>Desai</surname> <given-names>N. S.</given-names></name> <name><surname>Rutherford</surname> <given-names>L. C.</given-names></name> <name><surname>Nelson</surname> <given-names>S. B.</given-names></name></person-group> (<year>1998</year>). <article-title>Activity-dependent scaling of quantal amplitude in neocortical neurons</article-title>. <source>Nature</source> <volume>391</volume>, <fpage>892</fpage>&#x2013;<lpage>896</lpage>. doi: <pub-id pub-id-type="doi">10.1038/36103</pub-id>, PMID: <pub-id pub-id-type="pmid">9495341</pub-id></citation></ref>
<ref id="ref89"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Uhlhaas</surname> <given-names>P. J.</given-names></name> <name><surname>Pipa</surname> <given-names>G.</given-names></name> <name><surname>Lima</surname> <given-names>B.</given-names></name> <name><surname>Melloni</surname> <given-names>L.</given-names></name> <name><surname>Neuenschwander</surname> <given-names>S.</given-names></name> <name><surname>Nikolic</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>Neural synchrony in cortical networks: history, concept and current status</article-title>. <source>Front. Integr. Neurosci.</source> <volume>3</volume>:<fpage>17</fpage>. doi: <pub-id pub-id-type="doi">10.3389/neuro.07.017.2009</pub-id></citation></ref>
<ref id="ref90"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vinje</surname> <given-names>W. E.</given-names></name> <name><surname>Gallant</surname> <given-names>J. L.</given-names></name></person-group> (<year>2000</year>). <article-title>Sparse coding and decorrelation in primary visual cortex during natural vision</article-title>. <source>Science</source> <volume>287</volume>, <fpage>1273</fpage>&#x2013;<lpage>1276</lpage>. doi: <pub-id pub-id-type="doi">10.1126/science.287.5456.1273</pub-id>, PMID: <pub-id pub-id-type="pmid">10678835</pub-id></citation></ref>
<ref id="ref91"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Watanabe</surname> <given-names>S.</given-names></name></person-group> (<year>1960</year>). <article-title>Information theoretical analysis of multivariate correlation</article-title>. <source>IBM J. Res. Dev.</source> <volume>4</volume>, <fpage>66</fpage>&#x2013;<lpage>82</lpage>. doi: <pub-id pub-id-type="doi">10.1147/rd.41.0066</pub-id></citation></ref>
</ref-list>
</back>
</article>