<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="other" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.15020.1</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Opinion Article</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Lost in translation</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 1; peer review: 2 approved]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Nachev</surname>
                        <given-names>Parashkev</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-2718-4423</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Rees</surname>
                        <given-names>Geraint</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                    <xref ref-type="aff" rid="a2">2</xref>
                    <xref ref-type="aff" rid="a3">3</xref>
                    <xref ref-type="aff" rid="a4">4</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Frackowiak</surname>
                        <given-names>Richard</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Institute of Neurology, University College London, London, WC1N 3BG, UK</aff>
                <aff id="a2">
                    <label>2</label>Institute of Cognitive Neuroscience, University College London, London, WC1N 3AR, UK</aff>
                <aff id="a3">
                    <label>3</label>Faculty of Life Sciences, University College London, London, WC1E 6BT, UK</aff>
                <aff id="a4">
                    <label>4</label>Wellcome Trust Centre for Neuroimaging, University College London, London, WC1N 3BG, UK</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:p.nachev@ucl.ac.uk">p.nachev@ucl.ac.uk</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>21</day>
                <month>5</month>
                <year>2018</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2018</year>
            </pub-date>
            <volume>7</volume>
            <elocation-id>620</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>17</day>
                    <month>5</month>
                    <year>2018</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2018 Nachev P et al.</copyright-statement>
                <copyright-year>2018</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/7-620/pdf"/>
            <abstract>
                <p>Translation in cognitive neuroscience remains beyond the horizon, brought no closer by supposed major advances in our understanding of the brain. Unless our explanatory models descend to the individual level&#x2014;a cardinal requirement for any intervention&#x2014;their real-world applications will always be limited. Drawing on an analysis of the informational properties of the brain, here we argue that adequate individualisation needs models of far greater dimensionality than has been usual in the field. This necessity arises from the widely distributed causality of neural systems, a consequence of the fundamentally adaptive nature of their developmental and physiological mechanisms. We discuss how recent advances in high-performance computing, combined with collections of large-scale data, enable the high-dimensional modelling we argue is critical to successful translation, and urge its adoption if the ultimate goal of impact on the lives of patients is to be achieved.</p>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>Translation</kwd>
                <kwd>high-dimensional inference</kwd>
                <kwd>causality</kwd>
                <kwd>neuroimaging</kwd>
                <kwd>cognitive neuroscience</kwd>
                <kwd>machine learning.</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1" xlink:href="http://dx.doi.org/10.13039/501100000276">
                    <funding-source>Department of Health</funding-source>
                    <award-id>HICF-R9-501</award-id>
                </award-group>
                <award-group id="fund-2" xlink:href="http://dx.doi.org/10.13039/100004440">
                    <funding-source>Wellcome Trust</funding-source>
                    <award-id>103709</award-id>
                </award-group>
                <award-group id="fund-3">
                    <funding-source>UCLH NIHR Biomedical Research Centre</funding-source>
                </award-group>
                <funding-statement>PN is funded by a Health Innovation Challenge Fund award (HICF-R9-501, WT-103709) and the UCLH NIHR Biomedical Research Centre. </funding-statement>
                <funding-statement>
                    <italic>The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</italic>
                </funding-statement>
            </funding-group>
        </article-meta>
    </front>
    <body>
        <sec>
            <title>The question</title>
            <p>Cognitive neuroscience is yet to produce applications of major clinical impact. If its relative immaturity is to blame, we need merely wait. But if its approach is fundamentally ill-suited, we could be left waiting forever. We must therefore consider how well the means of cognitive neuroscience support translational ends. Such consideration cannot be expected to emerge spontaneously from the field itself, for neuroscience evolves under the selective pressure of supposed understanding, not the collateral of mechanistic insight translation is widely perceived to be. Nor may we presume the obstacles to translation to be peculiar to each cognitive subfield and unlikely to be illuminated by a general analysis: it is possible they lie within the proximal, cardinal steps common to all of neuroscience. Here we examine this possibility, show it to be overwhelmingly likely, and outline how neuroscience must change if it is to deliver real-world patient impact.</p>
        </sec>
        <sec>
            <title>Translation and individualisation</title>
            <p>Most societies give primacy to the individual person, imposing collective interests only with reluctance. This is especially true of healthcare, where the object of clinical action is archetypally the individual and the group only secondarily. To take a striking example, we could overnight revolutionize population outcomes in acute stroke by intervening with thrombolytic therapy at the kerbside, bypassing delays that hospital transfer for diagnostic computed tomographic scans inevitably introduce (
                <xref ref-type="bibr" rid="ref-32">Wardlaw 
                    <italic toggle="yes">et al</italic>., 1997</xref>). However, no matter how compelling the population statistics, such a manoeuvre is rendered unconscionable by the resultant death or greater disability of the 10% of patients with primary intracerebral haemorrhage (
                <xref ref-type="bibr" rid="ref-22">Qureshi 
                    <italic toggle="yes">et al</italic>., 2009</xref>). Even where the stakes are less sharply polarised, it remains difficult to implement any treatment whose individual benefit is only crudely probabilistic, for all interventions have a cost:  both personal and financial. Moreover, since populations merely summarise effects on individuals, the greater the individual variation, the lesser the population-level impact. Both constitutively and politically, translational success or failure is thus critically dependent on our ability to individualise our interventions.</p>
            <p>How is individuality determined? Consider by way of illustration that most personal part of the body, the face (
                <xref ref-type="fig" rid="f1">Figure 1</xref>). Though one feature may sometimes be uniquely idiosyncratic, to distinguish a face from another generally requires the conjunction of 
                <italic toggle="yes">many</italic> features, even when all redundancy is eliminated. Such irreducibly high intrinsic dimensionality is conveniently captured by the notion of 
                <bold>minimum description length</bold> (
                <xref ref-type="bibr" rid="ref-24">Rissanen, 1978</xref>) &#x2013; intuitively, the most compressed complete description of a system. This quantity sets a hard limit on the minimal complexity of any model that must distinguish one state or instance of a system from another to perform its task. No matter how clever the mathematics, a machine vision model tasked with (say) classifying the sex of a face will always perform badly when  starved of input features because no small subset of features contains the necessary information; conversely, even a relatively unsophisticated model with sufficient capacity will perform well, given enough data (
                <xref ref-type="bibr" rid="ref-21">Parkhi 
                    <italic toggle="yes">et al</italic>., 2015</xref>; 
                <xref ref-type="bibr" rid="ref-26">Schroff 
                    <italic toggle="yes">et al</italic>., 2015</xref>; 
                <xref ref-type="bibr" rid="ref-33">Zhou 
                    <italic toggle="yes">et al</italic>., 2015</xref>). It should come as no surprise that face coding in the primate brain takes a high-dimensional approach, deriving identity by projecting a multiplicity of features onto a compacted representational space (
                <xref ref-type="bibr" rid="ref-4">Chang &amp; Tsao, 2017</xref>). Now our concern is not individuation 
                <italic toggle="yes">simpliciter</italic> but the individuation of causal mechanisms of predictive or prescriptive utility. For this we need a 
                <italic toggle="yes">causally constrained</italic> extension of the concept of minimal description length: what we here term a 
                <bold>minimal causal field</bold>. To see how this is specified requires a brief examination of biological causality.</p>
            <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                <label>Figure 1. </label>
                <caption>
                    <title>Dimensionality and individualisation.</title>
                    <p>The face of the Roman Emperor Hostilian (top left) is poorly described by the canonical face of all Roman Emperors (top right), which is&#x2014;by definition&#x2014;not identical with any of the individual faces from which it is derived. Furthermore, the individuality of a face is better captured by a low-precision, high-dimensional parameterisation (bottom left), than it is by a high-precision, low-dimensional parameterisation such as the inter-pupillary distance (bottom right). The photograph of Hostilian is reproduced with the kind permission of Dr William Storage.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/16353/59d271f1-fa75-45de-ae6e-1dbcd8b58d8f_figure1.gif"/>
            </fig>
        </sec>
        <sec>
            <title>Neural causation</title>
            <p>We have a natural intellectual predisposition to causal models with two cardinal features: economy and seriality (
                <xref ref-type="bibr" rid="ref-11">Hacker, 2007</xref>). This is a consequence partly of reasoning by analogy and partly of practicability. The intelligible, mechanistically pellucid processes we observe in the non-organic world and exploit in the machines we build tend to have few parameters of causal significance, arranged sequentially. It seems natural to apply the same approach to biology, indeed inevitable, for a causal model with (say) a thousand parameters is intellectually intractable. When we insist on identifying 
                <italic toggle="yes">necessary</italic> and 
                <italic toggle="yes">sufficient</italic> links within a more or less serial chain, it is because no other option has been open to us.</p>
            <p>But whereas this notion of causation is adequate for understanding simple, serially organised systems, it does not scale with complexity. In complex systems, where a multiplicity of factors is 
                <italic toggle="yes">jointly</italic> brought to bear on the outcome, each individual factor becomes an insufficient but necessary part of a set of factors that are unnecessary but 
                <italic toggle="yes">s</italic>ufficient for the result: an 
                <bold>INUS condition</bold> (
                <xref ref-type="bibr" rid="ref-17">Mackie, 1974</xref>). To give an adequately explanatory account it is necessary to specify a 
                <bold>causal field</bold> of many such INUS conditional factors that interact in complex ways (see 
                <xref ref-type="fig" rid="f2">Figure 2</xref>).</p>
            <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                <label>Figure 2. </label>
                <caption>
                    <title>Causal fields.</title>
                    <p>Distributed causality is elegantly illustrated by the behaviour of artificial neural networks 
                        <bold>trained</bold> to transform an input into an output by optimising the weights of a stack of fully connected nodes. Here the input-output transformation is causally dependent on the nodes and their connections, for it cannot occur without most of them. But when the network is large, its dependence on any limited subset of nodes will be low. This is not because there is a reserve of unused nodes, but because the causality of the system is constitutionally distributed. Inactivating (in black) a set of nodes (large circles) or their connections (small circles) will thus degrade performance broadly in proportion to their number and not necessarily their identity. Causality thus becomes irreducible to any simple specification of necessity and sufficiency. Instead, each node becomes an insufficient but necessary part of an unnecessary but sufficient set of factors: an INUS condition. An adequate description of the causality of the system as a whole then requires specification of the entire 
                        <italic toggle="yes">causal field</italic> of factors: no subset will do, and no strong ranking need exist between them. If the architecture of real neural networks makes such causality possible&#x2014;and it certainly does&#x2014;we need to be capable of modelling it. But this is more than just a theoretical possibility. It is striking that encouraging distributed causal architectures through dropping nodes or connections during training dramatically improves the performance of artificial neural networks. And, of course, real neural substrates often exhibit remarkable robustness to injury, a phenomenon conventionally construed as &#x201c;reserve&#x201d;, but since no part of the brain lies in wait, inactive, distributed causality is a more plausible explanation.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/16353/59d271f1-fa75-45de-ae6e-1dbcd8b58d8f_figure2.gif"/>
            </fig>
            <p>Do neural systems require such a complexity of causal specification? Consider the far simpler behaviour of artificial neural networks, such as deep-learning architectures in which layers of laterally connected units are hierarchically arranged in an end-to-end error-minimising stack (
                <xref ref-type="bibr" rid="ref-10">Goodfellow 
                    <italic toggle="yes">et al</italic>., 2016</xref>; 
                <xref ref-type="bibr" rid="ref-15">LeCun 
                    <italic toggle="yes">et al</italic>., 2015</xref>). Taking the input-output transformation produced by such a network as its &#x201c;function&#x201d;, we can test the causal contribution of sets of network nodes by examining the functional consequences of deactivating them, essentially performing artificial neural network lesion-deficit mapping (
                <xref ref-type="bibr" rid="ref-1">Adolphs, 2016</xref>; 
                <xref ref-type="bibr" rid="ref-25">Rorden &amp; Karnath, 2004</xref>). When a trained network is subjected to such 
                <bold>drop-out</bold> (
                <xref ref-type="bibr" rid="ref-8">Gal &amp; Ghahramani, 2016</xref>; 
                <xref ref-type="bibr" rid="ref-14">Le Cun 
                    <italic toggle="yes">et al</italic>., 1989</xref>; 
                <xref ref-type="bibr" rid="ref-27">Srivastava 
                    <italic toggle="yes">et al</italic>., 2014</xref>; 
                <xref ref-type="bibr" rid="ref-31">Wan 
                    <italic toggle="yes">et al</italic>., 2013</xref>), the degradation of any output is gradual, and often proportionate with the mass of deactivated nodes but varying with their identity in a complex manner that precludes the identification of a "critical" node, or even a clear ranking of the material contribution of individual nodes. Causality is constitutionally 
                <italic toggle="yes">distributed</italic> in a way any conventional description simply cannot capture; only a causal field specification will do (
                <xref ref-type="bibr" rid="ref-17">Mackie, 1974</xref>).</p>
            <p>The widespread use of drop-out in the deep-learning literature shows causally distributed architectures learn complex input-output transformations better than other systems examined to date (
                <xref ref-type="bibr" rid="ref-10">Goodfellow 
                    <italic toggle="yes">et al</italic>., 2016</xref>). They are also more robust to damage, an important consideration for any biological system. However, there is no need to appeal to plausibility in our argument: to the extent that a node contributes to function it 
                <italic toggle="yes">must</italic> be causally relevant. It is inconceivable that the observed complexity of real neural systems is merely epiphenomenal to a much simpler underlying causal organisation. In any event, since we cannot 
                <italic toggle="yes">assume</italic> the minimal causal field is small, we need to consider how to model it when it is irreducibly large.</p>
        </sec>
        <sec>
            <title>Mapping causal fields</title>
            <p>In seeking to understand the causality of any complex system, we must distinguish between causally relevant and incidental variation. Though rarely acknowledged, the approach to making such a distinction depends critically on a cardinal assumption about a system&#x2019;s structure. If we assume the organisation of a particular brain network is fundamentally the same across people&#x2014;i.e. it is 
                <bold>monomorphous</bold>&#x2014;individual variation may be treated as noise. The population mean will then be the best available guide to the fundamental mechanism and to its expression in individuals. This is an implicit assumption behind the vast majority of studies in cognitive neuroscience where a set of estimates, derived from a small group, are considered to reveal general truths about the brain. But if, at some causally critical level, the neural organisation is 
                <italic toggle="yes">not</italic> the same across people&#x2014;i.e. it is 
                <bold>polymorphous</bold>&#x2014;individual variation cannot be treated as noise and the population mean will be a poor guide, both to mechanism and individual behaviour (see 
                <xref ref-type="fig" rid="f3">Figure 3</xref>). The distinction between monomorphous and polymorphous organisation is crucial because it radically alters the optimal inferential approach. We suggest the common assumption of a monomorphous architecture of the brain is unjustified&#x2014;both empirically and theoretically&#x2014;and must be discarded, for the following reasons.</p>
            <fig fig-type="figure" id="f3" orientation="portrait" position="float">
                <label>Figure 3. </label>
                <caption>
                    <title>Monomorphous vs polymorphous systems.</title>
                    <p>Where the fundamental architecture of a biological system is the same, our best guide will be the simple mean of the population, for each individual will differ from it randomly. Studying such monorphous systems is illustrated by adding random noise to an image of a specific watch mechanism, and then averaging across 45 noisy instances. The underlying architecture is thereby easily revealed. Where the solution in each individual differs locally, illustrated by taking a family of 45 different watch mechanisms of the same brand, the population mean is a very poor guide, for individual variability is no longer noise but the outcome of a plurality of comparably good solutions. We must instead define local regularities of organisation, here done by t stochastic neighbour embedding of the images into a two dimensional latent space, revealing characteristic features of each family of solutions. Given that neural systems are complex, stochastically initiated, and optimised by feedback, polymorphous architectures are likely to dominate, mandating a data-driven, neighbourhood-defining approach to modelling.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/16353/59d271f1-fa75-45de-ae6e-1dbcd8b58d8f_figure3.gif"/>
            </fig>
        </sec>
        <sec>
            <title>The genetic information gap</title>
            <p>A neural architecture can be shared across individuals only as far as it is identically specified by the genome, the environment, and their interaction. The constitutive variability of the environment leaves the genome as the primary driver of inter-individual homology. Genomic information content is information theoretically limited by the number of base pairs and the range of nucleotide options at each locus. If we implausibly (
                <xref ref-type="bibr" rid="ref-23">Rands 
                    <italic toggle="yes">et al</italic>., 2014</xref>) assume every locus is both functional and material to the operations of the brain, so that no section is redundant, we have only ~6 x 10
                <sup>9</sup> bits of information, roughly the content of an old compact disc. Even if all this information is used to specify the minimal causal field of a human brain, leaving none for the rest of the body, we remain unable to meet even the most conservative estimates of the brain&#x2019;s complexity. A commonly offered prenatal estimate, ~10
                <sup>14</sup> bits, derived from the number of synapses in the brain (
                <xref ref-type="bibr" rid="ref-13">Huttenlocher &amp; Dabholkar, 1997</xref>; 
                <xref ref-type="bibr" rid="ref-28">Tang 
                    <italic toggle="yes">et al</italic>., 2001</xref>), implausibly assumes a synapse can only encode one bit at any one time, and that neural connectivity is the only differentiator. This is equivalent to treating a neuron rather like a transistor in a modern computer-processing unit, distinguished from its neighbours only by the role assigned to it. In short, we are not faced with an information gap but more an information chasm. The conclusion is that a great deal of the functional architecture of the brain 
                <italic toggle="yes">cannot</italic> be monomorphous, for the necessary information simply is not there.</p>
        </sec>
        <sec>
            <title>Creating polymorphous architectures</title>
            <p>The brain cannot violate the laws of physics, so how can complexity arise from so relatively impoverished an initial specification? Theoretically the simplest approach is to inject 
                <italic toggle="yes">randomness</italic> (
                <xref ref-type="bibr" rid="ref-19">Matsuoka, 1992</xref>) at the outset of development, allowing a complex order to emerge downstream through 
                <italic toggle="yes">feedback learning</italic>.</p>
            <p>Such stochastic initiation is evident in normal neural development, where as many cells face an orchestrated death, at great structural and energetic cost to the organism, as survive into adulthood (
                <xref ref-type="bibr" rid="ref-16">Lossi &amp; Merighi, 2003</xref>). Seemingly playing a compound game of &#x201c;Russian roulette cum musical chairs&#x201d;, developing neurons are subjected to an environmentally dependent selection process, determined only once development is in play. The process is not fully specified in the genome, or else the redundant neurons would never be born. The biologically dominant prohibition of regeneration in the central nervous system, far from being mysterious, is necessary where the organising information emerges during development, and is therefore stored only in the final product itself.</p>
            <p>Equally, the ubiquity of neural feedback learning is evident in the way recurrence is so densely woven into the neural fabric. One-way brain pathways are an exception, not the rule (
                <xref ref-type="bibr" rid="ref-2">Bressler &amp; Menon, 2010</xref>). It could not be otherwise, for learning&#x2014;here neural learning&#x2014;is the only way an order more complex than the initial genetic specifications could conceivably arise.</p>
            <p>Now a stochastically-initiated, feedback-learning system, with multiple tuneable parameters, will inevitably have many 
                <italic toggle="yes">different</italic> solutions for the 
                <italic toggle="yes">same</italic> target input/output transformation. It is therefore bound to be polymorphous. Crucially, there need be no mechanism for regularising such solutions across individuals to impose a higher, species-level order, for no such order need exist, even if it could be imposed. An organism adapts its structure in response to errors only within its 
                <italic toggle="yes">own</italic> input-output transformations, not those of others; biology does not do federated learning (
                <xref ref-type="bibr" rid="ref-20">McMahan 
                    <italic toggle="yes">et al</italic>., 2016</xref>).</p>
            <p>Though our concern is to define the bounds of biological possibility our models must be able to cover, it is natural to seek empirical evidence of biological plausibility. The only credible evidence can come from a system that has been comprehensively characterised. Since our claim is about under-estimating complexity, we may as well pick a simple one. Consider, the gut of the lobster, or rather the stomatogastric sub-circuit, meticulously studied for decades by Eve Marder. Though absurdly simple anatomically, with only 30 neurons, and physiologically, with only regular peristaltic oscillation, the relation between the two is not only complex, but also polymorphous in precisely the way described. The same functional physiology can be arrived at from different individual neuronal &#x201c;settings&#x201d;, both across time in the same animal and across different animals (
                <xref ref-type="bibr" rid="ref-18">Marder &amp; Bucher, 2007</xref>). We cannot presume that the rules of human functional brain organisation are any simpler.</p>
        </sec>
        <sec>
            <title>Modelling polymorphous systems</title>
            <p>We must confront the functional complexity of neural organisation before us if translation from mechanisms of disease to rational treatments is to be possible. How do we 
                <italic toggle="yes">generate</italic>, 
                <italic toggle="yes">estimate</italic>, and 
                <italic toggle="yes">validate</italic> polymorphous neural models of potentially incomprehensible complexity?</p>
            <sec>
                <title>Model validation</title>
                <p>Let us begin with the last step first: validation. It is conventional to take goodness-of-fit, qualified by some statistical measure, as evidence for the plausibility and utility of a model. But this is of little use where the field of possible models is both vast and sparsely sampled. That our model shows a degree of fit with the data means little if uncountable very different models fit just as well or better. The practice is kin with awarding oneself a gold medal after finishing a race blind to the rest of the field. Nor is limited model comparison acceptable, for differentiating between a handful of models tells us little about the sea of possibilities from which they are drawn.</p>
                <p>Rather, we need to quantify the 
                    <italic toggle="yes">individual</italic> predictive power of a model, across time or across individuals, in relation to the future state of a system, or some outcome measure of interest. Such prediction is naturally framed in standard terms of sensitivity and specificity, derived from a comprehensive spread of data the model has not seen (
                    <xref ref-type="bibr" rid="ref-6">Dwork 
                        <italic toggle="yes">et al</italic>., 2015</xref>; 
                    <xref ref-type="bibr" rid="ref-30">Vapnik, 1998</xref>). A model with perfect predictive power cannot be improved upon, so its competitors may be reasonably dismissed. A model with imperfect predictive power is to be stratified by metrics, leaving as much or as little room for exploring others as its performance dictates.</p>
                <p>Crucially, if a given model is powerfully predictive, none of the constituent features can be treated as noise, no matter how random they may appear when viewed in isolation. This approach does not implicate any individual constituent feature mechanistically, because functionally irrelevant incidentals (data and/or features) may drive prediction, like correlation. But it does imply no component feature leading to a good prediction can be safely ignored.</p>
                <p>Of course, the richer the parameterisation of a model, the more susceptible it is to &#x201c;overfitting&#x201d; - the identification of coincidences of features in a dataset arising by chance with no predictive power beyond it (
                    <xref ref-type="bibr" rid="ref-12">Hawkins, 2004</xref>). But that is no more reason for avoiding such an approach than the possibility of being dazzled is a reason for keeping one&#x2019;s eyes permanently shut. It is in any event a practical, not a theoretical objection, addressable through the use of large-scale, fully inclusive datasets and high performance computing, as we discuss below.</p>
            </sec>
            <sec>
                <title>Model generation and estimation</title>
                <p>To insist on 
                    <italic toggle="yes">intuiting</italic> a hypothesis as the first investigative step imposes a bias towards models couched in familiar concepts within a contemporary sphere of comfort. Where the hypothesis space is too large for our imaginations to traverse confidently, relying on intuition is not principled but hubristic. We need a formal hypothesis generation step, explicitly driven by exploratory analysis of data at sufficient scale and with adequate dimensional richness. The optimal scale and dimensionality will vary unknowably with any specific problem, but since both are likely to be very large, practical feasibility shall generally be the limit (
                    <xref ref-type="bibr" rid="ref-9">Ghahramani, 2015</xref>).</p>
                <p>The manner of model generation constrains subsequent model estimation. If the former requires high dimensionality so will the latter. We cannot assume the underlying causal field to be sparse, or that its components will be linearly separable. In attempting to compress the dimensionality of models&#x2014;explicitly through the use of a feature selection step, or implicitly through the use of sparsity-promoting inferential methods&#x2014;we need to watch the impact on individual predictive power, assessed over a sufficiently diverse sample. Where a smooth decrement in prediction performance is seen with feature reduction, the underlying system is likely to be polymorphous, and aggressive feature selection is likely to be counter-productive. Equally, we cannot reliably rank input features taken in isolation on their marginal contribution to predictability, for this necessarily ignores their interactions (
                    <xref ref-type="bibr" rid="ref-5">Drami&#x0144;ski 
                        <italic toggle="yes">et al</italic>., 2008</xref>).</p>
                <p>In short, models need to be complex enough to be tractable only with the highest capacity inferential architectures, such as the neurally inspired forms that have so rapidly grown to dominate the field of machine learning, notably in vision research. As in that case, this conclusion reveals two crucial problems, namely sensitivity to data scale and interpretability, both widely discussed in the literature (e.g. (
                    <xref ref-type="bibr" rid="ref-3">Bzdok &amp; Yeo, 2017</xref>)). Rather than rehearse the familiar difficulties they present, here we draw attention to a few unexpected possibilities they reveal.</p>
            </sec>
        </sec>
        <sec>
            <title>The blessing of dimensionality</title>
            <p>We have seen that complex, polymorphous systems require irreducibly many variables to achieve individually meaningful predictions. The resultant expansion of the parameter space under-determines models in proportion to the small scale of commonly available data. This familiar 
                <italic toggle="yes">curse</italic> of dimensionality [25] makes good solutions hard to find and even harder to generalize, for the risk of purely accidental fits increases with the number of parameters.</p>
            <p>But we should recognise that dimensionality also carries a blessing. Consider the parameterisations of contrasting dimensionality shown in 
                <xref ref-type="fig" rid="f1">Figure 1</xref>. Such individualisation as our low-dimensional parameterisation may achieve, here the inter-ocular distance, will be strongly dependent on the precision of measurement, for everyone is differentiated along a single dimension. In contrast with a high-dimensional parameterisation, such as a crudely pixelated rendition of the image, the precision of each individual variable is much less important, for the signal is conveyed in the covariance across variables. Crucially, since the structure of the underlying high-dimensional pattern is unlikely to resemble instrumental or other sources of noise, we can achieve 
                <italic toggle="yes">greater</italic> individualisation with 
                <italic toggle="yes">lower</italic> quality data. This is intuitively obvious in our ability to recognize faces from noisy, low-resolution images, robust not only to affine transforms of the data such as contrast, zoom, and skew, but also to fairly complex non-linear distortions.</p>
            <p>The conventional resistance to using routinely acquired data on the grounds of noise and heterogeneity is only justified where the analysis is low dimensional. When measuring (say) total grey matter volume, it matters that one scanner will generate consistently greater estimates compared with another.  But when extracting the high-dimensional variation of grey matter concentration across the brain, such effects will drop out as irrelevant affine shifts that leave the complex, individuating covariance patterns intact.</p>
            <p>Perhaps the most important objection to high-dimensional modelling&#x2014;the scale of the data required&#x2014;is thus addressable through collections for another purpose, obtained outside a research environment. In the domain of structural brain imaging, the obvious source is clinical imaging (
                <xref ref-type="bibr" rid="ref-7">Frackowiak &amp; Markram, 2015</xref>). Since brain imaging is carried out to resolve diagnostic uncertainty towards normality almost as often as away from it, such data need not be restricted to the realm of pathology. Similarly, though smartphones may fall short of the precision of dedicated psychophysical devices, their ubiquity and critical mediating role in life enable the collection of rich, high-dimensional data on a vast scale (
                <xref ref-type="bibr" rid="ref-29">Teki 
                    <italic toggle="yes">et al</italic>., 2016</xref>).</p>
            <p>Of course, the correct balance between data size and data quality is an empirical question, to be settled case-by-case. But we cannot assume the former must be gated by the latter, and discount a high-dimensional approach simply because a conventional psychophysical laboratory cannot scale to thousands of participants. Rather, we must reconsider what we actually need to know, and what human activity may collaterally disclose it.</p>
        </sec>
        <sec>
            <title>Living with opacity</title>
            <p>What use are high-dimensional models if they are too complex to understand? Where outcomes are highly variable, as is the norm in cognitive neurology, prediction is clinically invaluable, not simply because patients are consoled by accurate prognosis but because interventions need to be guided by their individually predicted responses. If a &#x201c;black box&#x201d; predictor is the best guide to a correct choice of treatment actuarially, it would be difficult to justify not following it 
                <italic toggle="yes">merely</italic> because its operations cannot be paraphrased in intelligible prose.</p>
            <p>Moreover, clinical interventions are already primarily driven by &#x201c;black boxes&#x201d; - the contents of our heads are a good example. To give a 
                <italic toggle="yes">reason</italic> for acting is not to specify a cause or to imply an underlying causal model, it is kin with pointing to a latent variable. It is only rarely, where very simple biological systems are concerned, never in the brain, that we have a perspicuous, mechanistic explanatory model available. That a human expert can cite a reason for his actions does not make his decision-making less opaque than that of a synthetic counterpart.</p>
            <p>If a system requires a complex model to describe it, then it 
                <italic toggle="yes">is</italic> complex. Translational science needs to adjust to this emotionally, not hopelessly attempt to change it intellectually. A causal field so intricate it can only be specified as an artificial neural network with a million parameters 
                <italic toggle="yes">is</italic> explanatory, even if its incomprehensibility makes us hesitate to use a word stronger than predictive. We can no more hope to understand the brain shackled to simple, linear models, than a literary critic could hope to understand Shakespeare applying the basic rules of grammar alone.</p>
        </sec>
        <sec sec-type="conclusions">
            <title>Concluding remarks</title>
            <p>Until a decade ago, the foregoing analysis would have been unbearably nihilistic, for we had neither the data nor the computational tools to realise the alternative it urges. The ground is still new and uncertain, yet to be proven capable of supporting the structure we argue it is imperative we begin to erect on it. But if we wish to move beyond discussions of tractability or feasibility into translatable action, we must confront the single most striking fact about the brain - its immense complexity.</p>
            <p>The difficulties are all the greater for being distributed across many intellectual, technological, even political domains, reaching deep into the foundations of the very notion of biological understanding. A cognitive neuroscience recast in the form we propose will have more in common with meteorology than horology. If so, then it will be because the fundamental nature of the brain has compelled it, for what we urge here above all is to let the data, not our own brains, speak first. And if effective prediction supplants defective understanding as a result, those outside the field, whose lives cognitive neuroscience and cognitive neurology seek ultimately to serve, will appreciate the exchange.</p>
        </sec>
        <sec>
            <title>Data availability</title>
            <p>No data is associated with this article.</p>
        </sec>
    </body>
    <back>
        <ref-list>
            <ref id="ref-1">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Adolphs</surname>
                            <given-names>R</given-names>
                        </name>
</person-group>:
                    <article-title>Human Lesion Studies in the 21st Century.</article-title>
                    <source>

                        <italic toggle="yes">Neuron.</italic>
</source>
                    <year>2016</year>;<volume>90</volume>(<issue>6</issue>):<fpage>1151</fpage>&#x2013;<lpage>1153</lpage>.
                    <pub-id pub-id-type="pmid">27311080</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.neuron.2016.05.014</pub-id>
                    <pub-id pub-id-type="pmcid">5656290</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-2">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Bressler</surname>
                            <given-names>SL</given-names>
                        </name>

                        <name name-style="western">
                            <surname> Menon</surname>
                            <given-names>V</given-names>
                        </name>
</person-group>:
                    <article-title>Large-scale brain networks in cognition: emerging methods and principles.</article-title>
                    <source>

                        <italic toggle="yes">Trends Cogn Sci.</italic>
</source>
                    <year>2010</year>;<volume>14</volume>(<issue>6</issue>):<fpage>277</fpage>&#x2013;<lpage>290</lpage>.
                    <pub-id pub-id-type="pmid">20493761</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.tics.2010.04.004</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-3">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Bzdok</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname> Yeo</surname>
                            <given-names>BTT</given-names>
                        </name>
</person-group>:
                    <article-title>Inference in the age of big data: Future perspectives on neuroscience.</article-title>
                    <source>

                        <italic toggle="yes">NeuroImage.</italic>
</source>
                    <year>2017</year>;<volume>155</volume>:<fpage>549</fpage>&#x2013;<lpage>564</lpage>.
                    <pub-id pub-id-type="pmid">28456584</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.neuroimage.2017.04.061</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-4">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Chang</surname>
                            <given-names>L</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Tsao </surname>
                            <given-names>DY</given-names>
                        </name>
</person-group>:
                    <article-title>The Code for Facial Identity in the Primate Brain.</article-title>
                    <source>

                        <italic toggle="yes">Cell.</italic>
</source>
                    <year>2017</year>;<volume>169</volume>(<issue>6</issue>):<fpage>1013</fpage>&#x2013;<lpage>1028.e14</lpage>.
                    <pub-id pub-id-type="pmid">28575666</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.cell.2017.05.011</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-5">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Drami&#x0144;ski</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Rada-Iglesias</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Enroth</surname>
                            <given-names>S</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Monte Carlo feature selection for supervised classification.</article-title>
                    <source>

                        <italic toggle="yes">Bioinformatics.</italic>
</source>
                    <year>2008</year>;<volume>24</volume>(<issue>1</issue>):<fpage>110</fpage>&#x2013;<lpage>117</lpage>.
                    <pub-id pub-id-type="pmid">18048398</pub-id>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/btm486</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-6">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Dwork</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Feldman</surname>
                            <given-names>V</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hardt</surname>
                            <given-names>M</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>STATISTICS. The reusable holdout: Preserving validity in adaptive data analysis.</article-title>
                    <source>

                        <italic toggle="yes">Science.</italic>
</source>
                    <year>2015</year>;<volume>349</volume>(<issue>6248</issue>):<fpage>636</fpage>&#x2013;<lpage>638</lpage>.
                    <pub-id pub-id-type="pmid">26250683</pub-id>
                    <pub-id pub-id-type="doi">10.1126/science.aaa9375</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-7">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Frackowiak</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Markram </surname>
                            <given-names>H</given-names>
                        </name>
</person-group>:
                    <article-title>The future of human cerebral cartography: a novel approach.</article-title>
                    <source>

                        <italic toggle="yes">Philos Trans R Soc Lond B Biol Sci.</italic>
</source>
                    <year>2015</year>;<volume>370</volume>(<issue>1668</issue>): pii: 20140171.
                    <pub-id pub-id-type="pmid">25823868</pub-id>
                    <pub-id pub-id-type="doi">10.1098/rstb.2014.0171</pub-id>
                    <pub-id pub-id-type="pmcid">4387512</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-8">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Gal</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname> Ghahramani</surname>
                            <given-names>Z</given-names>
                        </name>
</person-group>:
                    <article-title>Dropout as a Bayesian Approximation: Representing Model Uncertainty in Deep Learning.</article-title>In
                    <source>

                        <italic toggle="yes">PMLR.</italic>
</source>
                    <year>2016</year>;<fpage>1050</fpage>&#x2013;<lpage>1059</lpage>. [Accessed June 5, 2017].
                    <ext-link ext-link-type="uri" xlink:href="http://proceedings.mlr.press/v48/gal16.html">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-9">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ghahramani</surname>
                            <given-names>Z</given-names>
                        </name>
</person-group>:
                    <article-title>Probabilistic machine learning and artificial intelligence.</article-title>
                    <source>

                        <italic toggle="yes">Nature.</italic>
</source>
                    <year>2015</year>;<volume>521</volume>(<issue>7553</issue>):<fpage>452</fpage>&#x2013;<lpage>459</lpage>.
                    <pub-id pub-id-type="pmid">26017444</pub-id>
                    <pub-id pub-id-type="doi">10.1038/nature14541</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-10">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Goodfellow</surname>
                            <given-names>I</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bengio</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Courville</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>Deep Learning</article-title>. MIT Press,<year>2016</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://mitpress.mit.edu/books/deep-learning">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-11">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Hacker</surname>
                            <given-names>PMS</given-names>
                        </name>
</person-group>:
                    <article-title>Human Nature: The Categorial Framework</article-title>. John Wiley &amp; Sons.<year>2007</year>.
                    <ext-link ext-link-type="uri" xlink:href="http://14.139.206.50:8080/jspui/bitstream/1/2337/1/Hacker,%20P.M.S.%20-%20Human%20Nature%20The%20Categorial%20Framework%20%202007.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-12">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Hawkins</surname>
                            <given-names>DM</given-names>
                        </name>
</person-group>:
                    <article-title>The problem of overfitting.</article-title>
                    <source>

                        <italic toggle="yes">J Chem Inf Comput Sci.</italic>
</source>
                    <year>2004</year>;<volume>44</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>12</lpage>.
                    <pub-id pub-id-type="pmid">14741005</pub-id>
                    <pub-id pub-id-type="doi">10.1021/ci0342472</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-13">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Huttenlocher</surname>
                            <given-names>PR</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Dabholkar</surname>
                            <given-names>AS</given-names>
                        </name>
</person-group>:
                    <article-title>Regional differences in synaptogenesis in human cerebral cortex.</article-title>
                    <source>

                        <italic toggle="yes">J Comp Neurol.</italic>
</source>
                    <year>1997</year>;<volume>387</volume>(<issue>2</issue>):<fpage>167</fpage>&#x2013;<lpage>178</lpage>.
                    <pub-id pub-id-type="pmid">9336221</pub-id>
                    <pub-id pub-id-type="doi">10.1002/(SICI)1096-9861(19971020)387:2&lt;167::AID-CNE1&gt;3.0.CO;2-Z</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-14">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Le Cun</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Denker</surname>
                            <given-names>JS</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Solla</surname>
                            <given-names>SA</given-names>
                        </name>
</person-group>:
                    <article-title>Optimal Brain Damage</article-title>. In
                    <source>

                        <italic toggle="yes">Proceedings of the 2Nd International Conference on Neural Information Processing Systems.</italic>
</source>NIPS&#x2019; 89. (Cambridge, MA USA: MIT Press),<year>1989</year>;<fpage>598</fpage>&#x2013;<lpage>605</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="http://dl.acm.org/citation.cfm?id=2969830.2969903">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-15">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>LeCun</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bengio</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hinton</surname>
                            <given-names>G</given-names>
                        </name>
</person-group>:
                    <article-title>Deep learning.</article-title>
                    <source>

                        <italic toggle="yes">Nature.</italic>
</source>
                    <year>2015</year>;<volume>521</volume>(<issue>7553</issue>):<fpage>436</fpage>&#x2013;<lpage>444</lpage>.
                    <pub-id pub-id-type="pmid">26017442</pub-id>
                    <pub-id pub-id-type="doi">10.1038/nature14539</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-16">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Lossi</surname>
                            <given-names>L</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Merighi</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>
                        <italic toggle="yes">In vivo</italic> cellular and molecular mechanisms of neuronal apoptosis in the mammalian CNS.</article-title>
                    <source>

                        <italic toggle="yes">Prog Neurobiol.</italic>
</source>
                    <year>2003</year>;<volume>69</volume>(<issue>5</issue>):<fpage>287</fpage>&#x2013;<lpage>312</lpage>.
                    <pub-id pub-id-type="pmid">12787572</pub-id>
                    <pub-id pub-id-type="doi">10.1016/S0301-0082(03)00051-0</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-17">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Mackie</surname>
                            <given-names>JL</given-names>
                        </name>
</person-group>:
                    <article-title>The Cement of the Universe</article-title>. Oxford, Clarendon Press,<year>1974</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://philpapers.org/rec/MACTCO-7">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-18">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Marder</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bucher</surname>
                            <given-names>D</given-names>
                        </name>
</person-group>:
                    <article-title>Understanding circuit dynamics using the stomatogastric nervous system of lobsters and crabs.</article-title>
                    <source>

                        <italic toggle="yes">Annu Rev Physiol.</italic>
</source>
                    <year>2007</year>;<volume>69</volume>:<fpage>291</fpage>&#x2013;<lpage>316</lpage>.
                    <pub-id pub-id-type="pmid">17009928</pub-id>
                    <pub-id pub-id-type="doi">10.1146/annurev.physiol.69.031905.161516</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-19">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Matsuoka</surname>
                            <given-names>K</given-names>
                        </name>
</person-group>:
                    <article-title>Noise injection into inputs in back-propagation learning.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Transactions on Systems, Man, and Cybernetics.</italic>
</source>
                    <year>1992</year>;<volume>22</volume>(<issue>3</issue>):<fpage>436</fpage>&#x2013;<lpage>440</lpage>.
                    <pub-id pub-id-type="doi">10.1109/21.155944</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-20">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>McMahan</surname>
                            <given-names>HB</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Moore</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ramage</surname>
                            <given-names>D</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Communication-Efficient Learning of Deep Networks from Decentralized Data.</article-title>
                    <source>

                        <italic toggle="yes">arXiv: 1602.05629 [cs].</italic>
</source>
                    <year>2016</year>. [Accessed May 13, 2018].
                    <ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/1602.05629">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-21">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Parkhi</surname>
                            <given-names>OM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Vedaldi</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zisserman</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>Deep Face Recognition</article-title>. In
                    <source>

                        <italic toggle="yes">BMVC.</italic>
</source>
                    <year>2015</year>;<fpage>6</fpage>.
                    <pub-id pub-id-type="doi">10.5244/C.29.41</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-22">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Qureshi</surname>
                            <given-names>AI</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mendelow</surname>
                            <given-names>AD</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hanley</surname>
                            <given-names>DF</given-names>
                        </name>
</person-group>:
                    <article-title>Intracerebral haemorrhage.</article-title>
                    <source>

                        <italic toggle="yes">Lancet.</italic>
</source>
                    <year>2009</year>;<volume>373</volume>(<issue>9675</issue>):<fpage>1632</fpage>&#x2013;<lpage>1644</lpage>.
                    <pub-id pub-id-type="pmid">19427958</pub-id>
                    <pub-id pub-id-type="doi">10.1016/S0140-6736(09)60371-8</pub-id>
                    <pub-id pub-id-type="pmcid">3138486</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-23">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rands</surname>
                            <given-names>CM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Meader</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ponting</surname>
                            <given-names>CP</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>8.2% of the Human genome is constrained: variation in rates of turnover across functional element classes in the human lineage.</article-title>
                    <source>

                        <italic toggle="yes">PLoS Genet.</italic>
</source>
                    <year>2014</year>;<volume>10</volume>(<issue>7</issue>):<fpage>e1004525</fpage>.
                    <pub-id pub-id-type="pmid">25057982</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.pgen.1004525</pub-id>
                    <pub-id pub-id-type="pmcid">4109858</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-24">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rissanen</surname>
                            <given-names>J</given-names>
                        </name>
</person-group>:
                    <article-title>Modeling by shortest data description.</article-title>
                    <source>

                        <italic toggle="yes">Automatica.</italic>
</source>
                    <year>1978</year>;<volume>14</volume>(<issue>5</issue>):<fpage>465</fpage>&#x2013;<lpage>471</lpage>.
                    <pub-id pub-id-type="doi">10.1016/0005-1098(78)90005-5</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-25">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rorden</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Karnath</surname>
                            <given-names>HO</given-names>
                        </name>
</person-group>:
                    <article-title>Using human brain lesions to infer function: a relic from a past era in the fMRI age?</article-title>
                    <source>

                        <italic toggle="yes">Nat Rev Neurosci.</italic>
</source>
                    <year>2004</year>;<volume>5</volume>(<issue>10</issue>):<fpage>813</fpage>&#x2013;<lpage>819</lpage>.
                    <pub-id pub-id-type="pmid">15378041</pub-id>
                    <pub-id pub-id-type="doi">10.1038/nrn1521</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-26">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Schroff</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kalenichenko</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Philbin</surname>
                            <given-names>J</given-names>
                        </name>
</person-group>:
                    <article-title>FaceNet: A Unified Embedding for Face Recognition and Clustering</article-title>.<year>2015</year>;<fpage>815</fpage>&#x2013;<lpage>823</lpage>. [Accessed December 7, 2016].
                    <pub-id pub-id-type="doi">10.1109/CVPR.2015.7298682</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-27">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Srivastava</surname>
                            <given-names>N</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hinton</surname>
                            <given-names>G</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Krizhevsky</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Dropout: A Simple Way to Prevent Neural Networks from Overfitting.</article-title>
                    <source>

                        <italic toggle="yes">J Mach Learn Res.</italic>
</source>
                    <year>2014</year>;<volume>15</volume>:<fpage>1929</fpage>&#x2013;<lpage>1958</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="http://jmlr.org/papers/volume15/srivastava14a.old/srivastava14a.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-28">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Tang</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Nyengaard</surname>
                            <given-names>JR</given-names>
                        </name>

                        <name name-style="western">
                            <surname>De Groot</surname>
                            <given-names>DM</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Total regional and global number of synapses in the human brain neocortex.</article-title>
                    <source>

                        <italic toggle="yes">Synapse.</italic>
</source>
                    <year>2001</year>;<volume>41</volume>(<issue>3</issue>):<fpage>258</fpage>&#x2013;<lpage>273</lpage>.
                    <pub-id pub-id-type="pmid">11418939</pub-id>
                    <pub-id pub-id-type="doi">10.1002/syn.1083</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-29">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Teki</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kumar</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Griffiths</surname>
                            <given-names>TD</given-names>
                        </name>
</person-group>:
                    <article-title>Large-Scale Analysis of Auditory Segregation Behavior Crowdsourced via a Smartphone App.</article-title>
                    <source>

                        <italic toggle="yes">PLoS One.</italic>
</source>
                    <year>2016</year>;<volume>11</volume>(<issue>4</issue>):<fpage>e0153916</fpage>.
                    <pub-id pub-id-type="pmid">27096165</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0153916</pub-id>
                    <pub-id pub-id-type="pmcid">4838209</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-30">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Vapnik</surname>
                            <given-names>V</given-names>
                        </name>
</person-group>:
                    <article-title>Statistical learning theory</article-title>. Wiley.<year>1998</year>.
                    <ext-link ext-link-type="uri" xlink:href="http://read.pudn.com/downloads161/ebook/733192/Statistical-Learning-Theory.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-31">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Wan</surname>
                            <given-names>L</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zeiler</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>S</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Regularization of Neural Networks using DropConnect</article-title>.<year>2013</year>;<fpage>1058</fpage>&#x2013;<lpage>1066</lpage>. [Accessed June 5, 2017].
                    <ext-link ext-link-type="uri" xlink:href="http://proceedings.mlr.press/v28/wan13.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-32">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Wardlaw</surname>
                            <given-names>JM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Warlow</surname>
                            <given-names>CP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Counsell</surname>
                            <given-names>C</given-names>
                        </name>
</person-group>:
                    <article-title>Systematic review of evidence on thrombolytic therapy for acute ischaemic stroke.</article-title>
                    <source>

                        <italic toggle="yes">Lancet.</italic>
</source>
                    <year>1997</year>;<volume>350</volume>(<issue>9078</issue>):<fpage>607</fpage>&#x2013;<lpage>614</lpage>.
                    <pub-id pub-id-type="pmid">9288042</pub-id>
                    <pub-id pub-id-type="doi">10.1016/S0140-6736(97)03022-5</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-33">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Cao</surname>
                            <given-names>Z</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Yin</surname>
                            <given-names>Q</given-names>
                        </name>
</person-group>:
                    <article-title>Naive-Deep Face Recognition: Touching the Limit of LFW Benchmark or Not?</article-title>
                    <source>

                        <italic toggle="yes">arXiv: 1501.04690 [cs].</italic>
</source>
                    <year>2015</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/pdf/1501.04690.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report35675">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.16353.r35675</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Wager</surname>
                        <given-names>Tor D.</given-names>
                    </name>
                    <xref ref-type="aff" rid="r35675a1">1</xref>
                    <role>Referee</role>
                </contrib>
                <aff id="r35675a1">
                    <label>1</label>Department of Psychology and Neuroscience, University of Colorado Boulder, Boulder, CO, USA</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>23</day>
                <month>8</month>
                <year>2018</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2018 Wager TD</copyright-statement>
                <copyright-year>2018</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport35675" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.15020.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>In &#x201c;Lost in Translation&#x201d;, Nachev et al. provide a bold and thought-provoking piece on the past and future of cognitive neuroscience. Their thesis is that the classic inferential tools of neuropsychology, which also formed some of the foundational building blocks of cognitive neuroscience, are inadequate to model and understand the complexity of the brain. New paradigms are needed, and Nachev et al. offer a fresh, theoretical argument for why we should embrace new concepts of distributed causality, nonlinearity, and models that move beyond averaging over individuals to better capture inter-individual variation. The implication is that only by embracing such models can cognitive neuroscience, and perhaps neuroimaging in particular, develop models that are accurate enough to predict individual performance and clinical status - in short, to be translationally useful.</p>
            <p> </p>
            <p> Nachev et al.&#x2019;s position has much to recommend it. One anchor point in their argument is that the brain processes that drive (cause) feeling and behavior are distributed across neurons and/or brain systems&#x2014;and, if this is the case, then models and measures with coarse, distributed features (even if noisy) will outperform those with only a few, high-precision features. I resonate with this point. There is substantial evidence that the neural representations underlying multiple forms of cognition, emotion, and action are population codes distributed across large numbers of neurons and (in the case of fMRI) brain regions and systems (e.g., for review, see Kragel et al. 2018
                <sup>
                    <xref ref-type="bibr" rid="rep-ref-35675-1">1</xref>
                </sup>).&#x00a0; In fMRI studies, distributed predictive models that include activity across regions and systems can dramatically outperform those based on even the best single brain regions (for recent reviews see, e.g., Arbabshirani et al. 2017
                <sup>
                    <xref ref-type="bibr" rid="rep-ref-35675-2">2</xref>
                </sup>; Bzdok &amp; Meyer-Lindenberg 2017
                <sup>
                    <xref ref-type="bibr" rid="rep-ref-35675-3">3</xref>
                </sup>; Woo et al. 2017
                <sup>
                    <xref ref-type="bibr" rid="rep-ref-35675-4">4</xref>
                </sup>; Kragel et al. 2018, Figure 3 and text). &#x00a0;</p>
            <p> </p>
            <p> 
                <italic>Units of analysis</italic>
            </p>
            <p> </p>
            <p> The essential question when it comes to brain systems is &#x201c;What are the units of analysis&#x201d;? The authors imply that translational failures come from a localisationist approach, and provide a thought-provoking theoretical argument for why the brain - at least with respect to cognition, feeling, and behavior - ought to be treated as a system with broadly distributed causality. I agree in part. Lesioning isolated nodes in a neural network typically does not catastrophically, or selectively, impair performance largely because the single node (or neuron) is not the relevant unit of analysis. But if one were to lesion a 
                <italic>layer</italic>, particularly a layer dedicated to a particular function as in the structured, brain-inspired networks of O&#x2019;Reilly et al. (Aisa et al. 2008
                <sup>
                    <xref ref-type="bibr" rid="rep-ref-35675-5">5</xref>
                </sup>; O&#x2019;Reilly et al. 2017
                <sup>
                    <xref ref-type="bibr" rid="rep-ref-35675-6">6</xref>
                </sup>), the effects on network behavior would be profound. Recent advances in opto- and chemogenetics allow for the targeting and activation/inactivation of distributed sets of neurons that collectively represent particular cognitions and actions (e.g., Ramirez et al. 2013
                <sup>
                    <xref ref-type="bibr" rid="rep-ref-35675-7">7</xref>
                </sup>), with strong effects on behavior. Likewise, when studying ecosystems, the loss of individual organisms selected at random has little effect on the behavior of the system as a whole; but loss of a species can have a profound effect. The species, but not the individual, can be characterized as having necessary and sufficient roles in the system&#x2019;s behavior. Likewise, individual neurons are likely not necessary or sufficient for anything, but neural populations are.&#x00a0;</p>
            <p> </p>
            <p> A related point is Nachev et al.&#x2019;s critique of averaging over individuals, which also hinges on the issue of which units of analysis are averaged over. Nachev et al.&#x2019;s &#x201c;watch&#x201d; example is an interesting case study. They show that averaging over visual images of watch mechanisms does not elucidate the nature of watches or produce anything like any of the individual watches. But the problem is not averaging per se - it is knowing what to average over. Pixels in an image of the watch mechanisms are simply not the right unit of analysis, so averaging over them is meaningless. However, the average watch has 2 gear wheels, 2 hands, and one battery; averaging over or otherwise characterizing the distributions over these properties makes sense.</p>
            <p> </p>
            <p> Perhaps we will discover that brain voxels are not the right features to average over, either (and I suspect that they are not!). Cognitive neuroscience converges with machine learning in that a big part of the endeavor is, and has always been, discovering the units (or features) and level of analysis that confer maximal ability to understand the mind and predict future behavior.&#x00a0;</p>
            <p> </p>
            <p> 
                <italic>Monomorphous and polymorphous</italic>
            </p>
            <p> </p>
            <p> Another interesting contrast that Nachev et al. make is the distinction between monomorphous populations, whose individuals are identical, and polymorphous populations, whose individuals vary. Their central argument is that because human brains are polymorphous, we should not characterize them using averages across individuals; rather, we should focus on more individualized models.&#x00a0;</p>
            <p> </p>
            <p> Clearly, humans are a polymorphous bunch. But does this mean that population-level studies that characterize averages - or, alternatively, develop multivariate predictive models of behavior across individuals - are useless? Really, the brain is both monomorphous and polymorphous, at different levels of analysis. Identifying patterns of commonality does not mean that all variation is noise. If I were trying to describe to a space-faring alien what a car looks like, I would not assume that all cars are identical and the difference between a Tesla and a Toyota is &#x201c;noise&#x201d;. But neither would I assume that every car is completely different, which would preclude any sort of common description at all. The brain is similar in this respect. Virtually all of us have an occipital lobe, which contains a primary visual cortex. We have a primary motor cortex, a hippocampus, an inferior frontal junction, each of which plays consistent roles in behavior across individuals. In my lab&#x2019;s work, we find that systems that track and predict the intensity of evoked pain experience are very similar across individuals - for example, the same brain pattern responds to painful events to some degree in 95% of participants (the 5% might well be largely noise; see Zunhammer et al., N = 603). But this does not mean that individual differences are unimportant! Rather, these baseline commonalities are a launching point for understanding the &#x2018;variations on a theme&#x2019; that make individuals different from one another. &#x00a0;</p>
            <p> 
                <italic>Lost and found</italic>
            </p>
            <p> </p>
            <p> A final reflection: It is true that cognitive neuroscience has not developed many translational applications that are used clinically or commercially (e.g., Woo et al. 2017). But this does not necessarily imply that cognitive neuroscience has failed so far.&#x00a0; We should remember that the goal of cognitive neuroscience has been to understand the physiological representation of thought and behavior - one of the thorniest challenges in all of science, and a basic (not clinical) goal at that. Like many forms of basic science, the hope is that by better understanding how the mind works, without tying it immediately to any commercial venture or practical application, will yield new ways of thinking about the brain and mind, which in turn will inspire future applications that were previously unimagined. In my own lab&#x2019;s work on pain and emotion, I have learned that the gaps between science and commercial application are not just about limitations in the science. Even if current cognitive neuroscience-based models could reliably diagnose mental and brain health conditions in individual people with perfect sensitivity and specificity, there would be gaps related to business development, marketing, public understanding and policy, economic cost/benefit ratios, equal access, insurance reimbursements, and more. I believe that in the past 2-3 years, cognitive and clinical neuroscience has succeeded in developing models of brain function that could be useful for characterizing dementia, depression, pain, autism, and more. Their clinical and commercial success will depend largely on what society wants to do with the science.</p>
            <p> </p>
            <p> This does not, of course, take away from the point that translation is a worthy and useful goal, both from a humanitarian (e.g., Gabrieli et al. 2015
                <sup>
                    <xref ref-type="bibr" rid="rep-ref-35675-8">8</xref>
                </sup>) and scientific perspective. Not only can it advance clinical applications, translation also provides a concrete, objective yardstick against which to evaluate our understanding of the brain. Clearly, we have a great distance to go;&#x00a0;the good news is that we're moving forward.</p>
            <p>Is the topic of the opinion article discussed accurately in the context of the current literature?</p>
            <p>Yes</p>
            <p>Are arguments sufficiently supported by evidence from the published literature?</p>
            <p>Partly</p>
            <p>Are all factual statements correct and adequately supported by citations?</p>
            <p>Partly</p>
            <p>Are the conclusions drawn balanced and justified on the basis of the presented arguments?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>NA</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard.</p>
        </body>
        <back>
            <ref-list>
                <title>References</title>
                <ref id="rep-ref-35675-1">
                    <label>1</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Representation, Pattern Information, and Brain Signatures: From Neurons to Neuroimaging.</article-title>
                        <source>
                            <italic>Neuron</italic>
                        </source>.<year>2018</year>;<volume>99</volume>(<issue>2</issue>) :
                        <elocation-id>10.1016/j.neuron.2018.06.009</elocation-id>
                        <fpage>257</fpage>-<lpage>273</lpage>
                        <pub-id pub-id-type="pmid">30048614</pub-id>
                        <pub-id pub-id-type="doi">10.1016/j.neuron.2018.06.009</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-35675-2">
                    <label>2</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Single subject prediction of brain disorders in neuroimaging: Promises and pitfalls</article-title>.
                        <source>
                            <italic>NeuroImage</italic>
                        </source>.<year>2017</year>;<volume>145</volume>:
                        <elocation-id>10.1016/j.neuroimage.2016.02.079</elocation-id>
                        <fpage>137</fpage>-<lpage>165</lpage>
                        <pub-id pub-id-type="doi">10.1016/j.neuroimage.2016.02.079</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-35675-3">
                    <label>3</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Inference in the age of big data: Future perspectives on neuroscience.</article-title>
                        <source>
                            <italic>Neuroimage</italic>
                        </source>.<year>2017</year>;<volume>155</volume>:
                        <elocation-id>10.1016/j.neuroimage.2017.04.061</elocation-id>
                        <fpage>549</fpage>-<lpage>564</lpage>
                        <pub-id pub-id-type="pmid">28456584</pub-id>
                        <pub-id pub-id-type="doi">10.1016/j.neuroimage.2017.04.061</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-35675-4">
                    <label>4</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Building better biomarkers: brain models in translational neuroimaging.</article-title>
                        <source>
                            <italic>Nat Neurosci</italic>
                        </source>.<year>2017</year>;<volume>20</volume>(<issue>3</issue>) :
                        <elocation-id>10.1038/nn.4478</elocation-id>
                        <fpage>365</fpage>-<lpage>377</lpage>
                        <pub-id pub-id-type="pmid">28230847</pub-id>
                        <pub-id pub-id-type="doi">10.1038/nn.4478</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-35675-5">
                    <label>5</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>The emergent neural modeling system.</article-title>
                        <source>
                            <italic>Neural Netw</italic>
                        </source>.<year>2008</year>;<volume>21</volume>(<issue>8</issue>) :
                        <elocation-id>10.1016/j.neunet.2008.06.016</elocation-id>
                        <fpage>1146</fpage>-<lpage>52</lpage>
                        <pub-id pub-id-type="pmid">18684591</pub-id>
                        <pub-id pub-id-type="doi">10.1016/j.neunet.2008.06.016</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-35675-6">
                    <label>6</label>
                    <mixed-citation>
                        <person-group person-group-type="author"/>:
                        <article-title>Deep Predictive Learning: A Comprehensive Model of Three Visual Streams</article-title>.
                        <source>
                            <italic>arXiv [q-bio.NC]</italic>
                        </source>.<year>2017</year>;</mixed-citation>
                </ref>
                <ref id="rep-ref-35675-7">
                    <label>7</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Creating a false memory in the hippocampus.</article-title>
                        <source>
                            <italic>Science</italic>
                        </source>.<year>2013</year>;<volume>341</volume>(<issue>6144</issue>) :
                        <elocation-id>10.1126/science.1239073</elocation-id>
                        <fpage>387</fpage>-<lpage>91</lpage>
                        <pub-id pub-id-type="pmid">23888038</pub-id>
                        <pub-id pub-id-type="doi">10.1126/science.1239073</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-35675-8">
                    <label>8</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Prediction as a humanitarian and pragmatic contribution from human cognitive neuroscience.</article-title>
                        <source>
                            <italic>Neuron</italic>
                        </source>.<year>2015</year>;<volume>85</volume>(<issue>1</issue>) :
                        <elocation-id>10.1016/j.neuron.2014.10.047</elocation-id>
                        <fpage>11</fpage>-<lpage>26</lpage>
                        <pub-id pub-id-type="pmid">25569345</pub-id>
                        <pub-id pub-id-type="doi">10.1016/j.neuron.2014.10.047</pub-id>
                    </mixed-citation>
                </ref>
            </ref-list>
        </back>
        <sub-article article-type="response" id="comment4325-35675">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Nachev</surname>
                            <given-names>Parashkev</given-names>
                        </name>
                        <aff>UCL, UK</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>27</day>
                    <month>12</month>
                    <year>2018</year>
                </pub-date>
            </front-stub>
            <body>
                <p>We are grateful to Professor Wager for his thoughtful commentary on our paper, and are pleased he finds sympathy with the broad thrust of our argument. Our revision clarifies the points he raises, and we provide a few further thoughts below.</p>
                <p>
                    <italic>Units of analysis</italic>
                </p>
                <p>We agree there is no warrant for presuming a neural system must be intelligible at a neuroscientist's chosen pet scale of analysis. It is essential to explore a wide variety of scales, including those intelligible only through high-dimensional modelling, where&#x2014;as we argue in detail in the paper&#x2014;the critical organisation is mostly likely to be found. But it is also true that no 
                    <italic>single</italic> scale of analysis need be sufficient, for the organisation may be distributed across a 
                    <italic>multiplicity</italic> of them. Indeed, the kind of compact causal structure biology is likely to favour&#x2014;for the information theoretic reasons we give&#x2014;is constitutionally widely distributed. Of course, necessity and sufficiency is easily obtained at a whole brain level of analysis, but such causality is merely permissive rather than properly explanatory of how thought and behaviour really arise. Might there be some isolated "intermediate" level where causality is plain yet the underlying relations are revealed in sufficient detail? We doubt it, but the only way to tell is through the high-dimensional modelling approach we describe in the second half of the paper.</p>
                <p>
                    <italic>Averaging</italic>
                </p>
                <p>It is a criterion both of general explanation&#x2014;to the satisfaction of the scientist&#x2014;and individual prediction&#x2014;to the satisfaction of the clinician&#x2014;that one can generalise from known instances to unknown ones. In both cases a model 
                    <italic>learns</italic> from one set of data (even if it is not called learning in the conventional statistical literature) and extrapolates to another. When we criticise averaging, our target is specifically low-dimensional models whose form is intuitively specified. In a high-dimensional, necessarily data-driven model, averaging occurs too, but across a 
                    <italic>local neighbourhood</italic>, not across an arbitrarily defined group as a whole. And that neighbourhood is determined by the modelling process itself, guided by out-of-sample predictive performance rather than model statistics. The point is illustrated by the clock mechanism example given in Figure 3.</p>
                <p>
                    <italic>Translation</italic>
                </p>
                <p>We are clinicians, and for us the value of thought is measured by its utility in action. Others may, of course, adopt a different perspective. But consider what the ultimate criterion of fidelity must always be. A neuroscientist may claim his beautifully perspicuous theory of the function of some aspect of the brain is explanatory because it fits a model with half a dozen dimensions derived from fifty people. But what do we tell the patients&#x2014;often the majority&#x2014;the model does not fit? That they are 
                    <italic>noise</italic>? This would be an acceptable excuse 
                    <italic>only</italic> if the predictive power of more complex models remains poor, and the unmodelled variance is indeed plausibly noise. Once a model with better&#x2014;and of course generalisable&#x2014;predictive power is found, the claim is fatally undermined, for what was previously discarded as noise is now explained. That the resultant explanation might be complex need not be to its detriment: generalisable individual predictive performance always trumps perspicuity. The primary concern of the clinician ought to be the scientist's too.</p>
            </body>
        </sub-article>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report34258">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.16353.r34258</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Thiebaut de Schotten</surname>
                        <given-names>Michel</given-names>
                    </name>
                    <xref ref-type="aff" rid="r34258a1">1</xref>
                    <xref ref-type="aff" rid="r34258a2">2</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-0329-1814</uri>
                </contrib>
                <aff id="r34258a1">
                    <label>1</label>INSERM (French Institute of Health and Medical Research) U 1127, CNRS (French National Center for Scientific Research), UMR 7225, ICM Institute for Brain and Spinal Cord, Piti&#x00e9;-Salp&#x00ea;tri&#x00e8;re Hospital, Sorbonne University, Paris, France</aff>
                <aff id="r34258a2">
                    <label>2</label>BCBlab, Sorbonne University, Paris, France</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>19</day>
                <month>6</month>
                <year>2018</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2018 Thiebaut de Schotten M</copyright-statement>
                <copyright-year>2018</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport34258" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.15020.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>In their excellent and timely contribution Nachev, Rees and Frackowiak tackle current limitation in the models used to understand the brain functioning and the translation of this knowledge to the clinical practice. The text is engaging, and the message is clear. The authors did not limit their focus on the current problems but also provide clear new solutions and recommendations for future generations.&#x00a0;</p>
            <p> </p>
            <p> May I suggest the part on Dimensionality and individualisation to be linked up to a recent editorial entitled 'is a *single* brain model sufficient' (Thiebaut de Schotten and Shallice Cortex 2017)
                <sup>
                    <xref ref-type="bibr" rid="rep-ref-34258-1">1</xref>
                </sup>. I think this is appropriate but I leave it as optional for the authors.&#x00a0;</p>
            <p> </p>
            <p> Again, thank you for this elegant contribution soon to become a classic in the field.</p>
            <p>Is the topic of the opinion article discussed accurately in the context of the current literature?</p>
            <p>Yes</p>
            <p>Are arguments sufficiently supported by evidence from the published literature?</p>
            <p>Yes</p>
            <p>Are all factual statements correct and adequately supported by citations?</p>
            <p>Yes</p>
            <p>Are the conclusions drawn balanced and justified on the basis of the presented arguments?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>NA</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard.</p>
        </body>
        <back>
            <ref-list>
                <title>References</title>
                <ref id="rep-ref-34258-1">
                    <label>1</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Identical, similar or different? Is a single brain model sufficient?</article-title>.
                        <source>
                            <italic>Cortex</italic>
                        </source>.<year>2017</year>;<volume>86</volume>:
                        <elocation-id>10.1016/j.cortex.2016.12.002</elocation-id>
                        <fpage>172</fpage>-<lpage>175</lpage>
                        <pub-id pub-id-type="pmid">28041614</pub-id>
                        <pub-id pub-id-type="doi">10.1016/j.cortex.2016.12.002</pub-id>
                    </mixed-citation>
                </ref>
            </ref-list>
        </back>
        <sub-article article-type="response" id="comment4326-34258">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Nachev</surname>
                            <given-names>Parashkev</given-names>
                        </name>
                        <aff>UCL, UK</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>27</day>
                    <month>12</month>
                    <year>2018</year>
                </pub-date>
            </front-stub>
            <body>
                <p>We thank Professor Thiebaut de Schotten for his appreciative comments, and for the reference now cited in the revised version.</p>
            </body>
        </sub-article>
    </sub-article>
</article>
