﻿<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1 20151215//EN" "JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="systematic-review">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">Explor Neuroprot Ther</journal-id>
<journal-id journal-id-type="publisher-id">ENT</journal-id>
<journal-title-group>
<journal-title>Exploration of Neuroprotective Therapy</journal-title>
</journal-title-group>
<issn pub-type="epub">2769-6510</issn>
<publisher>
<publisher-name>Open Exploration Publishing</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.37349/ent.2026.1004141</article-id>
<article-id pub-id-type="manuscript">1004141</article-id>
<article-categories>
<subj-group>
<subject>Systematic Review</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Machine learning or morphometric scaling? A systematic review of methodological confounds and the generalizability of sex classification in neuroimaging</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-2384-8771</contrib-id>
<name>
<surname>Sapuan</surname>
<given-names>Abdul Halim</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing—original draft</role>
<xref ref-type="aff" rid="I1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0009-0002-8600-1102</contrib-id>
<name>
<surname>Jamaludin</surname>
<given-names>Iqbal</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0009-0001-7344-6308</contrib-id>
<name>
<surname>Abdul Majid</surname>
<given-names>Zafri Azran</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-1397-8174</contrib-id>
<name>
<surname>Mohd Tamrin</surname>
<given-names>Mohd Izzuddin</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-5496-0822</contrib-id>
<name>
<surname>Che Azemin</surname>
<given-names>Mohd Zulfaezal</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="cor1">
<sup>*</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-6661-8469</contrib-id>
<name>
<surname>Turaev</surname>
<given-names>Sherzod</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role content-type="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<xref ref-type="aff" rid="I4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="editor">
<name>
<surname>Mozley</surname>
<given-names>P. David</given-names>
</name>
<role>Academic Editor</role>
<aff>Cornell University Weill School of Medicine, USA</aff>
</contrib>
</contrib-group>
<aff id="I1">
<sup>1</sup>Department of Diagnostic Imaging and Radiotherapy, Kulliyyah of Allied Health Sciences, International Islamic University Malaysia, Kampus Kuantan, Kuantan 25200, Pahang Darul Makmur, Malaysia</aff>
<aff id="I2">
<sup>2</sup>Department of Information Systems, Kulliyyah of Information and Communication Technology, International Islamic University Malaysia, Gombak 53100, Selangor Darul Ehsan, Malaysia</aff>
<aff id="I3">
<sup>3</sup>Department of Optometry and Visual Sciences, Kulliyyah of Allied Health Sciences, International Islamic University Malaysia, Kampus Kuantan, Kuantan 25200, Pahang Darul Makmur, Malaysia</aff>
<aff id="I4">
<sup>4</sup>Department of Computer Science and Software Engineering, College of Information Technology, United Arab Emirates University, P.O. Box 15551, Al Ain, Abu Dhabi, United Arab Emirates</aff>
<author-notes>
<corresp id="cor1">
<bold>
<sup>*</sup>Correspondence:</bold> Mohd Zulfaezal Che Azemin, Department of Optometry and Visual Sciences, Kulliyyah of Allied Health Sciences, International Islamic University Malaysia, Kampus Kuantan, Jalan Sultan Ahmad Shah, Kuantan 25200, Pahang Darul Makmur, Malaysia. <email>zulfaezal@iium.edu.my</email></corresp>
</author-notes>
<pub-date pub-type="collection">
<year>2026</year>
</pub-date>
<pub-date pub-type="epub">
<day>23</day>
<month>03</month>
<year>2026</year>
</pub-date>
<volume>6</volume>
<elocation-id>1004141</elocation-id>
<history>
<date date-type="received">
<day>05</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>05</day>
<month>03</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>© The Author(s) 2026.</copyright-statement>
<license xlink:href="https://creativecommons.org/licenses/by/4.0/">
<license-p>This is an Open Access article licensed under a Creative Commons Attribution 4.0 International License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, sharing, adaptation, distribution and reproduction in any medium or format, for any purpose, even commercially, as long as you give appropriate credit to the original author(s) and the source, provide a link to the Creative Commons license, and indicate if changes were made.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background:</title>
<p id="absp-1">This systematic review critically evaluates whether machine learning (ML) identifies biologically meaningful sex-related brain architecture or merely exploits methodological artifacts and allometric scaling. While ML models achieve high classification accuracies, it remains unclear if these reflect stable, mechanistically informative dimorphism or are driven by confounds such as total intracranial volume (TIV) and site-specific noise. We examine how imaging modalities, algorithms, and population strata influence both classification outcomes and biological interpretability.</p>
</sec>
<sec>
<title>Methods:</title>
<p id="absp-2">Following Preferred Reporting Items for Systematic Reviews and Meta-Analyses (PRISMA) guidelines, we searched Web of Science, PubMed, and Scopus through January 2024. Included studies [healthy humans, 3T magnetic resonance imaging (MRI), ML-based sex classification] were assessed for risk of bias, focusing on data leakage, validation strategies, and confound management.</p>
</sec>
<sec>
<title>Results:</title>
<p id="absp-3">Thirty-five studies (<italic>n</italic> &gt; 110,000) were included. While reported accuracies reached 98.06% for T1-weighted MRI, 96.0% for diffusion MRI (dMRI), and 94.72% for functional MRI (fMRI), performance was highly dependent on population characterization and age. Deep learning consistently outperformed traditional ML (TML) but showed high sensitivity to methodological artifacts. Notably, studies failing to correct for TIV reported potentially inflated accuracies, suggesting that many models identify physical scale rather than intrinsic neuroanatomical dimorphism.</p>
</sec>
<sec>
<title>Discussion:</title>
<p id="absp-4">High classification accuracies are often bolstered by methodological confounds and a lack of cross-site validation. There is a significant discrepancy between ML-driven predictive power and biological inference validity. Current pipelines do not yet allow for robust, generalizable inference about brain sex. To move beyond statistical separation toward mechanistic understanding, the field must prioritize TIV-corrected benchmarks and diverse non-WEIRD (Western, Educated, Industrialized, Rich, Democratic) datasets. We conclude that while ML is a powerful pattern detector, its results must be interpreted with caution regarding biological dimorphism.</p>
</sec>
</abstract>
<kwd-group>
<kwd>sex classification</kwd>
<kwd>brain MRI</kwd>
<kwd>machine learning</kwd>
<kwd>deep learning</kwd>
<kwd>neuroimaging</kwd>
<kwd>grey matter</kwd>
<kwd>functional connectivity</kwd>
<kwd>diffusion imaging</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p id="p-1">Magnetic resonance imaging (MRI) has transformed in vivo brain research by offering high-resolution insights into neuroanatomy and function. Its ability to delineate intricate tissue structures has made it indispensable in studying sex-based variations in brain morphology. Early reports highlighted anatomical differences such as greater brain weight and circumference in males [<xref ref-type="bibr" rid="B1">1</xref>]. Subsequent research using statistical morphometry identified sex differences in grey matter, although with varying magnitudes and conflicting biological interpretations [<xref ref-type="bibr" rid="B2">2</xref>–<xref ref-type="bibr" rid="B5">5</xref>]. For example, male brains are typically 8–12% larger than female brains—a difference that emerges early and persists across the lifespan [<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B7">7</xref>].</p>
<p id="p-2">Recent advances in machine learning (ML) have enabled multivariate modeling of complex neuroimaging data, frequently demonstrating classification accuracies exceeding 90% [<xref ref-type="bibr" rid="B8">8</xref>, <xref ref-type="bibr" rid="B9">9</xref>]. Compared to conventional statistics, ML models can identify subtle, distributed neuroanatomical patterns undetectable by univariate approaches. However, a critical gap remains between predictive performance and inferential validity. While ML is a powerful pattern detector, it is often unclear whether these high accuracies reflect stable, mechanistically informative dimorphism or are driven by proxies such as global size (allometric scaling) and demographic structure. If the predictive signal is largely a product of uncorrected total intracranial volume (TIV) or site-specific artifacts, then current models are constrained in what they can legitimately claim about sex-related differences in brain architecture.</p>
<p id="p-3">In this review, “sex” refers strictly to biological attributes—such as chromosomal, hormonal, and anatomical characteristics assigned at birth—and does not encompass gender identity or sociocultural constructs. Our goal is to systematically evaluate whether ML-based neuroimaging pipelines currently allow for confound-controlled, cross-site generalizable inference about sex, or if they merely enable statistical separation at the population level. By interrogating what these high classification numbers truly mean, we aim to clarify the contribution of ML to our understanding of sex-related neuroanatomical organization, with broader implications for disorders exhibiting sex-specific prevalence or expression [<xref ref-type="bibr" rid="B10">10</xref>–<xref ref-type="bibr" rid="B15">15</xref>].</p>
</sec>
<sec id="s2">
<title>Materials and methods</title>
<sec id="t2-1">
<title>Protocols and registration</title>
<p id="p-4">This systematic review was conducted in accordance with the Preferred Reporting Items for Systematic Reviews and Meta-Analyses (PRISMA) statement. The protocol for this review was not prospectively registered in a systematic review database (e.g., PROSPERO).</p>
</sec>
<sec id="t2-2">
<title>Information sources and search strategy</title>
<p id="p-5">Studies were identified through an electronic search of the Web of Science, PubMed, and Scopus databases conducted on 19th January 2026. These databases were selected for their comprehensive coverage of biomedical and scientific literature, ensuring access to a wide array of relevant research at the intersection of neuroimaging, sex differences, and ML.</p>
<p id="p-6">The search strategy employed keywords and indexed terms including “sex”, “gender”, “dimorphism”, “predict”, “classify”, “disparities”, “difference”, “discriminate”, “distinguish”, “brain”, “magnetic resonance imaging”, “MRI”, “machine learning”, “deep learning”, and “classifier”. These terms were combined using Boolean operators to refine the results. For example, the following string was adapted for each database: (sex OR gender) AND (dimorphism OR predict OR classify OR disparities OR difference OR discriminate OR distinguish) AND (brain) AND (magnetic resonance imaging OR MRI) AND (machine learning OR deep learning).</p>
<p id="p-7">To ensure transparency and reproducibility, the exact Boolean search strings used for each database are provided below:</p>
<sec id="t2-2-1">
<title>Web of Science search string</title>
<p id="p-8">TS = ((“brain” OR “cerebral” OR “neuro” OR “cortex”) AND (“sex differences” OR “gender differences” OR “sexual dimorphism” OR “sex classification”) AND (“artificial intelligence” OR “ai” OR “machine learning” OR “deep learning”) AND (“magnetic resonance imaging” OR “MRI” OR “neuroimaging” OR “brain imaging”)).</p>
</sec>
<sec id="t2-2-2">
<title>PubMed search string</title>
<p id="p-9">(“brain” [tiab] OR “cerebral” [tiab] OR “neuro” [tiab] OR “cortex” [tiab]) AND (“sex differences” [tiab] OR “gender differences” [tiab] OR “sexual dimorphism” [tiab] OR “sex classification” [tiab]) AND (“artificial intelligence” [tiab] OR “ai” [tiab] OR “machine learning” [tiab] OR “deep learning” [tiab]) AND (“magnetic resonance imaging” [tiab] OR “MRI” [tiab] OR “neuroimaging” [tiab] OR “brain imaging” [tiab]).</p>
</sec>
<sec id="t2-2-3">
<title>Scopus search string</title>
<p id="p-10">(TITLE-ABS-KEY (brain OR cerebral OR neuro OR cortex)) AND (TITLE-ABS-KEY (“sex differences” OR “gender differences” OR “sexual dimorphism” OR “sex classification”)) AND (TITLE-ABS-KEY(“artificial intelligence” OR “ai” OR “machine learning” OR “deep learning”)) AND (TITLE-ABS-KEY(“magnetic resonance imaging” OR “MRI” OR “neuroimaging” OR “brain imaging”)).</p>
<p id="p-11">The search encompassed all available literature up to 19 January 2026, with no date restrictions applied. This inclusive approach ensured that both foundational historical studies and recent developments were captured, enhancing the review’s robustness across a broad temporal range. Furthermore, the search date ensures the inclusion of the most recent advancements in the field as of early 2026.</p>
</sec>
</sec>
<sec id="t2-3">
<title>Eligibility criteria</title>
<p id="p-12">To ensure a high level of technical consistency and diagnostic relevance, studies were selected based on the following criteria:</p>
<sec id="t2-3-1">
<title>Inclusion criteria</title>
<p id="p-13">
<list list-type="bullet">
<list-item>
<p>In vivo studies in healthy humans;</p>
</list-item>
<list-item>
<p>Use of 3T MRI;</p>
</list-item>
<list-item>
<p>ML-based sex classification;</p>
</list-item>
<list-item>
<p>Peer-reviewed, full-text English articles.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t2-3-2">
<title>Exclusion criteria</title>
<p id="p-14">
<list list-type="bullet">
<list-item>
<p>Post-mortem studies;</p>
</list-item>
<list-item>
<p>Clinical populations with neurological or psychiatric disorders;</p>
</list-item>
<list-item>
<p>Non-English articles;</p>
</list-item>
<list-item>
<p>Reviews, conference abstracts, and proceedings;</p>
</list-item>
<list-item>
<p>Studies using field strengths other than 3T (e.g., 1.5T or 7T) or those not utilizing ML for classification.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t2-3-3">
<title>Rationale for selection</title>
<p id="p-15">The emphasis on 3T MRI was chosen due to its prevalence in contemporary research, offering superior spatial resolution and signal-to-noise ratio (SNR) compared to lower field strengths. This standardization minimizes variance across scanners and enhances the reliability of the subtle brain measurements required for accurate sex classification.</p>
<p id="p-16">The inclusion of both structural and functional imaging [T1-weighted, diffusion MRI (dMRI), and functional MRI (fMRI)] allows for a multidimensional assessment. While structural modalities provide insights into neuroanatomical morphology, fMRI captures dynamic activity, offering a holistic view of sex-based neurobiological variation [<xref ref-type="bibr" rid="B16">16</xref>–<xref ref-type="bibr" rid="B24">24</xref>].</p>
<p id="p-17">The exclusion of non-English publications and secondary literature was a strategic decision to ensure uniformity in data interpretation and to maintain a focus on original, peer-reviewed findings. These constraints were designed to balance the breadth of the review with the need for high-quality, reproducible data.</p>
</sec>
</sec>
<sec id="t2-4">
<title>Selection process</title>
<p id="p-18">Two reviewers independently screened all titles and abstracts identified through the search. The same reviewers independently assessed full-text articles for eligibility. Disagreements were resolved through consensus, or when necessary, by consultation with a senior author.</p>
</sec>
<sec id="t2-5">
<title>Risk of bias and quality assessment</title>
<p id="p-19">To evaluate the internal validity and methodological rigor of the included studies, a structured narrative quality assessment was performed. In the absence of a singular, universally accepted risk-of-bias tool specifically for ML-neuroimaging, we adapted criteria from the PROBAST (Prediction model Risk Of Bias Assessment Tool) and QUADAS-2 frameworks, tailored to address three critical domains:</p>
<sec id="t2-5-1">
<title>Data leakage and analytical bias</title>
<p id="p-20">A primary focus of our assessment was the identification of data leakage, a significant source of inflated accuracy in ML. We scrutinized studies for:</p>
<p id="p-21">
<list list-type="bullet">
<list-item>
<p>Feature selection leakage: Ensuring feature selection was performed strictly within cross-validation loops rather than on the entire dataset.</p>
</list-item>
<list-item>
<p>Subject overlap: Verifying that samples used for training were strictly isolated from testing, particularly in longitudinal or multi-modal studies where the same participant might appear across different data points.</p>
</list-item>
<list-item>
<p>Validation strategy: We prioritized studies using <italic>k</italic>-fold cross-validation or, ideally, hold-out independent test sets. Studies utilizing simple “train-test splits” on small samples were flagged for high risk of overfitting.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t2-5-2">
<title>Sample size and demographic representativeness</title>
<p id="p-22">We assessed the “power” of the findings based on sample size and diversity:</p>
<p id="p-23">
<list list-type="bullet">
<list-item>
<p>Sample size: Small-scale studies (<italic>n</italic> &lt; 100) were categorized as having a higher risk of capturing dataset-specific noise rather than generalizable sex differences.</p>
</list-item>
<list-item>
<p>Population bias: We evaluated the reliance on high-income, “WEIRD” datasets [e.g., Human Connectome Project (HCP), UK Biobank (UKB)]. While these datasets offer high technical quality, their demographic homogeneity limits the external validity of the resulting models.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t2-5-3">
<title>Image acquisition and preprocessing (confound management)</title>
<p id="p-24">The assessment monitored the handling of technical and biological confounds:</p>
<p id="p-25">
<list list-type="bullet">
<list-item>
<p>TIV and global scaling: Studies were evaluated for whether they corrected for TIV. As noted in our results, the absence of this correction in several high-accuracy studies represents a significant source of classification bias.</p>
</list-item>
<list-item>
<p>Scanner effects: We noted whether studies employed multi-site data or harmonization techniques (e.g., ComBat). Models trained and tested on a single scanner were considered to have a moderate risk of bias due to potential “site-signature” learning.</p>
</list-item>
</list>
</p>
</sec>
</sec>
<sec id="t2-6">
<title>Overall quality synthesis</title>
<p id="p-26">Across the 35 included studies, the risk of bias was found to be moderate to high. While the transition toward deep learning (DL) has improved the handling of complex data, consistent gaps remain—specifically regarding the reporting of TIV-normalization and the use of external, cross-site validation sets. These gaps suggest that the “ceiling” of sex-classification accuracy may be partially bolstered by methodological artifacts.</p>
</sec>
</sec>
<sec id="s3">
<title>Results</title>
<sec id="t3-1">
<title>Study selection and data extraction</title>
<p id="p-27">The study selection and screening process is illustrated in the PRISMA flow diagram (<xref ref-type="fig" rid="fig1">Figure 1</xref>). The initial search across three electronic databases yielded 112 records. Following the removal of 42 duplicate entries, 70 unique records remained for title and abstract screening. Of these, 14 irrelevant studies were excluded, and 56 articles underwent full-text assessment for eligibility. After a detailed review, 21 articles were excluded for not meeting the pre-defined inclusion criteria (e.g., use of 1.5T MRI, focus on clinical populations, or lack of ML-based classification).</p>
<fig id="fig1" position="float">
<label>Figure 1</label>
<caption>
<p id="fig1-p-1">
<bold>PRISMA 2020 flow diagram for new systematic reviews.</bold> Adapted from Page MJ, McKenzie JE, Bossuyt PM, Boutron I, Hoffmann TC, Mulrow CD, et al. The PRISMA 2020 statement: an updated guideline for reporting systematic reviews. BMJ. 2021;372:n71 (doi: 10.1136/bmj.n71). © Author(s) (or their employer(s)) 2021. CC BY. PRISMA: Preferred Reporting Items for Systematic Reviews and Meta-Analyses.</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="ent-06-1004141-g001.tif" />
</fig>
<p id="p-28">Ultimately, 35 articles [<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B16">16</xref>–<xref ref-type="bibr" rid="B48">48</xref>] were deemed eligible and included in the final analysis. Data regarding sample population, age, morphometric features, ML algorithms, and sex-classification accuracy were extracted from these studies and are summarized in <xref ref-type="sec" rid="s-suppl">Table S1</xref>. Our quality assessment revealed a critical methodological landscape: while the field has transitioned toward powerful DL architectures, there remain significant gaps in inference validity. Notably, only a minority of high-accuracy studies explicitly corrected for TIV or employed external, cross-scanner validation sets. This suggests that the reported “performance ceiling” of sex classification may be partially bolstered by allometric scaling and site-specific artifacts.</p>
</sec>
<sec id="t3-2">
<title>High-resolution T1-weighted MRI</title>
<p id="p-29">This systematic review investigated the efficacy of various ML algorithms in classifying sex based on gray matter (GM) morphometric features. Overall, the classification models exhibited high accuracy in distinguishing between sexes, ranging from 56.0% to 98.06%. The highest performing method (98.06%) employed a specialized DL approach termed Multi-Layer 3D Convolution Extreme Learning Machine (MCN-ELM) [<xref ref-type="bibr" rid="B25">25</xref>], while the lowest accuracy (56.0%) was observed using a support vector machine (SVM) [<xref ref-type="bibr" rid="B31">31</xref>].</p>
<sec id="t3-2-1">
<title>Feature selection and morphometry</title>
<p id="p-30">The selection of morphological features is a critical determinant of model performance. Particular emphasis was placed on GM segmentation data, assessed through various measurement approaches:</p>
<p id="p-31">
<list list-type="bullet">
<list-item>
<p>Grey matter volume: Five studies focused on GM volume [<xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B34">34</xref>, <xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B46">46</xref>]. Zhang et al. [<xref ref-type="bibr" rid="B42">42</xref>] (2020) achieved the highest accuracy at 94.3%, followed by Sanchis-Segura et al. [<xref ref-type="bibr" rid="B34">34</xref>] (2022), who reached 90.0% using SVM. Wang et al. [<xref ref-type="bibr" rid="B39">39</xref>] (2012) and Matte Bon et al. [<xref ref-type="bibr" rid="B29">29</xref>] (2024) reported accuracies of 86.1% and 82.3%, respectively. Conversely, Yang et al. [<xref ref-type="bibr" rid="B46">46</xref>] (2021) reported the lowest accuracy in this category at 66.0%. Notably, four of these studies utilized SVM; however, Matte Bon et al. [<xref ref-type="bibr" rid="B29">29</xref>] (2024) employed gradient-boosted trees, achieving 82.3% on limbic volume compared to 77.6% for non-limbic volume.</p>
</list-item>
<list-item>
<p>Global intensity and segmentation: Seven investigations incorporated global GM data or intensity features [<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B40">40</xref>]. Following the 98.06% accuracy of MCN-ELM [<xref ref-type="bibr" rid="B25">25</xref>], Bi et al. [<xref ref-type="bibr" rid="B17">17</xref>] (2023) achieved 97.3% using a Convolutional Neural Network (CNN). Other notable results included 88.0% by Feis et al. [<xref ref-type="bibr" rid="B23">23</xref>], 84.0% using linear regression [<xref ref-type="bibr" rid="B40">40</xref>], and an area under the curve (AUC) of 0.85 using a CNN [<xref ref-type="bibr" rid="B30">30</xref>].</p>
</list-item>
<list-item>
<p>Cortical architecture: Six studies examined intricacies such as 3D morphology, thickness, surface area, and folding indices (gyrification, sulcal depth, and fractal dimension) [<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B24">24</xref>, <xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B37">37</xref>, <xref ref-type="bibr" rid="B48">48</xref>]. Luo et al. [<xref ref-type="bibr" rid="B28">28</xref>] (2019) reached 96.77% accuracy using hierarchical sparse representation-based classification (HSRC). Ge et al. [<xref ref-type="bibr" rid="B24">24</xref>] (2021) found that among five cortical features, cortical thickness yielded the highest accuracy (80.0%), followed by the gyrification index (72.0%) and sulcal depth (70.0%). Similarly, Metoki et al. [<xref ref-type="bibr" rid="B48">48</xref>] (2024) reported 76.0% accuracy for cortical thickness.</p>
</list-item>
<list-item>
<p>Modified indices: Studies employing modified indices (asymmetry, <italic>z</italic>-scores, or networks) generally reported lower performance [<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B31">31</xref>]. For example, Dumitru [<xref ref-type="bibr" rid="B4">4</xref>] (2023) utilized brain asymmetry indices [subtraction index (SI), distance index (DI), and laterality index (LI)], yielding accuracies between 62.0% and 64.0%. However, Ebel et al. [<xref ref-type="bibr" rid="B9">9</xref>] (2023) achieved 95.78% using <italic>z</italic>-score normalization of GM voxels with logistic regression (LR).</p>
</list-item>
<list-item>
<p>The influence of global scaling: We observed a clear performance discrepancy linked to TIV management. Studies utilizing uncorrected GM volume, such as Sanchis-Segura et al. [<xref ref-type="bibr" rid="B34">34</xref>] (2022), reached 90.0% accuracy. However, the same study demonstrated that these differences attenuate significantly when TIV is controlled for, suggesting that uncorrected models may simply be identifying “head size”.</p>
</list-item>
<list-item>
<p>Feature sensitivity: Specialized DL approaches, such as the MCN-ELM [<xref ref-type="bibr" rid="B25">25</xref>], achieved the review’s highest accuracy (98.06%) by learning complex non-linear patterns. In contrast, models using brain asymmetry indices reported significantly lower accuracies (62.0–64.0%) [<xref ref-type="bibr" rid="B4">4</xref>], highlighting that predictive power is highly dependent on the “proxy potential” of the selected features.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t3-2-2">
<title>Multimodal and regional specificity</title>
<p id="p-32">Seven studies explored combining multiple morphological features, consistently revealing higher accuracies than individual features alone [<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B24">24</xref>, <xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B40">40</xref>, <xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B47">47</xref>]. For instance, Brennan et al. [<xref ref-type="bibr" rid="B18">18</xref>] (2021) observed an increase in accuracy to 86.33% (from a baseline of 69.0–76.0%) when combining cortical area, thickness, volume, and intensity metrics.</p>
<p id="p-33">Identifying discriminative brain regions further illuminates the landscape of sexual dimorphism. Matte Bon et al. [<xref ref-type="bibr" rid="B29">29</xref>] (2024) found that limbic volume (82.3%) was more predictive than whole-brain volume (79.7%). Conversely, Ebel et al. [<xref ref-type="bibr" rid="B9">9</xref>] (2023) reported that the whole brain exhibited the highest predictive power (AUC = 0.98), followed by the cerebellum (0.95) and thalamus (0.88). Luo et al. [<xref ref-type="bibr" rid="B28">28</xref>] (2019) noted that frontal regions were the most discriminative (87.87%), whereas the temporal gyrus was the least (62.89%).</p>
</sec>
</sec>
<sec id="t3-3">
<title>Diffusion-weighted MRI</title>
<p id="p-34">Diffusion-weighted imaging (DWI) examines water diffusion patterns to assess white matter microstructural integrity and brain connectivity. Five of the included studies utilized diffusion-based features for sex classification [<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B47">47</xref>].</p>
<p id="p-35">
<list list-type="bullet">
<list-item>
<p>Fractional anisotropy (FA) and DL: Xin et al. [<xref ref-type="bibr" rid="B43">43</xref>] (2019) achieved a peak accuracy of 93.3% using FA maps paired with a 3D CNN; notably, their comparative SVM model reached only 78.2% on the same data. Chen et al. [<xref ref-type="bibr" rid="B19">19</xref>] (2024) reported a similar accuracy of 91.0% using FA with a 2D CNN, which unexpectedly outperformed both 3D CNN and Vision Transformer (ViT) architectures. This indicates that DL excels at extracting subtle connectivity signatures that traditional ML (TML) misses.</p>
</list-item>
<list-item>
<p>Performance variance: Yeung et al. [<xref ref-type="bibr" rid="B47">47</xref>] (2023) obtained comparatively lower accuracies—79.74% for FA and 78.15% for mean diffusivity (MD)—using the BrainNet CNN framework. Similarly, Yang et al. [<xref ref-type="bibr" rid="B46">46</xref>] (2021) reported an accuracy of only 55.0% using an SVM on diffusion tensor data.</p>
</list-item>
<list-item>
<p>Multimodal enhancement: A consistent finding across diffusion studies was the benefit of multimodal integration. Feis et al. [<xref ref-type="bibr" rid="B23">23</xref>] (2013) achieved 83.0% accuracy using FA data alone, which increased significantly to 96.0% when combined with T1- and T2-weighted GM segmentation features. This trend was mirrored by Yang et al. [<xref ref-type="bibr" rid="B46">46</xref>] (2021), whose accuracy improved from 55.0% to 72.0% when diffusion features were fused with T1-weighted data.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t3-4">
<title>Functional MRI</title>
<p id="p-36">fMRI captures dynamic brain activity by measuring blood-oxygen-level-dependent (BOLD) signals. This review evaluated both task-based fMRI, which maps activity during specific cognitive challenges, and resting-state fMRI (rs-fMRI), which assesses intrinsic functional connectivity.</p>
<p id="p-37">
<list list-type="bullet">
<list-item>
<p>Task-based fMRI: Two studies utilized task-based paradigms, reporting moderate classification performance. Leming and Suckling (2021) achieved an AUC of 0.783 using an emotion-processing task, while Xu et al. [<xref ref-type="bibr" rid="B44">44</xref>] (2020) reported an accuracy of 75.86% using a language-based paradigm.</p>
</list-item>
<list-item>
<p>rs-fMRI: Resting-state studies generally yielded higher accuracies, particularly when employing DL architectures. Ryali et al. [<xref ref-type="bibr" rid="B33">33</xref>] (2024) achieved a peak accuracy of 94.72% using a spatiotemporal deep neural network (stDNN). High performance was also reported by Sen and Parhi [<xref ref-type="bibr" rid="B36">36</xref>] (2021) at 94.0%, utilizing a random forest (RF) classifier on dynamic functional connectivity measures (tensor PARAFAC). Fan et al. [<xref ref-type="bibr" rid="B22">22</xref>] (2020) reported 93.05% accuracy by implementing a hybrid CNN-LSTM (long short-term memory) architecture to capture temporal dependencies.</p>
</list-item>
<list-item>
<p>Standard performance and baselines: Most rs-fMRI studies reported accuracies between 80.0% and 90.0% [<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B40">40</xref>, <xref ref-type="bibr" rid="B48">48</xref>]. Conversely, the lowest performances were observed in studies utilizing SVM: Patel et al. [<xref ref-type="bibr" rid="B32">32</xref>] (2024) reported 67.53%, and Satterthwaite et al. [<xref ref-type="bibr" rid="B35">35</xref>] (2015) reported 71.0%.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t3-5">
<title>Combination of MRI sequences</title>
<p id="p-38">A key finding across the literature is the significant improvement in classification accuracy achieved through the integration of multiple MRI sequences. Five studies demonstrated that fusing morphological and functional data—including T1-weighted, T2-weighted, diffusion-weighted, and functional (resting-state and task-evoked) MRI—consistently outperformed single-modality models.</p>
<p id="p-39">
<list list-type="bullet">
<list-item>
<p>Incremental gains: The earliest evidence for this trend came from Wang et al. [<xref ref-type="bibr" rid="B39">39</xref>] (2012), who observed that combining GM volume with rs-fMRI increased accuracy to 89.1%, surpassing the 86.1% achieved using GM volume alone.</p>
</list-item>
<list-item>
<p>Structural synergy: Feis et al. [<xref ref-type="bibr" rid="B23">23</xref>] (2013) achieved a near-perfect accuracy of 96.0% by integrating features from three structural sequences: T1-weighted (88.0%), T2-weighted (85.0%), and diffusion-weighted MRI (83.0%).</p>
</list-item>
<list-item>
<p>Holistic multimodal integration: More recent investigations utilizing both structural and functional domains have reported the highest accuracies in the review. Weber et al. [<xref ref-type="bibr" rid="B40">40</xref>] (2022) achieved 93.3%, while Zhang et al. [<xref ref-type="bibr" rid="B42">42</xref>] (2020) reached a peak of 96.6% by synthesizing features from GM, white matter, rs-fMRI, and task-evoked fMRI.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t3-6">
<title>Classification model performance</title>
<p id="p-40">A comparative analysis of the included studies reveals distinct patterns between TML and DL architectures. While TML models—including SVM, RFs, and gradient boosted trees—demonstrated high performance, DL models consistently established the upper bounds of classification accuracy.</p>
<p id="p-41">
<list list-type="bullet">
<list-item>
<p>TML: Among studies utilizing TML, the peak accuracy reached was 96.77%, achieved by Luo et al. [<xref ref-type="bibr" rid="B28">28</xref>] (2019) through their HSRC approach. SVM was the most prevalent algorithm, utilized in 17 studies. Zhang et al. [<xref ref-type="bibr" rid="B42">42</xref>] (2020) reported the highest SVM-based accuracy (96.6%) by integrating structural and functional features. However, TML performance varied significantly, with some SVM models reporting accuracies as low as 55.0% [<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B46">46</xref>], highlighting a high sensitivity to feature selection and preprocessing.</p>
</list-item>
<list-item>
<p>DL: DL techniques, particularly CNNs, pushed accuracy thresholds further. The highest overall accuracy in this review (98.06%) was achieved using a specialized MCN-ELM [<xref ref-type="bibr" rid="B25">25</xref>].</p>
</list-item>
</list>
</p>
<p id="p-42">In head-to-head evaluations, the choice of algorithm often dictated performance. Sanchis-Segura et al. [<xref ref-type="bibr" rid="B34">34</xref>] (2022) compared five algorithms [linear discriminant analysis (LDA), LR, MARS, RF, and SVM] in a sex- and age-matched cohort (<italic>n</italic> = 876), finding that SVM outperformed the others with an accuracy of 90.0% when using uncorrected GM volume.</p>
<p id="p-43">However, the assumption that DL always outperforms TML was challenged by Ebel et al. [<xref ref-type="bibr" rid="B9">9</xref>] (2023). In their study using the Study of Health in Pomerania (SHIP) dataset, LR (95.78%) outperformed a CNN [<xref ref-type="bibr" rid="B9">9</xref>]. This was attributed to the use of <italic>z</italic>-score normalization on GM voxels, suggesting that rigorous feature engineering in TML can occasionally match or exceed the automated feature extraction of DL models. This dichotomy underscores that while DL generally offers higher ceilings, TML remains highly effective when paired with optimized preprocessing.</p>
</sec>
<sec id="t3-7">
<title>Age-stratified classification performance</title>
<p id="p-44">Given that brain maturation and aging involve distinct neurobiological processes, this review assessed how ML accuracy varies across the lifespan.</p>
<p id="p-45">
<list list-type="bullet">
<list-item>
<p>Children and adolescents (under 23 years): Eight studies focused on younger populations [<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B35">35</xref>, <xref ref-type="bibr" rid="B37">37</xref>, <xref ref-type="bibr" rid="B38">38</xref>, <xref ref-type="bibr" rid="B46">46</xref>]. The highest accuracy reported was 97.3% in a large-scale study of approximately 11,000 children (aged 9–12 years) from the Adolescent Brain Cognitive Development (ABCD) study [<xref ref-type="bibr" rid="B17">17</xref>]. This suggests that sex-specific neuroanatomical patterns are already highly distinguishable by late childhood.</p>
</list-item>
<list-item>
<p>Young adults (20–37 years): This demographic was the most frequently studied, with 17 investigations primarily utilizing the HCP dataset [<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B24">24</xref>, <xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B33">33</xref>, <xref ref-type="bibr" rid="B34">34</xref>, <xref ref-type="bibr" rid="B36">36</xref>, <xref ref-type="bibr" rid="B40">40</xref>, <xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B45">45</xref>, <xref ref-type="bibr" rid="B46">46</xref>]. The review’s peak accuracy of 98.06% was achieved within this group using a DL architecture, suggesting that the early adult brain may represent the “pinnacle” of sexual dimorphism in neuroimaging features [<xref ref-type="bibr" rid="B25">25</xref>].</p>
</list-item>
<list-item>
<p>Lifespan and older adults (14–90 years): Six studies examined broader age ranges to capture aging effects [<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B47">47</xref>]. The highest accuracy in these heterogeneous samples was 95.78%, achieved through the SHIP cohort [<xref ref-type="bibr" rid="B9">9</xref>]. The slightly lower ceiling in lifespan studies compared to young adult cohorts may reflect the increased inter-individual variability and cortical atrophy associated with aging, which can obscure sex-specific features.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t3-8">
<title>Stratification by age and brain volume</title>
<p id="p-46">To reach further stratification power, the included studies were characterized by developmental stage and morphometric constraints. A clear performance gradient emerged when stratifying by age: studies focusing on the adolescent stratum (9–12 years) and young adult stratum (20–35 years) reported the highest mean accuracies (97.3% and 98.06%, respectively). In contrast, studies spanning the full adult lifespan (14–90 years) showed increased variance and a slightly lower performance ceiling (95.78%), likely due to age-related cortical atrophy. Furthermore, when characterizing groups by TIV, studies that did not stratify for head size reported consistently higher accuracies. This suggests that the “power” of sex classification is significantly mediated by the homogeneity of the age and size strata being analyzed.</p>
</sec>
</sec>
<sec id="s4">
<title>Discussion</title>
<p id="p-47">This systematic review demonstrates that while ML can classify biological sex from neuroimaging data with high precision, these results require a fundamental shift in interpretation. By synthesizing evidence across diverse age groups and imaging modalities, we find that while human brains can be categorized with up to 98.06% accuracy, these results are heavily influenced by model architecture, feature selection, and, crucially, methodological rigor. While high accuracies are often used to reinforce the existence of sex-related neuroanatomical patterns [<xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B29">29</xref>], they must be interrogated to determine if they represent biologically meaningful dimorphism or merely enable statistical separation via proxies.</p>
<sec id="t4-1">
<title>The “big brain problem” and inferential validity</title>
<p id="p-48">The most consequential finding regarding the validity of these models is the role of confounding factors, primarily TIV. Because male brains are, on average, 8–12% larger than female brains [<xref ref-type="bibr" rid="B10">10</xref>], models trained on uncorrected volumetric data may achieve “near-perfect” accuracies by exploiting global scaling cues rather than intrinsic multivariate morphology. Our review found that reporting on TIV correction was alarmingly limited [<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B34">34</xref>]. As Sanchis-Segura et al. [<xref ref-type="bibr" rid="B34">34</xref>] demonstrated, sex differences appear “large” when uncorrected but become significantly attenuated once TIV is controlled. If a model “cheats” by using head size as a proxy for sex, it is not identifying neurobiological sex differences, but rather allometric scaling. This distinction is vital: if the predictive signal is size-driven, the field is not yet in a position to use these models as evidence for stable, mechanistically informative dimorphism.</p>
</sec>
<sec id="t4-2">
<title>Algorithmic efficacy: TML vs. DL</title>
<p id="p-49">The transition toward DL has pushed classification boundaries toward a 98% ceiling [<xref ref-type="bibr" rid="B25">25</xref>]. Architectures such as 3D CNNs excel by automatically learning complex, non-linear spatiotemporal patterns. However, DL models showed higher sensitivity to methodological artifacts. While TML, specifically SVMs, remains the most utilized due to transparency [<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B23">23</xref>], DL is the primary driver of state-of-the-art precision. Yet, without robust explainability, it remains unclear if these “black box” models are identifying biological truth or “predictive noise”.</p>
</sec>
<sec id="t4-3">
<title>The power of multimodal integration</title>
<p id="p-50">Integrating multiple MRI sequences consistently outperformed single-modality models [<xref ref-type="bibr" rid="B40">40</xref>]. Fusing structural (T1w, T1-weighted image), diffusion (dMRI), and functional (fMRI) data allows for a holistic view of sex-based variation. However, the increased accuracy of multimodal models (up to 96.6%) may also amplify the aggregation of confounding signals—such as motion artifacts in fMRI paired with size-bias in T1w data—unless rigorous cross-modal confound control is applied.</p>
</sec>
<sec id="t4-4">
<title>Statistical inference vs. ML prioritization</title>
<p id="p-51">A critical methodological tension exists between traditional statistical-driven and ML-driven applications. While statistical approaches prioritize the identification of significant regional differences (inference), ML prioritizes the maximization of classification accuracy (prediction). Our analysis highlights that these two approaches do not always yield the same prioritization of brain features [<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B34">34</xref>]. For instance, an ML model might prioritize a combination of subtle, non-significant features—such as cortical folding patterns or functional connectivity weights—to reach high accuracy. This discrepancy suggests that ML may “prioritize” features that are statistically weak on their own but computationally powerful in aggregate, potentially exploiting “predictive noise” that lacks true inferential validity.</p>
</sec>
<sec id="t4-5">
<title>Technical limitations and the fragility of generalizability</title>
<p id="p-52">High accuracy does not equate to biological generalizability. A recurring limitation is the absence of cross-site or cross-scanner validation. Models trained on single-site datasets (e.g., HCP, UKB) may inadvertently learn “site-specific signatures”—such as scanner gradients or head-coil configurations—rather than universal biological signals. Furthermore, the reliance on WEIRD (Western, Educated, Industrialized, Rich, Democratic) populations introduces demographic biases. An accuracy of 98% may reflect overfitting to site-specific noise and demographic homogeneity, failing when applied to more diverse groups.</p>
</sec>
<sec id="t4-6">
<title>Beyond determinism: the mosaic brain</title>
<p id="p-53">Crucially, these findings do not imply deterministic brain dimorphism. High classification accuracy is a testament to the power of multivariate statistics to find patterns in overlapping data, not an endorsement of binary biological essentialism. Individual brains are more accurately described as a “mosaic” [<xref ref-type="bibr" rid="B6">6</xref>] of features. Transparent reporting and cautious interpretation are essential to prevent the misuse of high-accuracy ML results in contexts that demand binary certainty, where nature provides a spectrum of variability.</p>
</sec>
<sec id="t4-7">
<title>Ethical considerations</title>
<p id="p-54">The high classification accuracies identified in this review—reaching up to 98.06%—necessitate a move beyond viewing sex-classification as a purely technical challenge. Our findings reveal specific methodological trends that carry significant ethical weight.</p>
<p id="p-55">Our review found that T1-weighted imaging and DL architectures (e.g., MCN-ELM) produce the highest accuracies. However, these results must be interpreted with caution. There is a profound ethical risk that these “near-perfect” statistical separations are used to support essentialist claims—the idea that male and female brains are “opposite” or “dimorphic”. As noted in our discussion of the “brain mosaic”, high accuracy in a multivariate model does not negate the extensive overlap in individual brain features. Misrepresenting these statistical patterns as deterministic labels could be misused to justify gender-based discrimination in education, employment, or forensic contexts.</p>
<p id="p-56">Our findings show a heavy reliance on datasets like the HCP, UKB, and ABCD. Because these cohorts predominantly sample WEIRD populations, there is a direct ethical risk of creating inequitable algorithms. If a model achieves 98% accuracy on a high-income, Western cohort but is then deployed in a global health context without cross-cultural validation, it may produce biased or invalid results for underrepresented groups. The “robustness” reported in current literature is, therefore, demographically “fragile”, potentially reinforcing systemic healthcare disparities.</p>
<p id="p-57">A critical ethical concern arising from our analysis is the lack of TIV correction in several high-accuracy studies. When models “cheat” by using global head size as a proxy for sex, they are not identifying neurobiological sex differences; they are identifying physical scale. Attributing this to “brain sex” is ethically problematic, as it presents a technical confound as an innate biological truth, potentially leading to flawed theories about cognitive or behavioral differences.</p>
</sec>
<sec id="t4-8">
<title>Recommendations for ethical research</title>
<p id="p-58">To mitigate these risks, we recommend that future neuroimaging-ML research adopt the following mandatory reporting standards:</p>
<p id="p-59">
<list list-type="simple">
<list-item>
<label>1.</label>
<p>Mandatory TIV disclosure: Researchers must explicitly report whether and how they corrected for TIV to ensure accuracy reflects morphology, not just size.</p>
</list-item>
<list-item>
<label>2.</label>
<p>Granular demographic reporting: Manuscripts should include a detailed “diversity statement” regarding the training data, specifying the ethnicity, socioeconomic status, and geographic origin of participants.</p>
</list-item>
<list-item>
<label>3.</label>
<p>Cross-dataset validation: High accuracy claims should be treated as preliminary until validated on an external, demographically distinct dataset to test for algorithmic fairness.</p>
</list-item>
<list-item>
<label>4.</label>
<p>Interpretive caution: Results should be framed in terms of “statistical classification” rather than “biological essence”, explicitly acknowledging the role of neuroplasticity and environment in shaping the observed features.</p>
</list-item>
</list>
</p>
</sec>
<sec id="t4-9">
<title>Limitations</title>
<p id="p-60">A primary limitation of this systematic review is the methodological heterogeneity regarding confound management, particularly TIV. Since male brains are, on average, 8–12% larger than female brains, models that do not rigorously normalize for TIV—a gap identified in several high-accuracy studies—may be capturing allometric scaling rather than intrinsic neuroanatomical dimorphism. This “size-confounding” significantly inflates accuracy and obscures true biological signals.</p>
<p id="p-61">Furthermore, the field’s heavy reliance on a few large, shared public datasets (e.g., HCP, UKB) introduces a profound population bias. These datasets represent WEIRD cohorts, which lack the diversity necessary to claim universal biological validity. The absence of cross-site validation in many studies suggests that models may be overfitting to site-specific noise—such as scanner manufacturer gradients or specific preprocessing idiosyncrasies—rather than generalizable neurobiology. This “site-signature” effect means that a 98% accuracy on one dataset might drop to chance levels when applied to another [<xref ref-type="bibr" rid="B44">44</xref>].</p>
<p id="p-62">The absence of prospective protocol registration in a repository such as PROSPERO is a notable limitation. Although the review followed a rigorous, predefined internal protocol verified by multiple independent authors to minimize selective reporting bias, the lack of public registration may impact the transparency of the study selection process. Additionally, while our search was expanded to include Web of Science, PubMed, and Scopus to capture the interdisciplinary intersection of neuroscience and engineering, the exclusion of other technical databases (e.g., IEEE Xplore) remains a potential constraint on the absolute comprehensiveness of the literature surveyed. Finally, the restriction to English-language publications may exclude culturally diverse findings that could further challenge the “binary” narrative of brain sex. These combined artifacts suggest that current literature may provide an inflated sense of certainty regarding the categorical distinction of the human brain.</p>
</sec>
<sec id="t4-10">
<title>Conclusion</title>
<p id="p-63">This systematic review reveals that while ML can achieve peak accuracies of 98.06% in sex classification, these results must be viewed with significant skepticism. The high performance is likely bolstered by methodological artifacts, including inadequate TIV correction and the learning of dataset-specific scanner signatures. Rather than confirming a deterministic binary, these models identify population-level statistical trends that are heavily influenced by global head size and demographic homogeneity.</p>
<p id="p-64">We conclude that the human brain is better described as a mosaic of overlapping features rather than two distinct categories. For ML to move from a “pattern detector” to a valid neuroscientific tool, future research must prioritize mandatory TIV disclosure, cross-site validation, and the use of demographically diverse datasets. Without these rigorous standards, high classification accuracy remains a statistical achievement of limited biological and clinical utility.</p>
</sec>
</sec>
</body>
<back>
<glossary>
<title>Abbreviations</title>
<def-list>
<def-item>
<term>ABCD</term>
<def>
<p>Adolescent Brain Cognitive Development</p>
</def>
</def-item>
<def-item>
<term>AUC</term>
<def>
<p>area under the curve</p>
</def>
</def-item>
<def-item>
<term>CNN</term>
<def>
<p>Convolutional Neural Network</p>
</def>
</def-item>
<def-item>
<term>DI</term>
<def>
<p>distance index</p>
</def>
</def-item>
<def-item>
<term>DL</term>
<def>
<p>deep learning</p>
</def>
</def-item>
<def-item>
<term>dMRI</term>
<def>
<p>diffusion magnetic resonance imaging</p>
</def>
</def-item>
<def-item>
<term>DWI</term>
<def>
<p>diffusion-weighted imaging</p>
</def>
</def-item>
<def-item>
<term>FA</term>
<def>
<p>fractional anisotropy</p>
</def>
</def-item>
<def-item>
<term>fMRI</term>
<def>
<p>functional magnetic resonance imaging</p>
</def>
</def-item>
<def-item>
<term>GM</term>
<def>
<p>gray matter</p>
</def>
</def-item>
<def-item>
<term>HCP</term>
<def>
<p>Human Connectome Project</p>
</def>
</def-item>
<def-item>
<term>HSRC</term>
<def>
<p>hierarchical sparse representation-based classification</p>
</def>
</def-item>
<def-item>
<term>LDA</term>
<def>
<p>linear discriminant analysis</p>
</def>
</def-item>
<def-item>
<term>LI</term>
<def>
<p>laterality index</p>
</def>
</def-item>
<def-item>
<term>LR</term>
<def>
<p>logistic regression</p>
</def>
</def-item>
<def-item>
<term>LSTM</term>
<def>
<p>long short-term memory</p>
</def>
</def-item>
<def-item>
<term>MCN-ELM</term>
<def>
<p>Multi-Layer 3D Convolution Extreme Learning Machine</p>
</def>
</def-item>
<def-item>
<term>MD</term>
<def>
<p>mean diffusivity</p>
</def>
</def-item>
<def-item>
<term>ML</term>
<def>
<p>machine learning</p>
</def>
</def-item>
<def-item>
<term>MRI</term>
<def>
<p>magnetic resonance imaging</p>
</def>
</def-item>
<def-item>
<term>PRISMA</term>
<def>
<p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p>
</def>
</def-item>
<def-item>
<term>RF</term>
<def>
<p>random forest</p>
</def>
</def-item>
<def-item>
<term>rs-fMRI</term>
<def>
<p>resting-state functional magnetic resonance imaging</p>
</def>
</def-item>
<def-item>
<term>SHIP</term>
<def>
<p>Study of Health in Pomerania</p>
</def>
</def-item>
<def-item>
<term>SI</term>
<def>
<p>subtraction index</p>
</def>
</def-item>
<def-item>
<term>SNR</term>
<def>
<p>signal-to-noise ratio</p>
</def>
</def-item>
<def-item>
<term>stDNN</term>
<def>
<p>spatiotemporal deep neural network</p>
</def>
</def-item>
<def-item>
<term>SVM</term>
<def>
<p>support vector machine</p>
</def>
</def-item>
<def-item>
<term>T1w</term>
<def>
<p>T1-weighted image</p>
</def>
</def-item>
<def-item>
<term>TIV</term>
<def>
<p>total intracranial volume</p>
</def>
</def-item>
<def-item>
<term>TML</term>
<def>
<p>traditional machine learning</p>
</def>
</def-item>
<def-item>
<term>UKB</term>
<def>
<p>UK Biobank</p>
</def>
</def-item>
<def-item>
<term>WEIRD</term>
<def>
<p>Western, Educated, Industrialized, Rich, Democratic</p>
</def>
</def-item>
</def-list>
</glossary>
<sec id="s-suppl" sec-type="supplementary-material">
<title>Supplementary materials</title>
<p>The supplementary table for this article is available at: <uri xlink:href="https://www.explorationpub.com/uploads/Article/file/1004141_sup_1.pdf">https://www.explorationpub.com/uploads/Article/file/1004141_sup_1.pdf</uri>.</p>
<supplementary-material id="SD1" content-type="local-data">
<media xlink:href="1004141_sup_1.pdf" mimetype="application" mime-subtype="pdf"></media>
</supplementary-material>
</sec>
<sec id="s6">
<title>Declarations</title>
<sec id="t-6-1">
<title>Acknowledgments</title>
<p>During the preparation of this work, the authors used Gemini (Google) to improve the manuscript's linguistic clarity, readability, and grammatical accuracy. This service was utilized solely as a language-polishing tool following the completion of the initial draft. The authors formally confirm that all substantive intellectual content, data analysis, interpretation of results, and final conclusions are entirely their own. The AI tool did not generate new ideas, perform statistical evaluations, or influence the scientific direction of the study. After using this service, the authors reviewed and edited the content as needed and take full responsibility for the entire content of the publication.</p>
</sec>
<sec id="t-6-2">
<title>Author contributions</title>
<p>AHS: Investigation, Formal analysis, Data curation, Methodology, Writing—original draft. IJ: Supervision, Conceptualization, Methodology, Funding acquisition, Writing—review &amp; editing. ZAAM: Supervision, Conceptualization, Methodology, Funding acquisition, Writing—review &amp; editing. MIMT: Supervision, Conceptualization, Methodology, Funding acquisition, Writing—review &amp; editing. MZCA: Supervision, Conceptualization, Methodology, Funding acquisition, Writing—review &amp; editing. ST: Visualization, Validation. All authors read and approved the submitted version.</p>
</sec>
<sec id="t-6-3" sec-type="COI-statement">
<title>Conflicts of interest</title>
<p>The authors declare that they have no conflicts of interest.</p>
</sec>
<sec id="t-6-4">
<title>Ethical approval</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-5">
<title>Consent to participate</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-6">
<title>Consent to publication</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-7" sec-type="data-availability">
<title>Availability of data and materials</title>
<p>The datasets supporting the findings of this study are available from the corresponding author upon reasonable request.</p>
</sec>
<sec id="t-6-8">
<title>Funding</title>
<p>This research is part of the Fundamental Research Grant Scheme (FRGS/1/2024/WAS12/UIAM/01/3) under the Ministry of Higher Education Malaysia. The funder had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</p>
</sec>
<sec id="t-6-9">
<title>Copyright</title>
<p>© The Author(s) 2026.</p>
</sec>
</sec>
<sec id="s7">
<title>Publisher’s note</title>
<p>Open Exploration maintains a neutral stance on jurisdictional claims in published institutional affiliations and maps. All opinions expressed in this article are the personal views of the author(s) and do not represent the stance of the editorial team or the publisher.</p>
</sec>
<ref-list>
<ref id="B1">
<label>1</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Janowsky</surname>
<given-names>JS</given-names>
</name>
</person-group>
<article-title>Sexual dimorphism in the human brain: dispelling the myths</article-title>
<source>Dev Med Child Neurol</source>
<year iso-8601-date="1989">1989</year>
<volume>31</volume>
<fpage>257</fpage>
<lpage>63</lpage>
<pub-id pub-id-type="doi">10.1111/j.1469-8749.1989.tb03987.x</pub-id>
<pub-id pub-id-type="pmid">2661290</pub-id>
</element-citation>
</ref>
<ref id="B2">
<label>2</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ingalhalikar</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Parker</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Satterthwaite</surname>
<given-names>TD</given-names>
</name>
<name>
<surname>Elliott</surname>
<given-names>MA</given-names>
</name>
<name>
<surname>Ruparel</surname>
<given-names>K</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Sex differences in the structural connectome of the human brain</article-title>
<source>Proc Natl Acad Sci U S A</source>
<year iso-8601-date="2014">2014</year>
<volume>111</volume>
<fpage>823</fpage>
<lpage>8</lpage>
<pub-id pub-id-type="doi">10.1073/pnas.1316909110</pub-id>
<pub-id pub-id-type="pmid">24297904</pub-id>
<pub-id pub-id-type="pmcid">PMC3896179</pub-id>
</element-citation>
</ref>
<ref id="B3">
<label>3</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wierenga</surname>
<given-names>LM</given-names>
</name>
<name>
<surname>Doucet</surname>
<given-names>GE</given-names>
</name>
<name>
<surname>Dima</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Agartz</surname>
<given-names>I</given-names>
</name>
<name>
<surname>Aghajani</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Akudjedu</surname>
<given-names>TN</given-names>
</name>
<etal>et al.</etal>
<collab>Karolinska Schizophrenia Project (KaSP) Consortium</collab>
<name>
<surname>Klein</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Koenders</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Kolskår</surname>
<given-names>KK</given-names>
</name>
<name>
<surname>Krämer</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Kuntsi</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Lagopoulos</surname>
<given-names>J</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Greater male than female variability in regional brain structure across the lifespan</article-title>
<source>Hum Brain Mapp</source>
<year iso-8601-date="2022">2022</year>
<volume>43</volume>
<fpage>470</fpage>
<lpage>99</lpage>
<pub-id pub-id-type="doi">10.1002/hbm.25204</pub-id>
<pub-id pub-id-type="pmid">33044802</pub-id>
<pub-id pub-id-type="pmcid">PMC8675415</pub-id>
</element-citation>
</ref>
<ref id="B4">
<label>4</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dumitru</surname>
<given-names>ML</given-names>
</name>
</person-group>
<article-title>Brain asymmetry is globally different in males and females: exploring cortical volume, area, thickness, and mean curvature</article-title>
<source>Cereb Cortex</source>
<year iso-8601-date="2023">2023</year>
<volume>33</volume>
<fpage>11623</fpage>
<lpage>33</lpage>
<pub-id pub-id-type="doi">10.1093/cercor/bhad396</pub-id>
<pub-id pub-id-type="pmid">37851852</pub-id>
<pub-id pub-id-type="pmcid">PMC10724869</pub-id>
</element-citation>
</ref>
<ref id="B5">
<label>5</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Witelson</surname>
<given-names>SF</given-names>
</name>
<name>
<surname>Beresh</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Kigar</surname>
<given-names>DL</given-names>
</name>
</person-group>
<article-title>Intelligence and brain size in 100 postmortem brains: sex, lateralization and age factors</article-title>
<source>Brain</source>
<year iso-8601-date="2006">2006</year>
<volume>129</volume>
<fpage>386</fpage>
<lpage>98</lpage>
<pub-id pub-id-type="doi">10.1093/brain/awh696</pub-id>
<pub-id pub-id-type="pmid">16339797</pub-id>
</element-citation>
</ref>
<ref id="B6">
<label>6</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Joel</surname>
<given-names>D</given-names>
</name>
</person-group>
<article-title>Beyond the binary: Rethinking sex and the brain</article-title>
<source>Neurosci Biobehav Rev</source>
<year iso-8601-date="2021">2021</year>
<volume>122</volume>
<fpage>165</fpage>
<lpage>75</lpage>
<pub-id pub-id-type="doi">10.1016/j.neubiorev.2020.11.018</pub-id>
<pub-id pub-id-type="pmid">33440198</pub-id>
</element-citation>
</ref>
<ref id="B7">
<label>7</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Joel</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Garcia-Falgueras</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Swaab</surname>
<given-names>D</given-names>
</name>
</person-group>
<article-title>The Complex Relationships between Sex and the Brain</article-title>
<source>Neuroscientist</source>
<year iso-8601-date="2020">2020</year>
<volume>26</volume>
<fpage>156</fpage>
<lpage>69</lpage>
<pub-id pub-id-type="doi">10.1177/1073858419867298</pub-id>
<pub-id pub-id-type="pmid">31509086</pub-id>
</element-citation>
</ref>
<ref id="B8">
<label>8</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Joel</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Persico</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Salhov</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Berman</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Oligschläger</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Meilijson</surname>
<given-names>I</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Analysis of Human Brain Structure Reveals that the Brain “Types” Typical of Males Are Also Typical of Females, and Vice Versa</article-title>
<source>Front Hum Neurosci</source>
<year iso-8601-date="2018">2018</year>
<volume>12</volume>
<elocation-id>399</elocation-id>
<pub-id pub-id-type="doi">10.3389/fnhum.2018.00399</pub-id>
<pub-id pub-id-type="pmid">30405373</pub-id>
<pub-id pub-id-type="pmcid">PMC6204758</pub-id>
</element-citation>
</ref>
<ref id="B9">
<label>9</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ebel</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Domin</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Neumann</surname>
<given-names>N</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>CO</given-names>
</name>
<name>
<surname>Lotze</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Stanke</surname>
<given-names>M</given-names>
</name>
</person-group>
<article-title>Classifying sex with volume-matched brain MRI</article-title>
<source>Neuroimage Rep</source>
<year iso-8601-date="2023">2023</year>
<volume>3</volume>
<elocation-id>100181</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.ynirp.2023.100181</pub-id>
<pub-id pub-id-type="pmid">40567385</pub-id>
<pub-id pub-id-type="pmcid">PMC12172721</pub-id>
</element-citation>
</ref>
<ref id="B10">
<label>10</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ruigrok</surname>
<given-names>AN</given-names>
</name>
<name>
<surname>Salimi-Khorshidi</surname>
<given-names>G</given-names>
</name>
<name>
<surname>Lai</surname>
<given-names>MC</given-names>
</name>
<name>
<surname>Baron-Cohen</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Lombardo</surname>
<given-names>MV</given-names>
</name>
<name>
<surname>Tait</surname>
<given-names>RJ</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>A meta-analysis of sex differences in human brain structure</article-title>
<source>Neurosci Biobehav Rev</source>
<year iso-8601-date="2014">2014</year>
<volume>39</volume>
<fpage>34</fpage>
<lpage>50</lpage>
<pub-id pub-id-type="doi">10.1016/j.neubiorev.2013.12.004</pub-id>
<pub-id pub-id-type="pmid">24374381</pub-id>
<pub-id pub-id-type="pmcid">PMC3969295</pub-id>
</element-citation>
</ref>
<ref id="B11">
<label>11</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beacher</surname>
<given-names>FD</given-names>
</name>
<name>
<surname>Minati</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Baron-Cohen</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Lombardo</surname>
<given-names>MV</given-names>
</name>
<name>
<surname>Lai</surname>
<given-names>MC</given-names>
</name>
<name>
<surname>Gray</surname>
<given-names>MA</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Autism attenuates sex differences in brain structure: a combined voxel-based morphometry and diffusion tensor imaging study</article-title>
<source>AJNR Am J Neuroradiol</source>
<year iso-8601-date="2012">2012</year>
<volume>33</volume>
<fpage>83</fpage>
<lpage>9</lpage>
<pub-id pub-id-type="doi">10.3174/ajnr.A2880</pub-id>
<pub-id pub-id-type="pmid">22173769</pub-id>
<pub-id pub-id-type="pmcid">PMC6345364</pub-id>
</element-citation>
</ref>
<ref id="B12">
<label>12</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Collins</surname>
<given-names>DW</given-names>
</name>
<name>
<surname>Kimura</surname>
<given-names>D</given-names>
</name>
</person-group>
<article-title>A large sex difference on a two-dimensional mental rotation task</article-title>
<source>Behav Neurosci</source>
<year iso-8601-date="1997">1997</year>
<volume>111</volume>
<fpage>845</fpage>
<lpage>9</lpage>
<pub-id pub-id-type="doi">10.1037//0735-7044.111.4.845</pub-id>
<pub-id pub-id-type="pmid">9267662</pub-id>
</element-citation>
</ref>
<ref id="B13">
<label>13</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cui</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>W</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Age- and sex-related differences in cortical morphology and their relationships with cognitive performance in healthy middle-aged and older adults</article-title>
<source>Quant Imaging Med Surg</source>
<year iso-8601-date="2023">2023</year>
<volume>13</volume>
<fpage>1083</fpage>
<lpage>99</lpage>
<pub-id pub-id-type="doi">10.21037/qims-22-583</pub-id>
<pub-id pub-id-type="pmid">36819243</pub-id>
<pub-id pub-id-type="pmcid">PMC9929420</pub-id>
</element-citation>
</ref>
<ref id="B14">
<label>14</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dai</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>F</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>P</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Gray matter correlates of migraine and gender effect: A meta-analysis of voxel-based morphometry studies</article-title>
<source>Neuroscience</source>
<year iso-8601-date="2015">2015</year>
<volume>299</volume>
<fpage>88</fpage>
<lpage>96</lpage>
<pub-id pub-id-type="doi">10.1016/j.neuroscience.2015.04.066</pub-id>
<pub-id pub-id-type="pmid">25943478</pub-id>
</element-citation>
</ref>
<ref id="B15">
<label>15</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salminen</surname>
<given-names>LE</given-names>
</name>
<name>
<surname>Tubi</surname>
<given-names>MA</given-names>
</name>
<name>
<surname>Bright</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Thomopoulos</surname>
<given-names>SI</given-names>
</name>
<name>
<surname>Wieand</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Thompson</surname>
<given-names>PM</given-names>
</name>
</person-group>
<article-title>Sex is a defining feature of neuroimaging phenotypes in major brain disorders</article-title>
<source>Hum Brain Mapp</source>
<year iso-8601-date="2022">2022</year>
<volume>43</volume>
<fpage>500</fpage>
<lpage>42</lpage>
<pub-id pub-id-type="doi">10.1002/hbm.25438</pub-id>
<pub-id pub-id-type="pmid">33949018</pub-id>
<pub-id pub-id-type="pmcid">PMC8805690</pub-id>
</element-citation>
</ref>
<ref id="B16">
<label>16</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Besson</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Parrish</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Katsaggelos</surname>
<given-names>AK</given-names>
</name>
<name>
<surname>Bandt</surname>
<given-names>SK</given-names>
</name>
</person-group>
<article-title>Geometric deep learning on brain shape predicts sex and age</article-title>
<source>Comput Med Imaging Graph</source>
<year iso-8601-date="2021">2021</year>
<volume>91</volume>
<elocation-id>101939</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.compmedimag.2021.101939</pub-id>
<pub-id pub-id-type="pmid">34082280</pub-id>
</element-citation>
</ref>
<ref id="B17">
<label>17</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bi</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Abrol</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Calhoun</surname>
<given-names>V</given-names>
</name>
</person-group>
<article-title>Prediction of gender from longitudinal MRI data via deep learning on adolescent data reveals unique patterns associated with brain structure and change over a two-year period</article-title>
<source>J Neurosci Methods</source>
<year iso-8601-date="2023">2023</year>
<volume>384</volume>
<elocation-id>109744</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.jneumeth.2022.109744</pub-id>
<pub-id pub-id-type="pmid">36400261</pub-id>
</element-citation>
</ref>
<ref id="B18">
<label>18</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brennan</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>J</given-names>
</name>
</person-group>
<article-title>Morphometrical Brain Markers of Sex Difference</article-title>
<source>Cereb Cortex</source>
<year iso-8601-date="2021">2021</year>
<volume>31</volume>
<fpage>3641</fpage>
<lpage>9</lpage>
<pub-id pub-id-type="doi">10.1093/cercor/bhab037</pub-id>
<pub-id pub-id-type="pmid">33774662</pub-id>
</element-citation>
</ref>
<ref id="B19">
<label>19</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Bayanagari</surname>
<given-names>VL</given-names>
</name>
<name>
<surname>Chung</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Lui</surname>
<given-names>YW</given-names>
</name>
</person-group>
<article-title>Deep learning with diffusion MRI as in vivo microscope reveals sex-related differences in human white matter microstructure</article-title>
<source>Sci Rep</source>
<year iso-8601-date="2024">2024</year>
<volume>14</volume>
<elocation-id>9835</elocation-id>
<pub-id pub-id-type="doi">10.1038/s41598-024-60340-y</pub-id>
<pub-id pub-id-type="pmid">38744901</pub-id>
<pub-id pub-id-type="pmcid">PMC11094063</pub-id>
</element-citation>
</ref>
<ref id="B20">
<label>20</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dibaji</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Ospel</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Souza</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Bento</surname>
<given-names>M</given-names>
</name>
</person-group>
<article-title>Sex differences in brain MRI using deep learning toward fairer healthcare outcomes</article-title>
<source>Front Comput Neurosci</source>
<year iso-8601-date="2024">2024</year>
<volume>18</volume>
<elocation-id>1452457</elocation-id>
<pub-id pub-id-type="doi">10.3389/fncom.2024.1452457</pub-id>
<pub-id pub-id-type="pmid">39606583</pub-id>
<pub-id pub-id-type="pmcid">PMC11598355</pub-id>
</element-citation>
</ref>
<ref id="B21">
<label>21</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dhamala</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Jamison</surname>
<given-names>KW</given-names>
</name>
<name>
<surname>Sabuncu</surname>
<given-names>MR</given-names>
</name>
<name>
<surname>Kuceyeski</surname>
<given-names>A</given-names>
</name>
</person-group>
<article-title>Sex classification using long-range temporal dependence of resting-state functional MRI time series</article-title>
<source>Hum Brain Mapp</source>
<year iso-8601-date="2020">2020</year>
<volume>41</volume>
<fpage>3567</fpage>
<lpage>79</lpage>
<pub-id pub-id-type="doi">10.1002/hbm.25030</pub-id>
<pub-id pub-id-type="pmid">32627300</pub-id>
<pub-id pub-id-type="pmcid">PMC7416025</pub-id>
</element-citation>
</ref>
<ref id="B22">
<label>22</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fan</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>H</given-names>
</name>
</person-group>
<article-title>A Deep Network Model on Dynamic Functional Connectivity With Applications to Gender Classification and Intelligence Prediction</article-title>
<source>Front Neurosci</source>
<year iso-8601-date="2020">2020</year>
<volume>14</volume>
<elocation-id>881</elocation-id>
<pub-id pub-id-type="doi">10.3389/fnins.2020.00881</pub-id>
<pub-id pub-id-type="pmid">33013292</pub-id>
<pub-id pub-id-type="pmcid">PMC7461846</pub-id>
</element-citation>
</ref>
<ref id="B23">
<label>23</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feis</surname>
<given-names>DL</given-names>
</name>
<name>
<surname>Brodersen</surname>
<given-names>KH</given-names>
</name>
<name>
<surname>von Cramon</surname>
<given-names>DY</given-names>
</name>
<name>
<surname>Luders</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Tittgemeyer</surname>
<given-names>M</given-names>
</name>
</person-group>
<article-title>Decoding gender dimorphism of the human brain using multimodal anatomical and diffusion MRI data</article-title>
<source>Neuroimage</source>
<year iso-8601-date="2013">2013</year>
<volume>70</volume>
<fpage>250</fpage>
<lpage>7</lpage>
<pub-id pub-id-type="doi">10.1016/j.neuroimage.2012.12.068</pub-id>
<pub-id pub-id-type="pmid">23298750</pub-id>
</element-citation>
</ref>
<ref id="B24">
<label>24</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ge</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Frangou</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Vila-Rodriguez</surname>
<given-names>F</given-names>
</name>
</person-group>
<article-title>Sex effects on cortical morphological networks in healthy young adults</article-title>
<source>Neuroimage</source>
<year iso-8601-date="2021">2021</year>
<volume>233</volume>
<elocation-id>117945</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.neuroimage.2021.117945</pub-id>
<pub-id pub-id-type="pmid">33711482</pub-id>
</element-citation>
</ref>
<ref id="B25">
<label>25</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>L</given-names>
</name>
</person-group>
<article-title>Gender identification based on human brain structural MRI with a multi-layer 3D convolution extreme learning machine</article-title>
<source>Cogn Comput Syst</source>
<year iso-8601-date="2019">2019</year>
<volume>1</volume>
<fpage>91</fpage>
<lpage>6</lpage>
<pub-id pub-id-type="doi">10.1049/ccs.2018.0018</pub-id>
</element-citation>
</ref>
<ref id="B26">
<label>26</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jeon</surname>
<given-names>YJ</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>SE</given-names>
</name>
<name>
<surname>Baek</surname>
<given-names>HM</given-names>
</name>
</person-group>
<article-title>Predicting Brain Age and Gender from Brain Volume Data Using Variational Quantum Circuits</article-title>
<source>Brain Sci</source>
<year iso-8601-date="2024">2024</year>
<volume>14</volume>
<elocation-id>401</elocation-id>
<pub-id pub-id-type="doi">10.3390/brainsci14040401</pub-id>
<pub-id pub-id-type="pmid">38672050</pub-id>
<pub-id pub-id-type="pmcid">PMC11048383</pub-id>
</element-citation>
</ref>
<ref id="B27">
<label>27</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leming</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Suckling</surname>
<given-names>J</given-names>
</name>
</person-group>
<article-title>Deep learning for sex classification in resting-state and task functional brain networks from the UK Biobank</article-title>
<source>Neuroimage</source>
<year iso-8601-date="2021">2021</year>
<volume>241</volume>
<elocation-id>118409</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.neuroimage.2021.118409</pub-id>
<pub-id pub-id-type="pmid">34293465</pub-id>
<pub-id pub-id-type="pmcid">PMC8456752</pub-id>
</element-citation>
</ref>
<ref id="B28">
<label>28</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>D</given-names>
</name>
</person-group>
<article-title>Gender Identification of Human Cortical 3-D Morphology Using Hierarchical Sparsity</article-title>
<source>Front Hum Neurosci</source>
<year iso-8601-date="2019">2019</year>
<volume>13</volume>
<elocation-id>29</elocation-id>
<pub-id pub-id-type="doi">10.3389/fnhum.2019.00029</pub-id>
<pub-id pub-id-type="pmid">30792634</pub-id>
<pub-id pub-id-type="pmcid">PMC6374327</pub-id>
</element-citation>
</ref>
<ref id="B29">
<label>29</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Matte</surname>
<given-names>Bon G</given-names>
</name>
<name>
<surname>Kraft</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Comasco</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Derntl</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Kaufmann</surname>
<given-names>T</given-names>
</name>
</person-group>
<article-title>Modeling brain sex in the limbic system as phenotype for female-prevalent mental disorders</article-title>
<source>Biol Sex Differ</source>
<year iso-8601-date="2024">2024</year>
<volume>15</volume>
<elocation-id>42</elocation-id>
<pub-id pub-id-type="doi">10.1186/s13293-024-00615-1</pub-id>
<pub-id pub-id-type="pmid">38750598</pub-id>
<pub-id pub-id-type="pmcid">PMC11097569</pub-id>
</element-citation>
</ref>
<ref id="B30">
<label>30</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mendes</surname>
<given-names>SL</given-names>
</name>
<name>
<surname>Pinaya</surname>
<given-names>WHL</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Sato</surname>
<given-names>JR</given-names>
</name>
</person-group>
<article-title>Estimating Gender and Age from Brain Structural MRI of Children and Adolescents: A 3D Convolutional Neural Network Multitask Learning Model</article-title>
<source>Comput Intell Neurosci</source>
<year iso-8601-date="2021">2021</year>
<volume>2021</volume>
<elocation-id>5550914</elocation-id>
<pub-id pub-id-type="doi">10.1155/2021/5550914</pub-id>
<pub-id pub-id-type="pmid">34122531</pub-id>
<pub-id pub-id-type="pmcid">PMC8172319</pub-id>
</element-citation>
</ref>
<ref id="B31">
<label>31</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nebli</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Rekik</surname>
<given-names>I</given-names>
</name>
</person-group>
<article-title>Gender differences in cortical morphological networks</article-title>
<source>Brain Imaging Behav</source>
<year iso-8601-date="2020">2020</year>
<volume>14</volume>
<fpage>1831</fpage>
<lpage>9</lpage>
<pub-id pub-id-type="doi">10.1007/s11682-019-00123-6</pub-id>
<pub-id pub-id-type="pmid">31102167</pub-id>
<pub-id pub-id-type="pmcid">PMC7572349</pub-id>
</element-citation>
</ref>
<ref id="B32">
<label>32</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Patel</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Orlichenko</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Patel</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Qu</surname>
<given-names>G</given-names>
</name>
<name>
<surname>Wilson</surname>
<given-names>TW</given-names>
</name>
<name>
<surname>Stephen</surname>
<given-names>JM</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Explainable multimodal graph isomorphism network for interpreting sex differences in adolescent neurodevelopment</article-title>
<source>Appl Sci</source>
<year iso-8601-date="2024">2024</year>
<volume>14</volume>
<elocation-id>4144</elocation-id>
<pub-id pub-id-type="doi">10.3390/app14104144</pub-id>
</element-citation>
</ref>
<ref id="B33">
<label>33</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ryali</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>de Los Angeles</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Supekar</surname>
<given-names>K</given-names>
</name>
<name>
<surname>Menon</surname>
<given-names>V</given-names>
</name>
</person-group>
<article-title>Deep learning models reveal replicable, generalizable, and behaviorally relevant sex differences in human functional brain organization</article-title>
<source>Proc Natl Acad Sci U S A</source>
<year iso-8601-date="2024">2024</year>
<volume>121</volume>
<elocation-id>e2310012121</elocation-id>
<pub-id pub-id-type="doi">10.1073/pnas.2310012121</pub-id>
<pub-id pub-id-type="pmid">38377194</pub-id>
<pub-id pub-id-type="pmcid">PMC10907309</pub-id>
</element-citation>
</ref>
<ref id="B34">
<label>34</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sanchis-Segura</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Aguirre</surname>
<given-names>N</given-names>
</name>
<name>
<surname>Cruz-Gómez</surname>
<given-names>ÁJ</given-names>
</name>
<name>
<surname>Félix</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Forn</surname>
<given-names>C</given-names>
</name>
</person-group>
<article-title>Beyond “sex prediction”: Estimating and interpreting multivariate sex differences and similarities in the brain</article-title>
<source>Neuroimage</source>
<year iso-8601-date="2022">2022</year>
<volume>257</volume>
<elocation-id>119343</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.neuroimage.2022.119343</pub-id>
<pub-id pub-id-type="pmid">35654377</pub-id>
</element-citation>
</ref>
<ref id="B35">
<label>35</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Satterthwaite</surname>
<given-names>TD</given-names>
</name>
<name>
<surname>Wolf</surname>
<given-names>DH</given-names>
</name>
<name>
<surname>Roalf</surname>
<given-names>DR</given-names>
</name>
<name>
<surname>Ruparel</surname>
<given-names>K</given-names>
</name>
<name>
<surname>Erus</surname>
<given-names>G</given-names>
</name>
<name>
<surname>Vandekar</surname>
<given-names>S</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Linked Sex Differences in Cognition and Functional Connectivity in Youth</article-title>
<source>Cereb Cortex</source>
<year iso-8601-date="2015">2015</year>
<volume>25</volume>
<fpage>2383</fpage>
<lpage>94</lpage>
<pub-id pub-id-type="doi">10.1093/cercor/bhu036</pub-id>
<pub-id pub-id-type="pmid">24646613</pub-id>
<pub-id pub-id-type="pmcid">PMC4537416</pub-id>
</element-citation>
</ref>
<ref id="B36">
<label>36</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sen</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Parhi</surname>
<given-names>KK</given-names>
</name>
</person-group>
<article-title>Predicting Biological Gender and Intelligence From fMRI via Dynamic Functional Connectivity</article-title>
<source>IEEE Trans Biomed Eng</source>
<year iso-8601-date="2021">2021</year>
<volume>68</volume>
<fpage>815</fpage>
<lpage>25</lpage>
<pub-id pub-id-type="doi">10.1109/TBME.2020.3011363</pub-id>
<pub-id pub-id-type="pmid">32746070</pub-id>
</element-citation>
</ref>
<ref id="B37">
<label>37</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sepehrband</surname>
<given-names>F</given-names>
</name>
<name>
<surname>Lynch</surname>
<given-names>KM</given-names>
</name>
<name>
<surname>Cabeen</surname>
<given-names>RP</given-names>
</name>
<name>
<surname>Gonzalez-Zacarias</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>L</given-names>
</name>
<name>
<surname>D’Arcy</surname>
<given-names>M</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Neuroanatomical morphometric characterization of sex differences in youth using statistical learning</article-title>
<source>Neuroimage</source>
<year iso-8601-date="2018">2018</year>
<volume>172</volume>
<fpage>217</fpage>
<lpage>27</lpage>
<pub-id pub-id-type="doi">10.1016/j.neuroimage.2018.01.065</pub-id>
<pub-id pub-id-type="pmid">29414494</pub-id>
<pub-id pub-id-type="pmcid">PMC5967879</pub-id>
</element-citation>
</ref>
<ref id="B38">
<label>38</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shanmugan</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Seidlitz</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Cui</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Adebimpe</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Bassett</surname>
<given-names>DS</given-names>
</name>
<name>
<surname>Bertolero</surname>
<given-names>MA</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Sex differences in the functional topography of association networks in youth</article-title>
<source>Proc Natl Acad Sci U S A</source>
<year iso-8601-date="2022">2022</year>
<volume>119</volume>
<elocation-id>e2110416119</elocation-id>
<pub-id pub-id-type="doi">10.1073/pnas.2110416119</pub-id>
<pub-id pub-id-type="pmid">35939696</pub-id>
<pub-id pub-id-type="pmcid">PMC9388107</pub-id>
</element-citation>
</ref>
<ref id="B39">
<label>39</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>F</given-names>
</name>
<name>
<surname>Zang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>D</given-names>
</name>
</person-group>
<article-title>Combined structural and resting-state functional MRI analysis of sexual dimorphism in the young adult human brain: an MVPA approach</article-title>
<source>Neuroimage</source>
<year iso-8601-date="2012">2012</year>
<volume>61</volume>
<fpage>931</fpage>
<lpage>40</lpage>
<pub-id pub-id-type="doi">10.1016/j.neuroimage.2012.03.080</pub-id>
<pub-id pub-id-type="pmid">22498657</pub-id>
</element-citation>
</ref>
<ref id="B40">
<label>40</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weber</surname>
<given-names>KA 2nd</given-names>
</name>
<name>
<surname>Teplin</surname>
<given-names>ZM</given-names>
</name>
<name>
<surname>Wager</surname>
<given-names>TD</given-names>
</name>
<name>
<surname>Law</surname>
<given-names>CSW</given-names>
</name>
<name>
<surname>Prabhakar</surname>
<given-names>NK</given-names>
</name>
<name>
<surname>Ashar</surname>
<given-names>YK</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Confounds in neuroimaging: A clear case of sex as a confound in brain-based prediction</article-title>
<source>Front Neurol</source>
<year iso-8601-date="2022">2022</year>
<volume>13</volume>
<elocation-id>960760</elocation-id>
<pub-id pub-id-type="doi">10.3389/fneur.2022.960760</pub-id>
<pub-id pub-id-type="pmid">36601297</pub-id>
<pub-id pub-id-type="pmcid">PMC9806266</pub-id>
</element-citation>
</ref>
<ref id="B41">
<label>41</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weis</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Patil</surname>
<given-names>KR</given-names>
</name>
<name>
<surname>Hoffstaedter</surname>
<given-names>F</given-names>
</name>
<name>
<surname>Nostro</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Yeo</surname>
<given-names>BTT</given-names>
</name>
<name>
<surname>Eickhoff</surname>
<given-names>SB</given-names>
</name>
</person-group>
<article-title>Sex Classification by Resting State Brain Connectivity</article-title>
<source>Cereb Cortex</source>
<year iso-8601-date="2020">2020</year>
<volume>30</volume>
<fpage>824</fpage>
<lpage>35</lpage>
<pub-id pub-id-type="doi">10.1093/cercor/bhz129</pub-id>
<pub-id pub-id-type="pmid">31251328</pub-id>
<pub-id pub-id-type="pmcid">PMC7444737</pub-id>
</element-citation>
</ref>
<ref id="B42">
<label>42</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Wan</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Ming</surname>
<given-names>D</given-names>
</name>
</person-group>
<article-title>Gender Differences Are Encoded Differently in the Structure and Function of the Human Brain Revealed by Multimodal MRI</article-title>
<source>Front Hum Neurosci</source>
<year iso-8601-date="2020">2020</year>
<volume>14</volume>
<elocation-id>244</elocation-id>
<pub-id pub-id-type="doi">10.3389/fnhum.2020.00244</pub-id>
<pub-id pub-id-type="pmid">32792927</pub-id>
<pub-id pub-id-type="pmcid">PMC7385398</pub-id>
</element-citation>
</ref>
<ref id="B43">
<label>43</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xin</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y</given-names>
</name>
</person-group>
<article-title>Brain Differences Between Men and Women: Evidence From Deep Learning</article-title>
<source>Front Neurosci</source>
<year iso-8601-date="2019">2019</year>
<volume>13</volume>
<elocation-id>185</elocation-id>
<pub-id pub-id-type="doi">10.3389/fnins.2019.00185</pub-id>
<pub-id pub-id-type="pmid">30906246</pub-id>
<pub-id pub-id-type="pmcid">PMC6418873</pub-id>
</element-citation>
</ref>
<ref id="B44">
<label>44</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Ou</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>YJ</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>LH</given-names>
</name>
</person-group>
<article-title>Sex Differences in Functional Brain Networks for Language</article-title>
<source>Cereb Cortex</source>
<year iso-8601-date="2020">2020</year>
<volume>30</volume>
<fpage>1528</fpage>
<lpage>37</lpage>
<pub-id pub-id-type="doi">10.1093/cercor/bhz184</pub-id>
<pub-id pub-id-type="pmid">31512720</pub-id>
</element-citation>
</ref>
<ref id="B45">
<label>45</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>CC</given-names>
</name>
<name>
<surname>Lo</surname>
<given-names>CZ</given-names>
</name>
<name>
<surname>Langley</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Desrivières</surname>
<given-names>S</given-names>
</name>
<etal>et al.</etal>
<collab>IMAGEN consortium</collab>
</person-group>
<article-title>The Human Brain Is Best Described as Being on a Female/Male Continuum: Evidence from a Neuroimaging Connectivity Study</article-title>
<source>Cereb Cortex</source>
<year iso-8601-date="2021">2021</year>
<volume>31</volume>
<fpage>3021</fpage>
<lpage>33</lpage>
<pub-id pub-id-type="doi">10.1093/cercor/bhaa408</pub-id>
<pub-id pub-id-type="pmid">33471126</pub-id>
<pub-id pub-id-type="pmcid">PMC8107794</pub-id>
</element-citation>
</ref>
<ref id="B46">
<label>46</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>M</given-names>
</name>
</person-group>
<article-title>Multimodal Image Analysis of Sexual Dimorphism in Developing Childhood Brain</article-title>
<source>Brain Topogr</source>
<year iso-8601-date="2021">2021</year>
<volume>34</volume>
<fpage>257</fpage>
<lpage>68</lpage>
<pub-id pub-id-type="doi">10.1007/s10548-021-00823-7</pub-id>
<pub-id pub-id-type="pmid">33630209</pub-id>
</element-citation>
</ref>
<ref id="B47">
<label>47</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yeung</surname>
<given-names>HW</given-names>
</name>
<name>
<surname>Stolicyn</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Buchanan</surname>
<given-names>CR</given-names>
</name>
<name>
<surname>Tucker-Drob</surname>
<given-names>EM</given-names>
</name>
<name>
<surname>Bastin</surname>
<given-names>ME</given-names>
</name>
<name>
<surname>Luz</surname>
<given-names>S</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Predicting sex, age, general cognition and mental health with machine learning on brain structural connectomes</article-title>
<source>Hum Brain Mapp</source>
<year iso-8601-date="2023">2023</year>
<volume>44</volume>
<fpage>1913</fpage>
<lpage>33</lpage>
<pub-id pub-id-type="doi">10.1002/hbm.26182</pub-id>
<pub-id pub-id-type="pmid">36541441</pub-id>
<pub-id pub-id-type="pmcid">PMC9980898</pub-id>
</element-citation>
</ref>
<ref id="B48">
<label>48</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Metoki</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Chauvin</surname>
<given-names>RJ</given-names>
</name>
<name>
<surname>Gordon</surname>
<given-names>EM</given-names>
</name>
<name>
<surname>Laumann</surname>
<given-names>TO</given-names>
</name>
<name>
<surname>Kay</surname>
<given-names>BP</given-names>
</name>
<name>
<surname>Krimmel</surname>
<given-names>SR</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Brain functional connectivity, but not neuroanatomy, captures the interrelationship between sex and gender in preadolescents</article-title>
<comment>bioRxiv [Preprint]. 2024 [cited 2026 Jan 19]. Available from: <uri xlink:href="https://pmc.ncbi.nlm.nih.gov/articles/PMC11565917/">https://pmc.ncbi.nlm.nih.gov/articles/PMC11565917/</uri></comment>
</element-citation>
</ref>
</ref-list>
</back>
</article>