<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "https://jats.nlm.nih.gov/publishing/1.3/JATS-journalpublishing1-3.dtd"><article xml:lang="en" article-type="research-article" dtd-version="1.3" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/"><front><journal-meta><journal-id journal-id-type="issn">2527-2799</journal-id><journal-title-group><journal-title>Bioeksperimen: Jurnal Penelitian Biologi</journal-title><abbrev-journal-title>Bioeksperimen</abbrev-journal-title></journal-title-group><issn pub-type="epub">2527-2799</issn><issn pub-type="ppub">2460-1365</issn><publisher><publisher-name>Universitas Muhammadiyah Surakarta</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.23917/bioeksperimen.v12i1.14233</article-id><title-group><article-title>Phylogenetic Analysis of Representative Mammalian MUC16 Supported by Comparative SEA Domain and Tandem Repeat Variation</article-title></title-group><contrib-group><contrib contrib-type="author"><name><surname>Foenna</surname><given-names>Yudi Gebri</given-names></name><address><country>Indonesia</country><email>yudigebri97@gmail.com</email></address><xref ref-type="aff" rid="AFF-1"></xref><xref ref-type="corresp" rid="cor-0"></xref></contrib><contrib contrib-type="author"><name><surname>Yulisma</surname><given-names>Ardhana</given-names></name><address><country>Indonesia</country></address><xref ref-type="aff" rid="AFF-2"></xref></contrib><contrib contrib-type="author"><name><surname>Calapoğlu</surname><given-names>Nilüfer Şahin</given-names></name><address><country>Turkey</country></address><xref ref-type="aff" rid="AFF-3"></xref></contrib></contrib-group><aff id="AFF-1"><institution-wrap><institution>Universitas Medan Area</institution><institution-id institution-id-type="ror">https://ror.org/046581250</institution-id></institution-wrap><country country="ID">Indonesia</country></aff><aff id="AFF-2">Universitas U’budiyah Indonesia</aff><aff id="AFF-3"><institution-wrap><institution>Süleyman Demirel Üniversitesi</institution><institution-id institution-id-type="ror">https://ror.org/04fjtte88</institution-id></institution-wrap><country country="TR">Türkiye</country></aff><author-notes><corresp id="cor-0">Corresponding author: Yudi Gebri Foenna, Universitas Medan Area.  Email: <email>yudigebri97@gmail.com</email></corresp></author-notes><pub-date date-type="pub" iso-8601-date="2026-3-31" publication-format="electronic"><day>31</day><month>3</month><year>2026</year></pub-date><volume>12</volume><issue>1</issue><fpage>1</fpage><lpage>13</lpage><history><date date-type="received" iso-8601-date="2025-12-12"><day>12</day><month>12</month><year>2025</year></date><date date-type="rev-recd" iso-8601-date="2026-2-6"><day>6</day><month>2</month><year>2026</year></date><date date-type="accepted" iso-8601-date="2026-3-31"><day>31</day><month>3</month><year>2026</year></date></history><permissions><copyright-statement>Copyright (c) 2026 Bioeksperimen: Jurnal Penelitian Biologi</copyright-statement><copyright-year>2026</copyright-year><copyright-holder>Bioeksperimen: Jurnal Penelitian Biologi</copyright-holder><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by-nc/4.0/"><ali:license_ref xmlns:ali="http://www.niso.org/schemas/ali/1.0/">https://creativecommons.org/licenses/by-nc/4.0/</ali:license_ref><license-p>This work is licensed under a Creative Commons Attribution-NonCommercial 4.0 International License.</license-p></license></permissions><self-uri xlink:href="https://journals2.ums.ac.id/bioeksperimen/article/view/14233" xlink:title="Phylogenetic Analysis of Representative Mammalian MUC16 Supported by Comparative SEA Domain and Tandem Repeat Variation">Phylogenetic Analysis of Representative Mammalian MUC16 Supported by Comparative SEA Domain and Tandem Repeat Variation</self-uri><abstract><p>MUC16 is one of the largest mammalian mucins and exhibits substantial evolutionary variation in both sequence composition and structural modularity. Comparative analysis of SEA domain composition and tandem repeat architecture is therefore essential for understanding the evolutionary diversification of this gene across mammals. This study investigates the phylogenetic relationships of mammalian MUC16 and examines how variation in SEA domains and tandem repeats contributes to lineage-specific structural divergence. MUC16 nucleotide and protein sequences from 20 mammalian species representing Primates and Rodentia were retrieved from public databases. Multiple sequence alignment and phylogenetic reconstruction were conducted using the Neighbor-Joining method with 1,000 bootstrap replicates. SEA domains were annotated using the SMART database, while tandem repeats were identified with Tandem Repeats Finder. Structural features were evaluated using descriptive statistics, hierarchical clustering, and Spearman’s rank correlation analysis. Phylogenetic reconstruction revealed a clear molecular separation between Primates and Rodentia with strong bootstrap support. Primate species generally exhibited conserved sequences and expanded SEA domain and tandem repeat architectures, whereas rodents displayed higher sequence divergence and reduced structural complexity. A moderate positive association between SEA domain number and tandem repeat count (ρ = 0.44) was observed, although this relationship did not reach statistical significance and is therefore interpreted as a biologically suggestive trend rather than evidence of coordinated evolution. Overall, the results indicate that MUC16 evolution follows lineage-dependent patterns shaped by both sequence divergence and domain-level remodeling. This comparative framework provides an evolutionary context for understanding structural diversity in mammalian mucins and offers a foundation for future functional and genomic investigations.</p></abstract><kwd-group><kwd>MUC16</kwd><kwd>SEA domain</kwd><kwd>tandem repeat</kwd><kwd>mammalian evolution</kwd><kwd>phylogenetics</kwd><kwd>comparative genomics</kwd></kwd-group><custom-meta-group><custom-meta><meta-name>File created by JATS Editor</meta-name><meta-value><ext-link xlink:href="https://jatseditor.com" xlink:title="JATS Editor" ext-link-type="uri">JATS Editor</ext-link></meta-value></custom-meta><custom-meta><meta-name>issue-created-year</meta-name><meta-value>2026</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec><title>Introduction</title><p>Recent advances in comparative genomic and proteomic have revealed substantial evolutionary diversity within mucin gene families, particularly MUC16, one of the largest and most structurally complex transmembrane glycoproteins in mammals <xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref><xref ref-type="bibr" rid="BIBR-32">(Zhang et al., 2024)</xref>. MUC16 represents a compelling model for studying the evolutionary dynamics of large, repeat-rich genes that combine extensive sequence divergence with conserved functional architecture <xref ref-type="bibr" rid="BIBR-19">(Pajic et al., 2022)</xref>. Comparative analyses across mammals indicate that MUC16 exhibits pronounced interspecies variation in gene length, repeat organization, and domain composition, suggesting that its evolution has been shaped by lineage-specific selective pressures <xref ref-type="bibr" rid="BIBR-19">(Pajic et al., 2022)</xref><xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref>.</p><p>In human, the MUC16 gene is located on chromosome 19 (19p13.2) and spans more than 430 kb (<xref ref-type="bibr" rid="BIBR-21">(Perez &amp; Gipson, 2008)</xref>; <xref ref-type="bibr" rid="BIBR-3">(Aithal et al., 2018)</xref>; <xref ref-type="bibr" rid="BIBR-32">(Zhang et al., 2024)</xref>), encoding a protein exceeding 22,000 amino acids (<xref ref-type="bibr" rid="BIBR-21">(Perez &amp; Gipson, 2008)</xref>; <xref ref-type="bibr" rid="BIBR-32">(Zhang et al., 2024)</xref>; <xref ref-type="bibr" rid="BIBR-5">(Das et al., 2015)</xref>). Its extraordinary size is largely attributable to extensive tandem repeat regions and the presence of multiple SEA (sea urchin sperm protein, enterokinase, agrin) domains, which are characteristic features of membrane-associated mucins. These structural modules are functionally important for proteolytic cleavage, membrane tethering, and regulation of extracellular interactions <xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref><xref ref-type="bibr" rid="BIBR-30">(White et al., 2022)</xref>. Comparative genomic studies have shown that while chromosomal synteny of MUC16 is broadly conserved among mammals, repeat-rich regions and domain copy numbers vary substantially, indicating recurrent expansion and contraction events during evolution <xref ref-type="bibr" rid="BIBR-12">(Gipson et al., 2014)</xref>.</p><p>Functionally, MUC16 contributes to epithelial barrier integrity, cell-cell interactions, and modulation of immune responses <xref ref-type="bibr" rid="BIBR-14">(Kufe, 2022)</xref>. In specific biological context, including reproduction and cancer, altered MUC16 expression or processing has been associated with changes in cell adhesion (<xref rid="BIBR-21" ref-type="bibr">(Perez &amp; Gipson, 2008)</xref>; <xref rid="BIBR-13" ref-type="bibr">(Gipson et al., 2008)</xref>), signaling pathways <xref ref-type="bibr" rid="BIBR-12">(Gipson et al., 2014)</xref>, and immune recognition <xref ref-type="bibr" rid="BIBR-32">(Zhang et al., 2024)</xref>. However, most previous studies have emphasized these biomedical roles, whereas the evolutionary diversification of MUC16 across mammalian lineages has received comparatively limited attention. As a result, the extent to which structural variation in MUC16 reflects broader evolutionary patterns remains insufficiently characterized <xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref><xref ref-type="bibr" rid="BIBR-30">(White et al., 2022)</xref>.</p><p>Among the defining features of MUC16, SEA domains and tandem repeat arrays are particularly informative from an evolutionary perspective. SEA domains are evolutionarily conserved modules present in several mucins and are implicated in protein cleavage and structural stability. Although their core structure is conserved, both the number and sequence composition of SEA domains vary among species, suggesting lineage-dependent duplication and divergence <xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref><xref ref-type="bibr" rid="BIBR-7">(Duraisamy et al., 2007)</xref><xref ref-type="bibr" rid="BIBR-30">(White et al., 2022)</xref>. Tandem repeat regions, by contrast, evolve rapidly through mechanisms such as replication slippage and unequal crossing-over, generating species-specific architectures that influence glycosylation density and surface properties. Variation in repeat number (VNTR) and organization has therefore been widely used as an indicator of molecular adaptation in mucin genes <xref ref-type="bibr" rid="BIBR-26">(Sulovari et al., 2019)</xref>.</p><p>Although prior studies have mapped the genomic structure of MUC16 across several species, most focus narrowly on its biomedical or diagnostic roles rather than its evolutionary context <xref ref-type="bibr" rid="BIBR-7">(Duraisamy et al., 2007)</xref><xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref>. Phylogenetic investigations are scarce and often limited by incomplete sequence annotation or by neglecting repetitive regions <xref rid="BIBR-7" ref-type="bibr">(Duraisamy et al., 2007)</xref><xref ref-type="bibr" rid="BIBR-17">(Maeda et al., 2004)</xref>. Consequently, the evolutionary relationships among mammalian MUC16 orthologs and the contribution of domain-level remodeling to lineage divergence remain incompletely resolved.</p><p>In order to address this gap, the present study conducts a comparative phylogenetic analysis of MUC16 across representative mammalian species, with particular emphasis on the relationship between evolutionary divergence, SEA domain architecture, and tandem repeat variation. By integrating sequence-based phylogenetic reconstruction with structural annotation and quantitative analysis, this study aims to clarify how modular features of MUC16 have diversified among major mammalian lineages. Rather than testing functional mechanisms directly, the analysis provides an evolutionary framework that generates biologically informed hypotheses regarding the structural evolution of MUC16 and its potential implications for mammalian adaptation.</p></sec><sec><title>Materials and methods</title><sec><title>1. Study Design and Workflow</title><p>This study employed a comparative molecular evolutionary framework to investigate phylogenetic relationships and structural variation of the MUC16 gene across representative mammalian species. The analytical workflow consisted of sequence retrieval, multiple sequence alignment, phylogenetic reconstruction, structural annotation of SEA domains and tandem repeats, and quantitative statistical analysis. All analyses were conducted between September and November 2025 at the Ecology and Physiology Laboratory, Universitas Medan Area.</p></sec><sec><title>2. Hardware and Software</title><p>All computational analyses were performed on a Lenovo LOQ Essential 15IAX9E labtop (Intel® CoreTM i5-12450HX (2,4 GHz), 12 GB RAM, RTX3050 GPU, 512 GB SSD and a Windows 11 operating system. Sequence retrieval, alignment, and phylogenetic reconstruction were carried out using MEGA version 12. SEA domain identification was performed using the SMART (Simple Modular Architecture Research Tool) web server, while tandem repeat detection was conducted using Tandem Repeats Finder (TRF). Statistical analyses were performed using IBM SPSS Statistics version 20, and clustering heatmaps were generated using RStudio. Figures were finalized using Microsoft Excel.</p></sec><sec><title>3. Data Set</title><p>MUC16 nucleotide sequences from twenty mammalian species representing the orders Primates and Rodentia were retrieved from the NCBI Nucleotide Database using the Nucleotide Search interface. Species were selected based on the availability of complete or high-quality partial MUC16 gene sequences. The nucleotide accession numbers obtained were as follows: <italic>Homo sapiens</italic> (NM 001401501.2), <italic>Pan paniscus</italic> (XM 055102885.2), <italic>Gorilla gorilla gorilla</italic> (XM 055371568.2), <italic>Symphalangus syndactylus</italic> (XM 055237836.1), <italic>Nomascus leucogenys</italic> (XM 030821778.1), <italic>Hylobates moloch</italic> (XM 058425754.1), <italic>Papio anubis</italic> (XM 031659988.1), <italic>Theropithecus gelada</italic> (XM 025367835.1), <italic>Cercocebus atys</italic> (XM 012077369.1), <italic>Macaca mulatta</italic> (XM 028840242.1), <italic>Chlorocebus sabaeus</italic> (XM 073016992.1), <italic>Colobus angolensis palliatus</italic> (XM 011954968.1), <italic>Trachypithecus francoisi </italic>(XM 033195391.1), <italic>Rhinopithecus roxellana</italic> (XM 030936547.1), <italic>Cebus imitator</italic> (XM 037728349.1), <italic>Sapajus apella</italic> (XM 032251910.1), <italic>Myodes glareolus</italic> (XM 048434638.1), <italic>Mus musculus</italic> (NM 001428752.1), <italic>Apodemus sylvaticus</italic> (XM 052189402.1), dan <italic>Rattus norvegicus</italic> (NM 001428753.1). All nucleotide datasets were downloaded in FASTA format and stored locally for downstream analyses.</p><p>Corresponding MUC16 protein sequences for each species were also retrieved from the NCBI Protein Database through the same NCBI platform. The protein accession numbers were as follows: <italic>Homo sapiens</italic> (NP_001388430.1), <italic>Pan paniscus</italic> (XP_054958860.2), <italic>Gorilla gorilla gorilla</italic> (XP_055227543.1), <italic>Symphalangus syndactylus</italic> (XP_055093811.1), <italic>Nomascus leucogenys</italic> (XP_030677638.1), <italic>Hylobates moloch</italic> (XP_058281737.1), <italic>Papio anubis</italic> (XP_031515848.1), <italic>Theropithecus gelada</italic> (XP_025223620.1), <italic>Cercocebus atys</italic> (XP_011932759.1), <italic>Macaca mulatta</italic> (XP_028696075.1), <italic>Chlorocebus sabaeus</italic> (XP_072873093.1), <italic>Colobus angolensis palliatus</italic> (XP_011810358.1), <italic>Trachypithecus francoisi</italic> (XP_033051282.1), <italic>Rhinopithecus roxellana</italic> (XP_030792407.1), <italic>Cebus imitator</italic> (XP_037584277.1), <italic>Sapajus apella</italic> (XP_032107801.1), <italic>Myodes glareolus</italic> (XP_048290595.1), <italic>Mus musculus</italic> (NP_001415681.1), <italic>Apodemus sylvaticus</italic> (XP_052045362.1), and <italic>Rattus norvegicus</italic> (NP_001415682.1).</p><p>Both nucleotide and amino acid datasets were also used to evaluate variation in sequence length, number of SEA domains, and tandem repeat organization, forming the basis for comparative structural and phylogenetic analyses.</p></sec><sec><title>4. Multiple Sequence Alignment and Quality Control</title><p>Multiple sequence alignment (MSA) of MUC16 nucleotide sequences was performed using the ClustalW algorithm implemented in MEGA 12. Given the repeat-rich architecture of MUC16, alignment trimming was conducted conservatively to remove ambiguously aligned regions while retaining homologous segments shared across taxa. Tandem repeat regions were retained to preserve biologically meaningful variation; however, their contribution to the phylogenetic signal was interpreted cautiously. Manual inspection focused on repeat-rich segments exhibiting excessive gap density or uncertain homology to ensure alignment reliability. Preliminary inspection indicated that exclusion of highly repetitive segments did not alter the higher-level topology separating Primates and Rodentia, suggesting that the inferred phylogenetic relationships are robust to repeat-associated alignment variability. The final alignments were exported in MEGA format for downstream phylogenetic reconstruction.</p></sec><sec><title>5. Phylogenetic Reconstruction</title><p>Phylogenetic relationships among mammalian MUC16 sequences were reconstructed using the Neighbor-Joining (NJ) method <xref ref-type="bibr" rid="BIBR-23">(Saito &amp; Nei, 1987)</xref> as implemented in MEGA 12 <xref ref-type="bibr" rid="BIBR-15">(Kumar et al., 2024)</xref>. NJ was selected due to its computational efficiency and robustness when applied to extremely large, low-complexity, and repeat-rich genes such as MUC16, for which model-based approaches may be computationally prohibitive or sensitive to alignment uncertainty (<xref ref-type="bibr" rid="BIBR-16">(Kurt et al., 2024)</xref>; <xref ref-type="bibr" rid="BIBR-31">(Yoshida &amp; Nei, 2016)</xref>. Evolutionary distances were calculated using the p-distance model, and gaps or missing data were treated using pairwise deletion to reduce bias associated with low-complexity regions. Node support was assessed using bootstrap resampling with 1,000 replicates <xref ref-type="bibr" rid="BIBR-9">(Felsenstein, 1985)</xref>. The resulting topology was interpreted primarily for comparative and topological consistency with established mammalian taxonomy rather than for model-rich evolutionary parameter estimation. Accordingly, phylogenetic inference in this study is restricted to major clade-level relationships, and future analyses incorporating Maximum Likelihood or Bayesian frameworks may further refine evolutionary estimates for MUC16.</p></sec><sec><title>6. SEA Domain Annotation</title><p>SEA domains were identified using the SMART database based on full-length MUC16 protein sequences. All sequences were analyzed using the SMART “Normal Mode” search, which applies hidden Markov models to detect conserved domain architectures. Annotated SEA domains were recorded. Only confidently annotated SEA domains were included in downstream quantitative analyses.</p></sec><sec><title>7. Tandem Repeat Identification</title><p>Tandem repeat regions were identified using Tandem Repeats Finder (TRF) with default parameters (match = 2, mismatch = 7, indel = 7, minimum alignment score = 50, maximum period size = 500). Analyses were performed on nucleotide sequences, as TRF operates at the DNA level. Repeat regions exhibiting clear repeat units were retained, while overlapping or degenerate repeats were evaluated manually. Only non-everlapping tandem repeat segments were counted to ensure consistency across species.</p></sec><sec><title>8. Statistical and Comparative Analysis</title><p>Descriptive statistics were calculated for SEA domain counts and tandem repeat numbers across species. Because normality assumptions were not met for one or more variables, non-parametric statistical approaches were applied. Differences between Primates and Rodentia were evaluated using appropriate non-parametric tests, and Spearman’s rank correlation coefficient was used to assess the association between SEA domain number and tandem repeat variation. In order to explore multivariate patterns, hierarchical clustering was performed using Z-score-standardized domain features, and results were visualized as heatmaps.</p></sec></sec><sec><title>Results and discussion</title><sec><title>1. Phylogenetic Reconstruction of Mammalian MUC16</title><p>The evolutionary relationships and cross-taxonomic conservation of MUC16 were examined through phylogenetic reconstruction based on orthologous nucleotide sequences derived from twenty representative mammalian species. This comparative approach enables an assessment of how MUC16 has diversified across major mammalian lineages, while situating observed sequence variation within a broader evolutionary context. By applying a standardized phylogenetic framework, the resulting topology highlights patterns of divergence and conservation that are broadly consistent with establish mammalian taxonomy. The reconstructed phylogeny, presented in <xref ref-type="fig" rid="figure-1">Figure 1</xref>, serves as a reference framework for interpreting lineage-specific variation and evolutionary separation of MUC16 among the examined taxa.</p><fig ignoredToc="" id="figure-1"><label>Figure 1</label><caption><p>Neighbor-Joining phylogenetic tree of MUC16 from 20 mammalian species.</p></caption><graphic mime-subtype="png" mimetype="image" xlink:href="https://journals2.ums.ac.id/bioeksperimen/article/download/14233/5371/67744"><alt-text>Image</alt-text></graphic></fig><p>The Neighbor-Joining phylogenetic analysis of MUC16 across twenty mammalian species produced a well-resolved topology that largely mirrors accepted mammalian evolutionary relationships, while also revealing lineage-specific divergence within the gene. The inferred tree shows a major bifurcation separating Primates and Rodentia, accompanied by pronounced differences in branch lengths that reflect variation in evolutionary rates among lineages.</p><p>Within primate, Old World monkeys (including <italic>Papio anubis, Theropithecus gelada, Cercopithecus aethiops, Macaca mulatta,</italic> and <italic>Chlorocebus sabaeus</italic>) form a compact and strongly supported cluster, with bootstrap values consistently approaching or reaching 100. The short branch lengths observed within this group indicate high sequence conservation and relatively slow divergence of MUC16 between Cercopithecidae. A closely related Colobinae subgroup (<italic>Colobus angolensis palliatus</italic>, <italic>Trachypithecus francoisi</italic>, and <italic>Rhinopithecus roxellana</italic>) also exhibits maximal bootstrap support and minimal branch distances, suggesting recent common ancestry and a stable MUC16 sequence configuration across these taxa.</p><p>The Hominoidea clade (including <italic>Homo sapiens, Pan paniscus, Gorilla gorilla</italic>, <italic>Hylobates moloch, Symphalangus syndactylus</italic>, and <italic>Nomascus leucogenys</italic>) shows a clearly defined branching pattern with robust bootstrap support (predominantly 98-100), indicating strong topological confidence. Great apes cluster closely with short internal branches, reflecting minimal divergence among their MUC16 orthologs, whereas lesser apes form a sister lineage characterized by moderately longer branches. This pattern suggests slightly higher divergence rates in lesser apes relative to great apes, though still lower than those observed in other primate groups.</p><p>New World monkeys (<italic>Cebus imitator</italic> and <italic>Sapajus apella</italic>) occupy a distinct position within the primate clade, supported by high bootstrap values (&gt;90) but characterized by longer branch lengths compared with Catarrhini. This pattern indicates increased sequence divergence and potential lineage-specific modifications of MUC16 within Platyrrhini.</p><p>Rodents species form a distinct and well-supported clade comprising <italic>Muc musculus, Rattus norvegicus, Apodemus sylvaticus,</italic> and <italic>Myodes glareolus</italic>. This clade is characterized by markedly longer branch lengths relative to primates, suggesting higher substitution rates and accelerated molecular evolution of MUC16 within Rodentia. In particular, the extended external branches observed for <italic>Apodemus sylvaticus</italic> and <italic>Myodes glareolus</italic> indicate pronounced lineage-specific divergence. All rodent nodes are strongly supported (bootstrap values ranging from 92 to 100), reinforcing the reliability of the inferred relationships.</p><p>Overall, bootstrap analysis based on 1000 replicates demonstrates high confidence across major nodes, particularly within primate subclades where values frequently reach 100, indicating strong topological stability. In contrast, deeper ancestral nodes separating major mammalian lineages show moderately lower support, a pattern expected given the substantial evolutionary distances involved. Branch lenghts, representing estimated substitutions per site, vary considerably among lineages. Short branch lengths within Hominoidea and Cercopithecidae suggest relatively conservative evolution of MUC16 in these groups, consistent with functional constraints acting on core regions of the gene associated with epithelial protection, immune modulation, and cell-cell interactions (<xref ref-type="bibr" rid="BIBR-12">(Gipson et al., 2014)</xref>; <xref ref-type="bibr" rid="BIBR-21">(Perez &amp; Gipson, 2008)</xref>). Conversely, the longer branches observed in rodents are indicative of accelerated molecular evolution and greater lineage-specific divergence, a trend previously reported for mucin genes under selective pressures related to reproduction, immune challenges, and environmental exposure <xref ref-type="bibr" rid="BIBR-7">(Duraisamy et al., 2007)</xref><xref rid="BIBR-30" ref-type="bibr">(White et al., 2022)</xref>.</p></sec><sec><title>2. Comparative Structural Organization of MUC16</title><p>In order to contextualize the phylogenetic patterns observed for MUC16, a comparative analysis of domain-level structural organization was conducted across representative mammalian lineages. While phylogenetic reconstruction elucidates evolutionary relatedness, examination of structural architecture provides complementary insight into how specific regions of MUC16 are conserved or diversified among species. Owing to the exceptional size and repetitive nature of MUC16, schematic comparisons were restricted to three representative taxa (<italic>H. sapiens, C. atys,</italic> and <italic>M. glareolus</italic>) to facilitate clear visualization of lineage-specific structural patterns (<xref ref-type="fig" rid="figure-2">Figure 2</xref>).</p><fig id="figure-2" ignoredToc=""><label>Figure 2</label><caption><p>Schematic comparison of MUC16 structural organization in three mammalian species: (A) <italic>Homo sapiens</italic>, (B) <italic>Cercocebus atys</italic>, and (C) <italic>Myodes glareolus</italic>. Diagrams illustrate the major extracellular domains, including the tandem repeat region, SEA domains proximal to the transmembrane segment, and the conserved cytoplasmic tail.</p></caption><graphic mime-subtype="png" mimetype="image" xlink:href="https://journals2.ums.ac.id/bioeksperimen/article/download/14233/5371/67745"><alt-text>Image</alt-text></graphic></fig><p>As shown in <xref ref-type="fig" rid="figure-2">Figure 2</xref>, MUC16 exhibits pronounced interspecies variation in modular architecture despite sharing a conserved overall organization consisting of an extensive extracellular domain, tandem repeat, SEA domains, and a C-terminal transmembrane-cytoplasmic module. In <italic>H. sapiens</italic>, both the N-terminal region and tandem repeat are markedly expanded, consistent with the documented structural complexity and functional specialization of human MUC16 in mucosal protection and disease-associated processes. <italic>Cercocebus atys</italic> displays an intermediate architectural profile, retaining substantial tandem repeat regions but exhibiting fewer SEA domains, reflecting moderate divergence among non-human primates. In contrast, the rodent <italic>M. glareolus</italic> shows a compact configuration characterized by reduced tandem repeat content and a limited number of SEA domains, a pattern consistent with streamlined mucin architectures commonly reported in Rodentia <xref ref-type="bibr" rid="BIBR-17">(Maeda et al., 2004)</xref>.</p><p>When interpreted alongside the phylogenetic reconstruction, these structural differences align closely with evolutionary relationships among species. Primate lineages generally exhibit expanded SEA domain clusters and larger tandem repeat, supporting previous observations that mucins in higher primates have undergone modular proliferation, potentially enhancing glycosylation diversity and epithelial barrier complexity <xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref><xref ref-type="bibr" rid="BIBR-32">(Zhang et al., 2024)</xref>. The particularly elaborate architecture of human MUC16 has been associated with its established roles in immune modulation, reproductive biology, and tumor progression <xref ref-type="bibr" rid="BIBR-14">(Kufe, 2022)</xref>. Conversely, the reduced structural organization observed in rodents supports the view that selective pressures in this lineage may favor genomic streamlining rather than extensive expansion of mucin modularity <xref ref-type="bibr" rid="BIBR-17">(Maeda et al., 2004)</xref>.</p><p>The three illustrated species thus represent a biologically informative cross section of mammalian MUC16 diversity, capturing structurally elaborate, intermediate, and compact architectures across evolutionary distance. By emphasizing proportional domain organization rather than absolute sequence length, the schematic provides a conceptual framework for visualizing lineage-dependent structural variation in MUC16, complementing the sequence-based phylogenetic analysis.</p></sec><sec><title>3. Quantitative Comparison of SEA Domains and Tandem Repeats</title><p>A quantitative comparison was conducted to characterize interspecific variation in MUC16 structural architecture by examining its two principal modular components (tandem repeats and SEA domains) across twenty mammalian species representing Primates and Rodentia. This analysis enables assessment of structural expansion or reduction within and between major lineages, providing a complementary perspective to sequence-based phylogenetic inference. Variation in tandem repeat number and SEA domain composition has long been recognized as a defining feature of mucin evolution and is shaped by lineage-specific selective pressures acting on mucosal defense, immune modulation, and reproductive function <xref ref-type="bibr" rid="BIBR-7">(Duraisamy et al., 2007)</xref>. The distribution patterns are summarized in <xref ref-type="fig" rid="figure-3">Figure 3</xref>.</p><fig id="figure-3" ignoredToc=""><label>Figure 3</label><caption><p>Comparative distribution of MUC16 structural features across selected mammalian species. Bar chart illustrates the number of tandem repeats and SEA domains identified in MUC16 from 20 species representing Primates and Rodentia.</p></caption><graphic xlink:href="https://journals2.ums.ac.id/bioeksperimen/article/download/14233/5371/67746" mime-subtype="png" mimetype="image"><alt-text>Image</alt-text></graphic></fig><p>As shown in <xref ref-type="fig" rid="figure-3">Figure 3</xref>, primate species generally exhibit higher numbers of both tandem repeats and SEA domains than rodents, indicating greater structural complexity of MUC16 within the primate lineage. This pattern is consistent with previous genomic analyses of mucin genes, including MUC5AC and MUC5B, which reported increased protein length variability in primates driven largely by variation in tandem repeat number <xref rid="BIBR-22" ref-type="bibr">(Plender et al., 2024)</xref>. Several primates, including <italic>H. moloch, P. anubis,</italic> and <italic>P. paniscus</italic>, show pronounced SEA domain expansion (≥10 domains), a feature also reported for other membrane-associated mucins such as MUC1 and MUC4 (<xref ref-type="bibr" rid="BIBR-14">(Kufe, 2022)</xref>; <xref ref-type="bibr" rid="BIBR-11">(Ganguly et al., 2020)</xref>; <xref ref-type="bibr" rid="BIBR-20">(Pei &amp; Grishin, 2017)</xref>; <xref ref-type="bibr" rid="BIBR-6">(Dhar &amp; McAuley, 2019)</xref>).</p><p>Despite substantial variation in SEA domain counts, tandem repeat numbers among primates remain relatively conserved, with most species exhibiting six to eight repeat units. This pattern aligns with earlier findings indicating that tandem repeat arrays, while highly variable across mammals, tend to be more conserved within closely related primate lineages (<xref ref-type="bibr" rid="BIBR-2">(Ahmad et al., 2020)</xref>; <xref ref-type="bibr" rid="BIBR-4">(Arabfard et al., 2022)</xref>; <xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref>). Notable exceptions include <italic>T. gelada</italic> and <italic>T. francoisi</italic>, which display extensive SEA domain expansion while maintaining moderate tandem repeat counts. <italic>Homo sapiens</italic> exhibits a balanced structural profile characterized by both high SEA domain numbers and an expanded tandem repeat region, consistent with the documented structural elaboration of human MUC16 and its established roles in mucosal defense and tumor biology<xref ref-type="bibr" rid="BIBR-14">(Kufe, 2022)</xref>.</p><p>In contrast, rodent species (including <italic>R. norvegicus, A. sylvaticus, M. musculus</italic>, and <italic>M. glareolus</italic>) display markedly reduced structural architectures. Tandem repeat counts are minimal, often ≤2, and SEA domain numbers remain low, reflecting contraction of mucin gene families commonly observed in Rodentia <xref rid="BIBR-19" ref-type="bibr">(Pajic et al., 2022)</xref>. This pattern is consistent with reported genomic streamlining and reduced selective pressure for mucin diversification in rodents, particularly for genes associated with mucosal surface specialization <xref ref-type="bibr" rid="BIBR-19">(Pajic et al., 2022)</xref><xref rid="BIBR-24" ref-type="bibr">(Roycroft et al., 2021)</xref>.</p><p>To complement the absolute feature counts shown in <xref ref-type="fig" rid="figure-3">Figure 3</xref>, hierarchical clustering based on standardized tandem repeat and SEA domain features was performed to examine relational patterns among species (<xref ref-type="fig" rid="figure-4">Figure 4</xref>). This multivariate approach highlights relative similarity rather than magnitude and has been widely applied in comparative analyses of mucin modular organization (<xref rid="BIBR-25" ref-type="bibr">(Shen &amp; Li, 2016)</xref>; <xref ref-type="bibr" rid="BIBR-1">(Adams &amp; Collyer, 2019)</xref>).</p><fig id="figure-4" ignoredToc=""><label>Figure 4</label><caption><p>Hierarchical clustering heatmap of MUC16 structural features derived standardized tandem repeat and SEA domain counts across 20 mammalian species.</p></caption><graphic mime-subtype="png" mimetype="image" xlink:href="https://journals2.ums.ac.id/bioeksperimen/article/download/14233/5371/67747"><alt-text>Image</alt-text></graphic></fig><p>The heatmap reveals distinct clustering patterns that broadly correspond to taxonomic affiliations, with primates forming groups separate from rodents. Species with similar domain architectures cluster closely, whereas others occupy more isolated positions, indicating unique structural profiles. These multivariate patterns reinforce the evolutionary relationships inferred from both sequence-based phylogeny and absolute structural feature comparisons <xref ref-type="bibr" rid="BIBR-19">(Pajic et al., 2022)</xref><xref ref-type="bibr" rid="BIBR-24">(Roycroft et al., 2021)</xref>.</p></sec><sec><title>4. Association Between SEA Domains and Tandem Repeats</title><p>Structural variation in MUC16 across the examined mammalian species was quantitatively characterized by summarizing the distribution of SEA domain and tandem repeat numbers. These features represent key components of mucin modular architecture and are widely recognized as major contributors to interspecies differences in glycoprotein structure and evolutionary diversification (<xref rid="BIBR-21" ref-type="bibr">(Perez &amp; Gipson, 2008)</xref>; <xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref>; <xref ref-type="bibr" rid="BIBR-30">(White et al., 2022)</xref>). Descriptive statistics provide an essential quantitative framework for evaluating the extent of structural expansion and contraction prior to inferential assessment. Summary metrics are presented in<xref ref-type="table" rid="table-1">Table 1</xref>.</p><table-wrap id="table-1" ignoredToc=""><label>Table 1</label><caption><p>Summary statistics of SEA domain and tandem repeat counts</p><p>across 20 mammalian species</p></caption><table frame="box" rules="all"><thead><tr><th align="left" colspan="1" valign="top"><bold>Variable</bold></th><th valign="top" align="left" colspan="1"><bold>Mean</bold></th><th valign="top" align="left" colspan="1"><bold>SD</bold></th><th valign="top" align="left" colspan="1"><bold>Median</bold></th><th valign="top" align="left" colspan="1"><bold>Min</bold></th><th valign="top" align="left" colspan="1"><bold>Max</bold></th></tr></thead><tbody><tr><td valign="top" align="left" colspan="1">SEA domain</td><td align="left" colspan="1" valign="top">7.40</td><td align="left" colspan="1" valign="top">3.41</td><td valign="top" align="left" colspan="1">8.50</td><td valign="top" align="left" colspan="1">1</td><td valign="top" align="left" colspan="1">13</td></tr><tr><td align="left" colspan="1" valign="top">Tandem repeat</td><td align="left" colspan="1" valign="top">5.015</td><td colspan="1" valign="top" align="left">2.54</td><td colspan="1" valign="top" align="left">6.00</td><td valign="top" align="left" colspan="1">0</td><td align="left" colspan="1" valign="top">9</td></tr></tbody></table></table-wrap><p>SEA domain numbers exhibit substantial heterogeneity, ranging from 1 to 13 units (mean = 7.40; SD = 3.41). The median value (8.50) exceeds the mean, indicating a right-skewed distribution driven primarily by species with expanded SEA domain arrays. Such patterns are consistent with prior observations that membrane-associated mucins undergo lineage-specific modulation of SEA domain architecture <xref rid="BIBR-8" ref-type="bibr">(Faruque et al., 2025)</xref><xref rid="BIBR-32" ref-type="bibr">(Zhang et al., 2024)</xref>.</p><p>Tandem repeat counts display a mean of 5.02 and a standard deviation of 2.54, reflecting moderate dispersion relative to SEA domains. The observed range extends from the absence of detectable repeats in several rodents to pronounced repeat amplification in multiple primate taxa. Variation in tandem repeat number is consistent with established models of mucin evolution, in which repeat expansion contributes to increased glycan density and surface complexity <xref ref-type="bibr" rid="BIBR-26">(Sulovari et al., 2019)</xref><xref ref-type="bibr" rid="BIBR-11">(Ganguly et al., 2020)</xref><xref ref-type="bibr" rid="BIBR-28">(Verbiest et al., 2022)</xref><xref ref-type="bibr" rid="BIBR-27">(Taniguchi et al., 2017)</xref>. Together, these descriptive patterns indicate that MUC16 structural diversification is highly lineage dependent.</p><p>In order to examine whether variation in SEA domain number is associated with corresponding changes in tandem repeat content, a nonparametric Spearman’s rank correlation analysis was performed. This method is appropriate for datasets that deviate from normality and for evolutionary traits shaped by repetitive sequence dynamics <xref ref-type="bibr" rid="BIBR-10">(Fotsing et al., 2019)</xref><xref ref-type="bibr" rid="BIBR-19">(Pajic et al., 2022)</xref><xref ref-type="bibr" rid="BIBR-29">(Wang et al., 2024)</xref>. The relationship between the two structural features is illustrated in <xref ref-type="fig" rid="figure-5">Figure 5</xref>.</p><fig id="figure-5" ignoredToc=""><label>Figure 5</label><caption><p>Scatterplot showing the association between SEA domain and tandem repeat count across 20 mammalian species. Abbreviations: Hsa (<italic>Homo sapiens</italic>), Ppa (<italic>Pan paniscus</italic>), Ggo (<italic>Gorilla gorilla gorilla</italic>), Ssy (<italic>Symphalangus syndactylus</italic>), Nle (<italic>Nomascus leucogenys</italic>), Hmo (<italic>Hylobates moloch</italic>), Pan (<italic>Papio anubis</italic>), Tge (<italic>Theropithecus gelada</italic>), Cat (<italic>Cercocebus atys</italic>), Mmu (<italic>Macaca mulatta</italic>), Csa (<italic>Chlorocebus sabaeus</italic>), Cap (<italic>Colobus angolensis palliatus</italic>), Tfr (<italic>Trachypithecus francoisi</italic>), Rro (<italic>Rhinopithecus roxellana</italic>), Cim (<italic>Cebus imitator</italic>), Sap (<italic>Sapajus apella</italic>), Mgl (<italic>Myodes glareolus</italic>), MmuS (<italic>Mus musculus</italic>), Asy (<italic>Apodemus sylvaticus</italic>), and Rno (<italic>Rattus norvegicus</italic>).</p></caption><graphic mime-subtype="png" mimetype="image" xlink:href="https://journals2.ums.ac.id/bioeksperimen/article/download/14233/5371/67748"><alt-text>Image</alt-text></graphic></fig><p>The analysis reveals a moderate positive association (ρ = 0.44) between SEA domain and tandem repeat counts; however, this relationship does not reach conventional statistical significance (p = 0.052). Accordingly, the result should be interpreted as a biologically suggestive trend rather than evidence of coordinated evolution. Similar tendencies toward parallel expansion of mucin structural modules have been reported in comparative genomic studies, although such patterns are often shaped by lineage-specific constraints and stochastic variation <xref ref-type="bibr" rid="BIBR-7">(Duraisamy et al., 2007)</xref><xref ref-type="bibr" rid="BIBR-26">(Sulovari et al., 2019)</xref>.</p><p>Visual inspection of the scatterplot indicates lineage-associated clustering. Primate species tend to occupy regions corresponding to higher values of both structural features, whereas rodents cluster at lower values, reflecting compact MUC16 architectures. These distributions are consistent with previously reported contrasts in mucin gene organization between Primates and Rodentia <xref ref-type="bibr" rid="BIBR-17">(Maeda et al., 2004)</xref><xref ref-type="bibr" rid="BIBR-19">(Pajic et al., 2022)</xref>. Intermediate positions observed in several primate taxa further suggest that MUC16 structural evolution proceeds along a continuum rather than discrete categorical states.</p><p>This study provides a comparative evolutionary framework that integrates phylogenetic reconstruction with quantitative and domain-level structural analyses of MUC16 across representative mammalian lineages. Unlike previous studies that primarily emphasized biomedical relevance or limited taxonomic scope (<xref rid="BIBR-18" ref-type="bibr">(McLemore &amp; Aouizerat, 2005)</xref>; <xref ref-type="bibr" rid="BIBR-8">(Faruque et al., 2025)</xref>; <xref ref-type="bibr" rid="BIBR-32">(Zhang et al., 2024)</xref>; <xref rid="BIBR-30" ref-type="bibr">(White et al., 2022)</xref>), the present work highlights lineage-specific variation in SEA domains and tandem repeats as key contributors to MUC16 diversification. Representative structural models of <italic>H. sapiens, C. atys, </italic>and<italic> M. glareolus</italic> further demonstrate how sequence divergence translates into distinct architectural patterns.</p><p>Several limitations should be acknowledged. The present analysis is restricted to representative species from Primates and Rodentia, and therefore the inferred evolutionary patterns should be interpreted within this taxonomic scope rather than as general features of all mammals. Domain annotation and tandem repeat detection depend on the quality of publicly available genomic resources, and the Neighbor-Joining method provides limited modeling resolution compared with likelihood-based approaches. In addition, SEA domain identification relied on a single annotation platform (SMART), which has been widely applied for domain annotation in mucin proteins. While cross-validation using complementary databases such as Pfam or InterPro would further strengthen confidence in domain assignment.</p><p>Future studies expanding taxonomic sampling, applying model-based phylogenetic inference, integrating multiple annotation platforms and incorporating glycoproteomic or functional data will be valuable for testing the biological implications of MUC16 modular variation, which should be regarded as hypotheses rather than direct outcomes of the present analysis.</p></sec></sec><sec><title>Conclusion</title><p>This study presents a comparative evolutionary analysis of MUC16 across mammalian lineages by integrating phylogenetic reconstruction with quantitative assessments of SEA domain and tandem repeat variation. The clear molecular separation between Primates and Rodentia reflects lineage-specific evolutionary trajectories, with primates exhibiting expanded domain architectures and rodents retaining comparatively compact structures. Although a moderate positive association between SEA domain number and tandem repeat count was observed, this relationship should be interpreted as a biologically suggestive trend rather than evidence of coordinated evolution. Collectively, these findings demonstrate that MUC16 diversification follows structured, lineage-dependent patterns rather than random variation. This evolutionary framework provides a foundation for future studies examining the functional and adaptive significance of mucin modularity across mammals..</p></sec><sec><title>Author Statements</title><p><bold>Acknowledgements and funding statements:</bold> The authors express their sincere appreciation to the Department of Biology, Faculty of Sciences and Technology, Universitas Medan Area, for providing research facilities and institutional support during the study. This research did not receive any specific grant from funding agencies in the public, commercial, or not-for-profit sectors.</p><p>Competing of interest: The authors declare that there are no financial or personal relationships that could be construed as a potential conflict of interest.</p><p><bold>Author’s contributions:</bold> YGF was responsible for conceptualization, study design, data curation, formal analysis, methodology, visualization, and manuscript drafting. AY performed data analysis, validation, literature review, and critical revision of the manuscript. NŞC provided supervision, methodological guidance, interpretation of results, and final approval of the manuscript.</p><p><bold>Generative AI:</bold> Not applicable</p><p><bold>Data availability:</bold> All data used in this study were obtained from publicly available databases, including the NCBI Nucleotide and Protein repositories. The accession number of all sequences analyzed are provided within the Materials and Methods section. Processed data and additional analytical outputs supporting the findings of this study are available from the corresponding author upon reasonable request.</p></sec></body><back><ref-list><title>References</title><ref id="BIBR-1"><element-citation publication-type="article-journal"><article-title>Phylogenetic Comparative Methods and the Evolution of Multivariate Phenotypes</article-title><source>Annual Review of Ecology, Evolution, and Systematics</source><volume>50</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Adams</surname><given-names>D.</given-names></name><name><surname>Collyer</surname><given-names>M.</given-names></name></person-group><year>2019</year><fpage>1</fpage><lpage>21</lpage><page-range>1-21</page-range><pub-id pub-id-type="doi">10.1146/annurev-ecolsys-110218-024555</pub-id></element-citation></ref><ref id="BIBR-2"><element-citation publication-type="article-journal"><article-title>Dark Matter of Primate Genomes: Satellite DNA Repeats and Their Evolutionary Dynamics</article-title><source>Cells</source><volume>9</volume><issue>12</issue><person-group person-group-type="author"><name><surname>Ahmad</surname><given-names>S.</given-names></name><name><surname>Singchat</surname><given-names>W.</given-names></name><name><surname>Jehangir</surname><given-names>M.</given-names></name><name><surname>Suntronpong</surname><given-names>A.</given-names></name><name><surname>Panthum</surname><given-names>T.</given-names></name><name><surname>Malaivijitnond</surname><given-names>S.</given-names></name><name><surname>Srikulnath</surname><given-names>K.</given-names></name></person-group><year>2020</year><page-range>2714</page-range><pub-id pub-id-type="doi">10.3390/cells9122714</pub-id></element-citation></ref><ref id="BIBR-3"><element-citation publication-type="article-journal"><article-title>MUC16 as a novel target for cancer therapy</article-title><source>Expert Opinion on Therapeutic Targets</source><volume>22</volume><person-group person-group-type="author"><name><surname>Aithal</surname><given-names>A.</given-names></name><name><surname>Rauth</surname><given-names>S.</given-names></name><name><surname>Kshirsagar</surname><given-names>P.</given-names></name><name><surname>Shah</surname><given-names>A.</given-names></name><name><surname>Lakshmanan</surname><given-names>I.</given-names></name><name><surname>Junker</surname><given-names>W.</given-names></name><name><surname>Jain</surname><given-names>M.</given-names></name><name><surname>Ponnusamy</surname><given-names>M.</given-names></name><name><surname>Batra</surname><given-names>S.</given-names></name></person-group><year>2018</year><fpage>675</fpage><lpage>686</lpage><page-range>675-686</page-range><pub-id pub-id-type="doi">10.1080/14728222.2018.1498845</pub-id></element-citation></ref><ref id="BIBR-4"><element-citation publication-type="article-journal"><article-title>Global abundance of short tandem repeats is non-random in rodents and primates</article-title><source>BMC Genomic Data</source><volume>23</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Arabfard</surname><given-names>M.</given-names></name><name><surname>Salesi</surname><given-names>M.</given-names></name><name><surname>Nourian</surname><given-names>Y.</given-names></name><name><surname>Arabipour</surname><given-names>I.</given-names></name><name><surname>Maddi</surname><given-names>A.</given-names></name><name><surname>Kavousi</surname><given-names>K.</given-names></name><name><surname>Ohadi</surname><given-names>M.</given-names></name></person-group><year>2022</year><page-range>77</page-range><pub-id pub-id-type="doi">10.1186/s12863-022-01092-4</pub-id></element-citation></ref><ref id="BIBR-5"><element-citation publication-type="article-journal"><article-title>Membrane proximal ectodomain cleavage of MUC16 occurs in the acidifying Golgi/post-Golgi compartments</article-title><source>Scientific Reports</source><volume>5</volume><person-group person-group-type="author"><name><surname>Das</surname><given-names>S.</given-names></name><name><surname>Majhi</surname><given-names>P.</given-names></name><name><surname>Al‐Mugotir</surname><given-names>M.</given-names></name><name><surname>Rachagani</surname><given-names>S.</given-names></name><name><surname>Sorgen</surname><given-names>P.</given-names></name><name><surname>Batra</surname><given-names>S.</given-names></name></person-group><year>2015</year><page-range>9759</page-range><pub-id pub-id-type="doi">10.1038/srep09759</pub-id></element-citation></ref><ref id="BIBR-6"><element-citation publication-type="article-journal"><article-title>The Role of the Cell Surface Mucin MUC1 as a Barrier to Infection and Regulator of Inflammation</article-title><source>Frontiers in Cellular and Infection Microbiology</source><volume>9</volume><person-group person-group-type="author"><name><surname>Dhar</surname><given-names>P.</given-names></name><name><surname>McAuley</surname><given-names>J.</given-names></name></person-group><year>2019</year><page-range>117</page-range><pub-id pub-id-type="doi">10.3389/fcimb.2019.00117</pub-id></element-citation></ref><ref id="BIBR-7"><element-citation publication-type="article-journal"><article-title>Distinct evolution of the human carcinoma-associated transmembrane mucins, MUC1, MUC4 AND MUC16</article-title><source>Gene</source><volume>373</volume><person-group person-group-type="author"><name><surname>Duraisamy</surname><given-names>S.</given-names></name><name><surname>Ramasamy</surname><given-names>S.</given-names></name><name><surname>Kharbanda</surname><given-names>S.</given-names></name><name><surname>Kufe</surname><given-names>D.</given-names></name></person-group><year>2007</year><fpage>28</fpage><lpage>34</lpage><page-range>28-34</page-range><pub-id pub-id-type="doi">10.1016/j.gene.2005.12.021</pub-id></element-citation></ref><ref id="BIBR-8"><element-citation publication-type="article-journal"><article-title>Deciphering Deleterious nsSNPs in MUC16&#39;s SEA Domain: Structural and Functional Implications in Cancer Metastasis via Computational Analysis</article-title><source>J Cell Mol Med</source><volume>29</volume><person-group person-group-type="author"><name><surname>Faruque</surname><given-names>M.</given-names></name><name><surname>Medha</surname><given-names>M.M.</given-names></name><name><surname>Mahfuz</surname><given-names>A.M.U.B.</given-names></name><name><surname>Islam</surname><given-names>M.M.</given-names></name><name><surname>Siraj</surname><given-names>M.A.</given-names></name></person-group><year>2025</year><page-range>70633</page-range><pub-id pub-id-type="doi">10.1111/jcmm.70633</pub-id></element-citation></ref><ref id="BIBR-9"><element-citation publication-type="article-journal"><article-title>Confidence limits on phylogenies: An approach using the bootstrap</article-title><source>Evolution</source><volume>39</volume><person-group person-group-type="author"><name><surname>Felsenstein</surname><given-names>J.</given-names></name></person-group><year>1985</year><fpage>783</fpage><lpage>791</lpage><page-range>783-791</page-range></element-citation></ref><ref id="BIBR-10"><element-citation publication-type="article-journal"><article-title>The impact of short tandem repeat variation on gene expression</article-title><source>Nature genetics</source><volume>51</volume><person-group person-group-type="author"><name><surname>Fotsing</surname><given-names>S.</given-names></name><name><surname>Margoliash</surname><given-names>J.</given-names></name><name><surname>Wang</surname><given-names>C.</given-names></name><name><surname>Saini</surname><given-names>S.</given-names></name><name><surname>Yanicky</surname><given-names>R.</given-names></name><name><surname>Shleizer-Burko</surname><given-names>S.</given-names></name><name><surname>Goren</surname><given-names>A.</given-names></name><name><surname>Gymrek</surname><given-names>M.</given-names></name></person-group><year>2019</year><fpage>1652</fpage><lpage>1659</lpage><page-range>1652-1659</page-range><pub-id pub-id-type="doi">10.1038/s41588-019-0521-9</pub-id></element-citation></ref><ref id="BIBR-11"><element-citation publication-type="article-journal"><article-title>Unraveling mucin domains in cancer and metastasis: when protectors become predators</article-title><source>Cancer metastasis reviews</source><volume>39</volume><issue>3</issue><person-group person-group-type="author"><name><surname>Ganguly</surname><given-names>K.</given-names></name><name><surname>Rauth</surname><given-names>S.</given-names></name><name><surname>Marimuthu</surname><given-names>S.</given-names></name><name><surname>Kumar</surname><given-names>S.</given-names></name><name><surname>Batra</surname><given-names>S.K.</given-names></name></person-group><year>2020</year><fpage>647</fpage><lpage>659</lpage><page-range>647-659</page-range><pub-id pub-id-type="doi">10.1007/s10555-020-09896-5</pub-id></element-citation></ref><ref id="BIBR-12"><element-citation publication-type="article-journal"><article-title>Comparison of the Transmembrane Mucins MUC1 and MUC16 in Epithelial Barrier Function</article-title><source>PLoS ONE</source><volume>9</volume><issue>6</issue><person-group person-group-type="author"><name><surname>Gipson</surname><given-names>I.</given-names></name><name><surname>Spurr-Michaud</surname><given-names>S.</given-names></name><name><surname>Tisdale</surname><given-names>A.</given-names></name><name><surname>Menon</surname><given-names>B.</given-names></name></person-group><year>2014</year><page-range>100393</page-range><pub-id pub-id-type="doi">10.1371/journal.pone.0100393</pub-id></element-citation></ref><ref id="BIBR-13"><element-citation publication-type="article-journal"><article-title>MUC16 Is Lost from the Uterodome (Pinopode</article-title><source>Surface of the Receptive Human Endometrium: In Vitro Evidence That MUC16 Is a Barrier to Trophoblast Adherence1</source><volume>78</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Gipson</surname><given-names>I.</given-names></name><name><surname>Blalock</surname><given-names>T.</given-names></name><name><surname>Tisdale</surname><given-names>A.</given-names></name><name><surname>Spurr-Michaud</surname><given-names>S.</given-names></name><name><surname>Allcorn</surname><given-names>S.</given-names></name><name><surname>Stavreus-Evers</surname><given-names>A.</given-names></name><name><surname>Gemzell</surname><given-names>K.</given-names></name></person-group><year>2008</year><fpage>134</fpage><lpage>142</lpage><page-range>134-142</page-range><pub-id pub-id-type="doi">10.1095/biolreprod.106.058347</pub-id></element-citation></ref><ref id="BIBR-14"><element-citation publication-type="article-journal"><article-title>Chronic activation of MUC1-C in wound repair promotes progression to cancer stem cells</article-title><source>J Cancer Metastasis Treat</source><volume>8</volume><person-group person-group-type="author"><name><surname>Kufe</surname><given-names>D.W.</given-names></name></person-group><year>2022</year><page-range>12</page-range><pub-id pub-id-type="doi">10.20517/2394-4722.2022.03</pub-id></element-citation></ref><ref id="BIBR-15"><element-citation publication-type="article-journal"><article-title>Molecular Evolutionary Genetics Analysis Version 12 for adaptive and green computing</article-title><source>Molecular Biology and Evolution</source><volume>41</volume><issue>12</issue><person-group person-group-type="author"><name><surname>Kumar</surname><given-names>S.</given-names></name><name><surname>Stecher</surname><given-names>G.</given-names></name><name><surname>Suleski</surname><given-names>M.</given-names></name><name><surname>Sanderford</surname><given-names>M.</given-names></name><name><surname>Sharma</surname><given-names>S.</given-names></name><name name-style="given-only"><given-names>Tamura</given-names></name></person-group><year>2024</year><page-range>263</page-range><pub-id pub-id-type="doi">10.1093/molbev/msae263</pub-id></element-citation></ref><ref id="BIBR-16"><element-citation publication-type="article-journal"><article-title>Sparse Neighbor Joining: rapid phylogenetic inference using a sparse distance matrix</article-title><source>Bioinformatics</source><volume>40</volume><issue>12</issue><person-group person-group-type="author"><name><surname>Kurt</surname><given-names>S.</given-names></name><name><surname>Bouchard-Côté</surname><given-names>A.</given-names></name><name><surname>Lagergren</surname><given-names>J.</given-names></name></person-group><year>2024</year><page-range>701</page-range><pub-id pub-id-type="doi">10.1093/bioinformatics/btae701</pub-id></element-citation></ref><ref id="BIBR-17"><element-citation publication-type="article-journal"><article-title>Solution Structure of the SEA Domain from the Murine Homologue of Ovarian Cancer Antigen CA125 (MUC16)*</article-title><source>Journal of Biological Chemistry</source><volume>279</volume><issue>13</issue><person-group person-group-type="author"><name><surname>Maeda</surname><given-names>T.</given-names></name><name><surname>Inoue</surname><given-names>M.</given-names></name><name><surname>Koshiba</surname><given-names>S.</given-names></name><name><surname>Yabuki</surname><given-names>T.</given-names></name><name><surname>Aoki</surname><given-names>M.</given-names></name><name><surname>Nunokawa</surname><given-names>E.</given-names></name><name><surname>Seki</surname><given-names>E.</given-names></name><name><surname>Matsuda</surname><given-names>T.</given-names></name><name><surname>Motoda</surname><given-names>Y.</given-names></name><name><surname>Kobayashi</surname><given-names>A.</given-names></name><name><surname>Hiroyasu</surname><given-names>F.</given-names></name><name><surname>Shirouzu</surname><given-names>M.</given-names></name><name><surname>Terada</surname><given-names>T.</given-names></name><name><surname>Hayami</surname><given-names>N.</given-names></name><name><surname>Ishizuka</surname><given-names>Y.</given-names></name><name><surname>Shinya</surname><given-names>N.</given-names></name><name><surname>Tatsuguchi</surname><given-names>A.</given-names></name><name><surname>Yoshida</surname><given-names>M.</given-names></name><name><surname>Hirota</surname><given-names>H.</given-names></name><name><surname>Matsuo</surname><given-names>Y.</given-names></name><name><surname>Tani</surname><given-names>K.</given-names></name><name><surname>Arakawa</surname><given-names>T.</given-names></name><name><surname>Carninci</surname><given-names>P.</given-names></name><name><surname>Kawai</surname><given-names>J.</given-names></name><name><surname>Hayashizaki</surname><given-names>Y.</given-names></name><name><surname>Kigawa</surname><given-names>T.</given-names></name><name><surname>Yokoyama</surname><given-names>S.</given-names></name></person-group><year>2004</year><fpage>13174</fpage><lpage>13182</lpage><page-range>13174-13182</page-range><pub-id pub-id-type="doi">10.1074/jbc.m309417200</pub-id></element-citation></ref><ref id="BIBR-18"><element-citation publication-type="article-journal"><article-title>Introducing the MUC16 gene: implications for prevention and early detection in epithelial ovarian cancer</article-title><source>Biological Research for Nursing</source><volume>6</volume><issue>4</issue><person-group person-group-type="author"><name><surname>McLemore</surname><given-names>M.R.</given-names></name><name><surname>Aouizerat</surname><given-names>B.</given-names></name></person-group><year>2005</year><fpage>262</fpage><lpage>267</lpage><page-range>262-267</page-range><pub-id pub-id-type="doi">10.1177/1099800404274445</pub-id></element-citation></ref><ref id="BIBR-19"><element-citation publication-type="article-journal"><article-title>A mechanism of gene evolution generating mucin function</article-title><source>Science Advances</source><volume>8</volume><person-group person-group-type="author"><name><surname>Pajic</surname><given-names>P.</given-names></name><name><surname>Shen</surname><given-names>S.</given-names></name><name><surname>Qu</surname><given-names>J.</given-names></name><name><surname>May</surname><given-names>A.</given-names></name><name><surname>Knox</surname><given-names>S.</given-names></name><name><surname>Ruhl</surname><given-names>S.</given-names></name><name><surname>Gokcumen</surname><given-names>O.</given-names></name></person-group><year>2022</year><page-range>8757</page-range><pub-id pub-id-type="doi">10.1126/sciadv.abm8757</pub-id></element-citation></ref><ref id="BIBR-20"><element-citation publication-type="article-journal"><article-title>Expansion of divergent SEA domains in cell surface proteins and nucleoporin 54</article-title><source>Protein Science</source><volume>26</volume><issue>3</issue><person-group person-group-type="author"><name><surname>Pei</surname><given-names>J.</given-names></name><name><surname>Grishin</surname><given-names>N.V.</given-names></name></person-group><year>2017</year><fpage>617</fpage><lpage>630</lpage><page-range>617-630</page-range><pub-id pub-id-type="doi">10.1002/pro.3096</pub-id></element-citation></ref><ref id="BIBR-21"><element-citation publication-type="article-journal"><article-title>Focus on Molecules: human mucin MUC16</article-title><source>Experimental Eye Research</source><volume>87</volume><issue>5</issue><person-group person-group-type="author"><name><surname>Perez</surname><given-names>B.</given-names></name><name><surname>Gipson</surname><given-names>I.</given-names></name></person-group><year>2008</year><fpage>400</fpage><lpage>401</lpage><page-range>400-401</page-range><pub-id pub-id-type="doi">10.1016/j.exer.2007.12.008</pub-id></element-citation></ref><ref id="BIBR-22"><element-citation publication-type="article-journal"><article-title>Structural and genetic diversity in the secreted mucins MUC5AC and MUC5B</article-title><source>American Journal of Human Genetics</source><volume>111</volume><issue>8</issue><person-group person-group-type="author"><name><surname>Plender</surname><given-names>E.</given-names></name><name><surname>Prodanov</surname><given-names>T.</given-names></name><name><surname>Hsieh</surname><given-names>P.</given-names></name><name><surname>Nizamis</surname><given-names>E.</given-names></name><name><surname>Harvey</surname><given-names>W.</given-names></name><name><surname>Sulovari</surname><given-names>A.</given-names></name><name><surname>Munson</surname><given-names>K.</given-names></name><name><surname>Kaufman</surname><given-names>E.</given-names></name><name><surname>O’Neal</surname><given-names>W.</given-names></name><name><surname>Valdmanis</surname><given-names>P.</given-names></name><name><surname>Marschall</surname><given-names>T.</given-names></name><name><surname>Bloom</surname><given-names>J.</given-names></name><name><surname>Eichler</surname><given-names>E.</given-names></name></person-group><year>2024</year><fpage>1700</fpage><lpage>1716</lpage><page-range>1700-1716</page-range><pub-id pub-id-type="doi">10.1016/j.ajhg.2024.06.007</pub-id></element-citation></ref><ref id="BIBR-23"><element-citation publication-type="article-journal"><article-title>The neighbor-joining method: A new method for reconstructing phhylogenetic trees</article-title><source>Molecular Biology and Evolution</source><volume>4</volume><issue>4</issue><person-group person-group-type="author"><name><surname>Saito</surname><given-names>N.</given-names></name><name><surname>Nei</surname><given-names>M.</given-names></name></person-group><year>1987</year><fpage>406</fpage><lpage>425</lpage><page-range>406-425</page-range><pub-id pub-id-type="doi">10.1093/oxfordjournals.molbev.a040454</pub-id></element-citation></ref><ref id="BIBR-24"><element-citation publication-type="article-journal"><article-title>Molecular Evolution of Ecological Specialisation: Genomic Insights from the Diversification of Murine Rodents</article-title><source>Genome Biology and Evolution</source><volume>13</volume><issue>7</issue><person-group person-group-type="author"><name><surname>Roycroft</surname><given-names>E.</given-names></name><name><surname>Achmadi</surname><given-names>A.</given-names></name><name><surname>Callahan</surname><given-names>C.</given-names></name><name><surname>Esselstyn</surname><given-names>J.</given-names></name><name><surname>Good</surname><given-names>J.</given-names></name><name><surname>Moussalli</surname><given-names>A.</given-names></name><name><surname>Rowe</surname><given-names>K.</given-names></name></person-group><year>2021</year><page-range>103</page-range><pub-id pub-id-type="doi">10.1093/gbe/evab103</pub-id></element-citation></ref><ref id="BIBR-25"><element-citation publication-type="article-journal"><article-title>A novel algorithm for detecting multiple covariance and clustering of biological sequences</article-title><source>Scientific Reports</source><volume>6</volume><person-group person-group-type="author"><name><surname>Shen</surname><given-names>W.</given-names></name><name><surname>Li</surname><given-names>Y.</given-names></name></person-group><year>2016</year><page-range>30425</page-range><pub-id pub-id-type="doi">10.1038/srep30425</pub-id></element-citation></ref><ref id="BIBR-26"><element-citation publication-type="article-journal"><article-title>Human-specific tandem repeat expansion and differential gene expression during primate evolution</article-title><source>Proceedings of the National Academy of Sciences</source><volume>116</volume><issue>46</issue><person-group person-group-type="author"><name><surname>Sulovari</surname><given-names>A.</given-names></name><name><surname>Li</surname><given-names>R.</given-names></name><name><surname>Audano</surname><given-names>P.</given-names></name><name><surname>Porubsky</surname><given-names>D.</given-names></name><name><surname>Vollger</surname><given-names>M.</given-names></name><name><surname>Logsdon</surname><given-names>G.</given-names></name><name><surname>Warren</surname><given-names>W.</given-names></name><name><surname>Pollen</surname><given-names>A.</given-names></name><name><surname>Chaisson</surname><given-names>M.</given-names></name><name><surname>Eichler</surname><given-names>E.</given-names></name></person-group><year>2019</year><fpage>23243</fpage><lpage>23253</lpage><page-range>23243-23253</page-range><pub-id pub-id-type="doi">10.1073/pnas.1912175116</pub-id></element-citation></ref><ref id="BIBR-27"><element-citation publication-type="article-journal"><article-title>N-Glycosylation affects the stability and barrier function of the MUC16 mucin</article-title><source>The Journal of Biological Chemistry</source><volume>292</volume><issue>26</issue><person-group person-group-type="author"><name><surname>Taniguchi</surname><given-names>T.</given-names></name><name><surname>Woodward</surname><given-names>A.</given-names></name><name><surname>Magnelli</surname><given-names>P.</given-names></name><name><surname>McColgan</surname><given-names>N.</given-names></name><name><surname>Lehoux</surname><given-names>S.</given-names></name><name><surname>Jacobo</surname><given-names>S.</given-names></name><name><surname>Mauris</surname><given-names>J.</given-names></name><name><surname>Argüeso</surname><given-names>P.</given-names></name></person-group><year>2017</year><fpage>11079</fpage><lpage>11090</lpage><page-range>11079-11090</page-range><pub-id pub-id-type="doi">10.1074/jbc.m116.770123</pub-id></element-citation></ref><ref id="BIBR-28"><element-citation publication-type="article-journal"><article-title>Mutation and selection processes regulating short tandem repeats give rise to genetic and phenotypic diversity across species</article-title><source>Journal of Evolutionary Biology</source><volume>36</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Verbiest</surname><given-names>M.</given-names></name><name><surname>Maksimov</surname><given-names>M.</given-names></name><name><surname>Jin</surname><given-names>Y.</given-names></name><name><surname>Anisimova</surname><given-names>M.</given-names></name><name><surname>Gymrek</surname><given-names>M.</given-names></name><name><surname>Sonay</surname><given-names>T.</given-names></name></person-group><year>2022</year><fpage>321</fpage><lpage>336</lpage><page-range>321-336</page-range><pub-id pub-id-type="doi">10.1111/jeb.14106</pub-id></element-citation></ref><ref id="BIBR-29"><element-citation publication-type="article-journal"><article-title>A Revised Molecular Model of Ovarian Cancer Biomarker CA125 (MUC16) Enabled by Long-read Sequencing</article-title><source>Cancer Research Communications</source><volume>4</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Wang</surname><given-names>C.</given-names></name><name><surname>Weaver</surname><given-names>S.</given-names></name><name><surname>Boonpattrawong</surname><given-names>N.</given-names></name><name><surname>Schuster-Little</surname><given-names>N.</given-names></name><name><surname>Pantakar</surname><given-names>M.</given-names></name><name><surname>Whelan</surname><given-names>R.</given-names></name></person-group><year>2024</year><fpage>253</fpage><lpage>263</lpage><page-range>253-263</page-range><pub-id pub-id-type="doi">10.1158/2767-9764.crc-23-0327</pub-id></element-citation></ref><ref id="BIBR-30"><element-citation publication-type="article-journal"><article-title>Crystal structure of a human MUC16 SEA domain reveals insight into the nature of the CA125 tumor marker</article-title><source>Proteins: Structure</source><volume>90</volume><issue>5</issue><person-group person-group-type="author"><name><surname>White</surname><given-names>B.</given-names></name><name><surname>Patterson</surname><given-names>M.</given-names></name><name><surname>Karnwal</surname><given-names>S.</given-names></name><name><surname>Brooks</surname><given-names>C.</given-names></name></person-group><year>2022</year><fpage>1210</fpage><lpage>1218</lpage><page-range>1210-1218</page-range><pub-id pub-id-type="doi">10.1002/prot.26303</pub-id></element-citation></ref><ref id="BIBR-31"><element-citation publication-type="article-journal"><article-title>Efficiencies of the NJp, Maximum Likelihood, and Bayesian Methods of Phylogenetic Construction for Compositional and Noncompositional Genes</article-title><source>Molecular biology and evolution</source><volume>33</volume><issue>6</issue><person-group person-group-type="author"><name><surname>Yoshida</surname><given-names>R.</given-names></name><name><surname>Nei</surname><given-names>M.</given-names></name></person-group><year>2016</year><fpage>1618</fpage><lpage>1624</lpage><page-range>1618-1624</page-range><pub-id pub-id-type="doi">10.1093/molbev/msw042</pub-id></element-citation></ref><ref id="BIBR-32"><element-citation publication-type="article-journal"><article-title>MUC16: clinical targets with great potential</article-title><source>Clinical and Experimental Medicine</source><volume>24</volume><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>X.</given-names></name><name><surname>Hong</surname><given-names>L.</given-names></name><name><surname>Ling</surname><given-names>Z.</given-names></name></person-group><year>2024</year><page-range>101</page-range><pub-id pub-id-type="doi">10.1007/s10238-024-01365-5</pub-id></element-citation></ref></ref-list></back></article>