<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article SYSTEM "http://jats.nlm.nih.gov/archiving/1.2/JATS-archivearticle1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="1.2" article-type="research-article" xml:lang="en"><?properties open_access?><front><journal-meta><journal-id journal-id-type="publisher-id">41467</journal-id><journal-id journal-id-type="doi">10.1038/41467.2041-1723</journal-id><journal-title-group><journal-title>Nature Communications</journal-title><abbrev-journal-title abbrev-type="publisher">Nat Commun</abbrev-journal-title></journal-title-group><issn pub-type="epub">2041-1723</issn><publisher><publisher-name>Nature Publishing Group UK</publisher-name><publisher-loc>London</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">s41467-021-26166-2</article-id><article-id pub-id-type="manuscript">26166</article-id><article-id pub-id-type="doi">10.1038/s41467-021-26166-2</article-id><article-categories><subj-group subj-group-type="heading"><subject>Article</subject></subj-group><subj-group subj-group-type="SubjectPath"><subject>/631/181/2474</subject></subj-group><subj-group subj-group-type="SubjectPath"><subject>/631/181/735</subject></subj-group><subj-group subj-group-type="SubjectPath"><subject>/631/208/177</subject></subj-group><subj-group subj-group-type="SubjectPath"><subject>/631/208/514/1948</subject></subj-group><subj-group subj-group-type="TechniquePath"><subject>/38/39</subject></subj-group><subj-group subj-group-type="TechniquePath"><subject>/45</subject></subj-group><subj-group subj-group-type="TechniquePath"><subject>/45/91</subject></subj-group><subj-group subj-group-type="TechniquePath"><subject>/45/23</subject></subj-group><subj-group subj-group-type="TechniquePath"><subject>/45/22</subject></subj-group><subj-group subj-group-type="TechniquePath"><subject>/49</subject></subj-group><subj-group subj-group-type="TechniquePath"><subject>/49/91</subject></subj-group><subj-group subj-group-type="TechniquePath"><subject>/49/23</subject></subj-group><subj-group subj-group-type="TechniquePath"><subject>/64</subject></subj-group><subj-group subj-group-type="NatureArticleTypeID"><subject>article</subject></subj-group></article-categories><title-group><article-title xml:lang="en">Mapping epigenetic divergence in the massive radiation of Lake Malawi cichlid fishes</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes" id="Au1"><contrib-id contrib-id-type="orcid">http://orcid.org/0000-0001-8942-2370</contrib-id><name><surname>Vernaz</surname><given-names>Grégoire</given-names></name><xref ref-type="aff" rid="Aff1">1</xref><xref ref-type="aff" rid="Aff2">2</xref><xref ref-type="aff" rid="Aff3">3</xref><xref ref-type="corresp" rid="IDs41467021261662_cor1">a</xref></contrib><contrib contrib-type="author" id="Au2"><contrib-id contrib-id-type="orcid">http://orcid.org/0000-0002-1462-6317</contrib-id><name><surname>Malinsky</surname><given-names>Milan</given-names></name><xref ref-type="aff" rid="Aff3">3</xref><xref ref-type="aff" rid="Aff7">7</xref></contrib><contrib contrib-type="author" id="Au3"><name><surname>Svardal</surname><given-names>Hannes</given-names></name><xref ref-type="aff" rid="Aff3">3</xref><xref ref-type="aff" rid="Aff8">8</xref><xref ref-type="aff" rid="Aff9">9</xref></contrib><contrib contrib-type="author" id="Au4"><name><surname>Du</surname><given-names>Mingliu</given-names></name><xref ref-type="aff" rid="Aff1">1</xref><xref ref-type="aff" rid="Aff2">2</xref><xref ref-type="aff" rid="Aff3">3</xref></contrib><contrib contrib-type="author" id="Au5"><name><surname>Tyers</surname><given-names>Alexandra M.</given-names></name><xref ref-type="aff" rid="Aff4">4</xref><xref ref-type="aff" rid="Aff10">10</xref></contrib><contrib contrib-type="author" id="Au6"><contrib-id contrib-id-type="orcid">http://orcid.org/0000-0003-3158-7935</contrib-id><name><surname>Santos</surname><given-names>M. Emília</given-names></name><xref ref-type="aff" rid="Aff5">5</xref></contrib><contrib contrib-type="author" id="Au7"><contrib-id contrib-id-type="orcid">http://orcid.org/0000-0002-9130-1006</contrib-id><name><surname>Durbin</surname><given-names>Richard</given-names></name><xref ref-type="aff" rid="Aff2">2</xref><xref ref-type="aff" rid="Aff3">3</xref></contrib><contrib contrib-type="author" id="Au8"><contrib-id contrib-id-type="orcid">http://orcid.org/0000-0003-1117-9168</contrib-id><name><surname>Genner</surname><given-names>Martin J.</given-names></name><xref ref-type="aff" rid="Aff6">6</xref></contrib><contrib contrib-type="author" id="Au9"><contrib-id contrib-id-type="orcid">http://orcid.org/0000-0003-0099-7261</contrib-id><name><surname>Turner</surname><given-names>George F.</given-names></name><xref ref-type="aff" rid="Aff4">4</xref></contrib><contrib contrib-type="author" corresp="yes" id="Au10"><contrib-id contrib-id-type="orcid">http://orcid.org/0000-0002-4450-576X</contrib-id><name><surname>Miska</surname><given-names>Eric A.</given-names></name><xref ref-type="aff" rid="Aff1">1</xref><xref ref-type="aff" rid="Aff2">2</xref><xref ref-type="aff" rid="Aff3">3</xref><xref ref-type="corresp" rid="IDs41467021261662_cor10">k</xref></contrib><aff id="Aff1"><label>1</label><institution-wrap><institution-id institution-id-type="GRID">grid.5335.0</institution-id><institution-id institution-id-type="ISNI">0000000121885934</institution-id><institution content-type="org-division">Wellcome/CRUK Gurdon Institute</institution><institution content-type="org-name">University of Cambridge</institution></institution-wrap><addr-line content-type="city">Cambridge</addr-line><country country="GB">UK</country></aff><aff id="Aff2"><label>2</label><institution-wrap><institution-id institution-id-type="GRID">grid.5335.0</institution-id><institution-id institution-id-type="ISNI">0000000121885934</institution-id><institution content-type="org-division">Department of Genetics</institution><institution content-type="org-name">University of Cambridge</institution></institution-wrap><addr-line content-type="city">Cambridge</addr-line><country country="GB">UK</country></aff><aff id="Aff3"><label>3</label><institution-wrap><institution-id institution-id-type="GRID">grid.10306.34</institution-id><institution-id institution-id-type="ISNI">0000 0004 0606 5382</institution-id><institution content-type="org-name">Wellcome Sanger Institute</institution></institution-wrap><addr-line content-type="city">Cambridge</addr-line><country country="GB">UK</country></aff><aff id="Aff4"><label>4</label><institution-wrap><institution-id institution-id-type="GRID">grid.7362.0</institution-id><institution-id institution-id-type="ISNI">0000000118820937</institution-id><institution content-type="org-division">School of Natural Sciences</institution><institution content-type="org-name">Sciences, Bangor University</institution></institution-wrap><addr-line content-type="city">Bangor</addr-line><country country="GB">UK</country></aff><aff id="Aff5"><label>5</label><institution-wrap><institution-id institution-id-type="GRID">grid.5335.0</institution-id><institution-id institution-id-type="ISNI">0000000121885934</institution-id><institution content-type="org-division">Department of Zoology</institution><institution content-type="org-name">University of Cambridge</institution></institution-wrap><addr-line content-type="city">Cambridge</addr-line><country country="GB">UK</country></aff><aff id="Aff6"><label>6</label><institution-wrap><institution-id institution-id-type="GRID">grid.5337.2</institution-id><institution-id institution-id-type="ISNI">0000 0004 1936 7603</institution-id><institution content-type="org-division">School of Biological Sciences</institution><institution content-type="org-name">University of Bristol</institution></institution-wrap><addr-line content-type="city">Bristol</addr-line><country country="GB">UK</country></aff><aff id="Aff7"><label>7</label><institution-wrap><institution-id institution-id-type="GRID">grid.5734.5</institution-id><institution-id institution-id-type="ISNI">0000 0001 0726 5157</institution-id><institution content-type="org-division">Institute of Ecology and Evolution</institution><institution content-type="org-name">University of Bern</institution></institution-wrap><addr-line content-type="city">Bern</addr-line><country country="CH">Switzerland</country></aff><aff id="Aff8"><label>8</label><institution-wrap><institution-id institution-id-type="GRID">grid.5284.b</institution-id><institution-id institution-id-type="ISNI">0000 0001 0790 3681</institution-id><institution content-type="org-division">Department of Biology</institution><institution content-type="org-name">University of Antwerp</institution></institution-wrap><addr-line content-type="city">Antwerp</addr-line><country country="BE">Belgium</country></aff><aff id="Aff9"><label>9</label><institution-wrap><institution-id institution-id-type="GRID">grid.425948.6</institution-id><institution-id institution-id-type="ISNI">0000 0001 2159 802X</institution-id><institution content-type="org-name">Naturalis Biodiversity Center</institution></institution-wrap><addr-line content-type="city">Leiden</addr-line><country country="NL">The Netherlands</country></aff><aff id="Aff10"><label>10</label><institution-wrap><institution-id institution-id-type="GRID">grid.419502.b</institution-id><institution-id institution-id-type="ISNI">0000 0004 0373 6590</institution-id><institution content-type="org-name">Max Planck Institute for Biology of Ageing</institution></institution-wrap><addr-line content-type="city">Cologne</addr-line><country country="DE">Germany</country></aff></contrib-group><author-notes><corresp id="IDs41467021261662_cor1"><label>a</label><email>gv268@cam.ac.uk</email></corresp><corresp id="IDs41467021261662_cor10"><label>k</label><email>eam29@cam.ac.uk</email></corresp></author-notes><pub-date date-type="pub" publication-format="electronic"><day>7</day><month>10</month><year>2021</year></pub-date><pub-date date-type="collection" publication-format="electronic"><month>12</month><year>2021</year></pub-date><volume>12</volume><issue seq="25777">1</issue><elocation-id>5870</elocation-id><history><date date-type="registration"><day>23</day><month>9</month><year>2021</year></date><date date-type="received"><day>7</day><month>1</month><year>2021</year></date><date date-type="accepted"><day>14</day><month>9</month><year>2021</year></date><date date-type="online"><day>7</day><month>10</month><year>2021</year></date></history><permissions><copyright-statement>© Crown 2021</copyright-statement><copyright-year>2021</copyright-year><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/"><license-p><bold>Open Access</bold> This article is licensed under a Creative Commons Attribution 4.0 International License, which permits use, sharing, adaptation, distribution and reproduction in any medium or format, as long as you give appropriate credit to the original author(s) and the source, provide a link to the Creative Commons license, and indicate if changes were made. The images or other third party material in this article are included in the article’s Creative Commons license, unless indicated otherwise in a credit line to the material. If material is not included in the article’s Creative Commons license and your intended use is not permitted by statutory regulation or exceeds the permitted use, you will need to obtain permission directly from the copyright holder. To view a copy of this license, visit <ext-link xlink:href="http://creativecommons.org/licenses/by/4.0/" ext-link-type="url">http://creativecommons.org/licenses/by/4.0/</ext-link>.</license-p></license></permissions><abstract id="Abs1" xml:lang="en"><title>Abstract</title><p id="Par1">Epigenetic variation modulates gene expression and can be heritable. However, knowledge of the contribution of epigenetic divergence to adaptive diversification in nature remains limited. The massive evolutionary radiation of Lake Malawi cichlid fishes displaying extensive phenotypic diversity despite extremely low sequence divergence is an excellent system to study the epigenomic contribution to adaptation. Here, we present a comparative genome-wide methylome and transcriptome study, focussing on liver and muscle tissues in phenotypically divergent cichlid species. In both tissues we find substantial methylome divergence among species. Differentially methylated regions (DMR), enriched in evolutionary young transposons, are associated with transcription changes of ecologically-relevant genes related to energy expenditure and lipid metabolism, pointing to a link between dietary ecology and methylome divergence. Unexpectedly, half of all species-specific DMRs are shared across tissues and are enriched in developmental genes, likely reflecting distinct epigenetic developmental programmes. Our study reveals substantial methylome divergence in closely-related cichlid fishes and represents a resource to study the role of epigenetics in species diversification.</p></abstract><abstract id="Abs2" xml:lang="en"><p id="Par2">The Lake Malawi cichlid fishes are an example of extreme vertebrate radiation; however, there is very little sequence divergence among the species. Here the authors present a comparative genome-wide methylome study to suggest DNA methylation played a major role in the extensive phenotypic diversity amongst these fishes.</p></abstract><funding-group><award-group><funding-source><institution-wrap><institution>Wellcome Trust (Wellcome)</institution><institution-id institution-id-type="doi" vocab="open-funder-registry">https://doi.org/10.13039/100004440</institution-id></institution-wrap></funding-source><award-id award-type="FundRef grant">104640/Z/14/Z; 219475/Z/19/Z</award-id><principal-award-recipient><name><surname>Miska</surname><given-names>Eric A.</given-names></name></principal-award-recipient></award-group><award-group><funding-source><institution-wrap><institution>Cancer Research UK (CRUK)</institution><institution-id institution-id-type="doi" vocab="open-funder-registry">https://doi.org/10.13039/501100000289</institution-id></institution-wrap></funding-source><award-id award-type="FundRef grant">C13474/A27826</award-id><principal-award-recipient><name><surname>Miska</surname><given-names>Eric A.</given-names></name></principal-award-recipient></award-group></funding-group><custom-meta-group><custom-meta><meta-name>publisher-imprint-name</meta-name><meta-value>Nature Portfolio</meta-value></custom-meta><custom-meta><meta-name>volume-issue-count</meta-name><meta-value>1</meta-value></custom-meta><custom-meta><meta-name>issue-article-count</meta-name><meta-value>5872</meta-value></custom-meta><custom-meta><meta-name>issue-toc-levels</meta-name><meta-value>0</meta-value></custom-meta><custom-meta><meta-name>issue-pricelist-year</meta-name><meta-value>2021</meta-value></custom-meta><custom-meta><meta-name>issue-copyright-holder</meta-name><meta-value>The Author(s)</meta-value></custom-meta><custom-meta><meta-name>issue-copyright-year</meta-name><meta-value>2021</meta-value></custom-meta><custom-meta><meta-name>article-contains-esm</meta-name><meta-value>Yes</meta-value></custom-meta><custom-meta><meta-name>article-numbering-style</meta-name><meta-value>Unnumbered</meta-value></custom-meta><custom-meta><meta-name>article-registration-date-year</meta-name><meta-value>2021</meta-value></custom-meta><custom-meta><meta-name>article-registration-date-month</meta-name><meta-value>9</meta-value></custom-meta><custom-meta><meta-name>article-registration-date-day</meta-name><meta-value>23</meta-value></custom-meta><custom-meta><meta-name>article-toc-levels</meta-name><meta-value>0</meta-value></custom-meta><custom-meta><meta-name>toc-levels</meta-name><meta-value>0</meta-value></custom-meta><custom-meta><meta-name>volume-type</meta-name><meta-value>Regular</meta-value></custom-meta><custom-meta><meta-name>journal-product</meta-name><meta-value>NonStandardArchiveJournal</meta-value></custom-meta><custom-meta><meta-name>numbering-style</meta-name><meta-value>Unnumbered</meta-value></custom-meta><custom-meta><meta-name>article-grants-type</meta-name><meta-value>OpenChoice</meta-value></custom-meta><custom-meta><meta-name>metadata-grant</meta-name><meta-value>OpenAccess</meta-value></custom-meta><custom-meta><meta-name>abstract-grant</meta-name><meta-value>OpenAccess</meta-value></custom-meta><custom-meta><meta-name>bodypdf-grant</meta-name><meta-value>OpenAccess</meta-value></custom-meta><custom-meta><meta-name>bodyhtml-grant</meta-name><meta-value>OpenAccess</meta-value></custom-meta><custom-meta><meta-name>bibliography-grant</meta-name><meta-value>OpenAccess</meta-value></custom-meta><custom-meta><meta-name>esm-grant</meta-name><meta-value>OpenAccess</meta-value></custom-meta><custom-meta><meta-name>online-first</meta-name><meta-value>false</meta-value></custom-meta><custom-meta><meta-name>pdf-file-reference</meta-name><meta-value>BodyRef/PDF/41467_2021_Article_26166.pdf</meta-value></custom-meta><custom-meta><meta-name>pdf-type</meta-name><meta-value>Typeset</meta-value></custom-meta><custom-meta><meta-name>target-type</meta-name><meta-value>OnlinePDF</meta-value></custom-meta><custom-meta><meta-name>issue-type</meta-name><meta-value>Regular</meta-value></custom-meta><custom-meta><meta-name>article-type</meta-name><meta-value>OriginalPaper</meta-value></custom-meta><custom-meta><meta-name>journal-subject-primary</meta-name><meta-value>Science, Humanities and Social Sciences, multidisciplinary</meta-value></custom-meta><custom-meta><meta-name>journal-subject-secondary</meta-name><meta-value>Science, Humanities and Social Sciences, multidisciplinary</meta-value></custom-meta><custom-meta><meta-name>journal-subject-secondary</meta-name><meta-value>Science, multidisciplinary</meta-value></custom-meta><custom-meta><meta-name>journal-subject-collection</meta-name><meta-value>Science (multidisciplinary)</meta-value></custom-meta><custom-meta><meta-name>open-access</meta-name><meta-value>true</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="Sec1" sec-type="introduction"><title>Introduction</title><p id="Par3">Trait inheritance and phenotypic diversification are primarily explained by the transmission of genetic information encoded in the DNA sequence. In addition, a variety of epigenetic processes have recently been reported to mediate heritable transmission of phenotypes in animals and plants<sup><xref ref-type="bibr" rid="CR1">1</xref>–<xref ref-type="bibr" rid="CR7">7</xref></sup>. However, the current understanding of the evolutionary significance of epigenetic processes, and of their roles in organismal diversification, is in its infancy.</p><p id="Par4">DNA methylation, or the covalent addition of a methyl group onto the 5th carbon of cytosine (mC) in DNA, is a reversible epigenetic mark present across multiple kingdoms<sup><xref ref-type="bibr" rid="CR8">8</xref>–<xref ref-type="bibr" rid="CR10">10</xref></sup>, can be heritable, and has been linked to transmission of acquired phenotypes in plants and animals<sup><xref ref-type="bibr" rid="CR2">2</xref>,<xref ref-type="bibr" rid="CR5">5</xref>,<xref ref-type="bibr" rid="CR6">6</xref>,<xref ref-type="bibr" rid="CR11">11</xref>–<xref ref-type="bibr" rid="CR13">13</xref></sup>. The importance of this mechanism is underlined by the fact that proteins involved in the deposition of mC (‘writers’, DNA methyltransferases [DNMTs]), in mC maintenance during cell division, and in the removal of mC (‘erasers’, ten-eleven translocation methylcytosine dioxygenases [TETs]), are mostly essential and show high degrees of conservation across vertebrates species<sup><xref ref-type="bibr" rid="CR14">14</xref>–<xref ref-type="bibr" rid="CR17">17</xref></sup>. In addition, some ancestral functions of methylated cytosines are highly conserved, such as in the transcriptional silencing of exogenous genomic elements (transposons)<sup><xref ref-type="bibr" rid="CR18">18</xref>,<xref ref-type="bibr" rid="CR19">19</xref></sup>. In vertebrates, DNA methylation functions have evolved to play an important role in the orchestration of cell differentiation during normal embryogenesis/development through complex interactions with histone post-translational modifications (DNA accessibility) and mC-sensitive readers (such as transcription factors)<sup><xref ref-type="bibr" rid="CR19">19</xref>–<xref ref-type="bibr" rid="CR25">25</xref></sup>, in particular at <italic>cis</italic>-regulatory regions (i.e., promoters, enhancers). Early-life establishment of stable DNA methylation patterns can thus affect transcriptional activity in the embryo and persist into fully differentiated cells<sup><xref ref-type="bibr" rid="CR26">26</xref></sup>. DNA methylation variation has also been postulated to have evolved in the context of natural selection by promoting phenotypic plasticity and thus possibly facilitating adaptation, speciation, and adaptive radiation<sup><xref ref-type="bibr" rid="CR2">2</xref>,<xref ref-type="bibr" rid="CR4">4</xref>,<xref ref-type="bibr" rid="CR12">12</xref>,<xref ref-type="bibr" rid="CR27">27</xref></sup>.</p><p id="Par5">Studies in plants have revealed how covarying environmental factors and DNA methylation variation underlie stable and heritable transcriptional changes in adaptive traits<sup><xref ref-type="bibr" rid="CR2">2</xref>,<xref ref-type="bibr" rid="CR6">6</xref>,<xref ref-type="bibr" rid="CR11">11</xref>–<xref ref-type="bibr" rid="CR13">13</xref>,<xref ref-type="bibr" rid="CR28">28</xref></sup>. Some initial evidence is also present in vertebrates<sup><xref ref-type="bibr" rid="CR2">2</xref>,<xref ref-type="bibr" rid="CR5">5</xref>,<xref ref-type="bibr" rid="CR29">29</xref>–<xref ref-type="bibr" rid="CR31">31</xref></sup>. In the cavefish, for example, an early developmental process—eye degeneration—has been shown to be mediated by DNA methylation, suggesting mC variation as an evolutionary factor generating adaptive phenotypic plasticity during development and evolution<sup><xref ref-type="bibr" rid="CR29">29</xref>,<xref ref-type="bibr" rid="CR32">32</xref></sup>. However, whether correlations between environmental variation and DNA methylation patterns promote phenotypic diversification more widely among natural vertebrate populations remains unknown.</p><p id="Par6">In this study, we sought to quantify, map and characterise natural divergence in DNA methylation in the context of the Lake Malawi haplochromine cichlid adaptive radiation, one of the most spectacular examples of rapid vertebrate phenotypic diversification<sup><xref ref-type="bibr" rid="CR33">33</xref></sup>. In total, the radiation comprises over 800 endemic species<sup><xref ref-type="bibr" rid="CR34">34</xref></sup>, that are estimated to have evolved from common ancestry approximately 800,000 years ago<sup><xref ref-type="bibr" rid="CR35">35</xref></sup>. Species within the radiation can be grouped into seven distinct ecomorphological groups based on their ecology, morphology, and genetic differences: (1) shallow benthic, (2) deep benthic, (3) deep pelagic zooplanktivorous/piscivorous <italic>Diplotaxodon</italic>, (4) the rock-dwelling ‛mbuna’, (5) zooplanktivorous ‛utaka’, (6) <italic>Astatotilapia calliptera</italic> specialised for shallow weedy habitats (also found in surrounding rivers and lakes), and (7) the midwater pelagic piscivores <italic>Rhamphochromis</italic><sup><xref ref-type="bibr" rid="CR36">36</xref>,<xref ref-type="bibr" rid="CR37">37</xref></sup>. Recent large-scale genetic studies have revealed that the Lake Malawi cichlid flock is characterised by an overall very low genetic divergence among species (0.1−0.25%), combined with a low mutation rate, a high rate of hybridisation and extensive incomplete lineage sorting (shared retention of ancestral genetic variation across species)<sup><xref ref-type="bibr" rid="CR34">34</xref>,<xref ref-type="bibr" rid="CR36">36</xref>,<xref ref-type="bibr" rid="CR38">38</xref>,<xref ref-type="bibr" rid="CR39">39</xref></sup>. Multiple molecular mechanisms may be at work to enable such an explosive phenotypic diversification. Therefore, investigating the epigenetic mechanisms in Lake Malawi cichlids represents a remarkable opportunity to expand our comprehension of the processes underlying phenotypic diversification and adaptation.</p><p id="Par7">Here we describe, quantify, and assess the divergence in liver methylomes in six cichlid species spanning five of the seven ecomorphological groups of the Lake Malawi haplochromine radiation by generating high-coverage whole-genome liver bisulfite sequencing (WGBS). We find that Lake Malawi haplochromine cichlids exhibit substantial methylome divergence, despite conserved underlying DNA sequences, and are enriched in evolutionary young transposable elements. Next, we generated whole liver transcriptome sequencing (RNAseq) in four of the six species and showed that differential transcriptional activity is significantly associated with between-species methylome divergence, most prominently in genes involved in key hepatic metabolic functions. Finally, by generating WGBS from muscle tissues in three cichlid species, we show that half of methylome divergence between species is tissue-unspecific and pertains to embryonic and developmental processes, possibly contributing to the early establishment of phenotypic diversity. This represents a comparative analysis of natural methylome variation in Lake Malawi cichlids and provides initial evidence for substantial species-specific epigenetic divergence in <italic>cis</italic>-regulatory regions of ecologically-relevant genes. Our study represents a resource that lays the groundwork for future epigenomic research in the context of phenotypic diversification and adaptation.</p></sec><sec id="Sec2" sec-type="results"><title>Results</title><sec id="Sec3"><title>The methylomes of Lake Malawi cichlids feature conserved vertebrate characteristics</title><p id="Par8">To characterise the methylome variation and assess possible functional relationships in natural populations of Lake Malawi cichlids, we performed high-coverage whole-genome bisulfite sequencing of methylomes (WGBS) from liver tissues of six different cichlid species. Muscle methylome (WGBS) data for three of the six species were also generated to assess the extent to which methylome divergence was tissue-specific. Moreover, to examine the correlation between transcriptome and methylome divergences, total transcriptomes (RNAseq) from both liver and muscle tissues of four species were generated. Only wild-caught male specimens (2−3 biological replicates for each tissue and each species) were used for all sequencing datasets (Fig. <xref rid="Fig1" ref-type="fig">1a–c</xref>, Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">1</xref>, Supplementary Data <xref ref-type="supplementary-material" rid="MOESM4">1</xref>, and Supplementary Table <xref ref-type="supplementary-material" rid="MOESM1">1</xref>). The species selected were: <italic>Rhamphochromis longiceps</italic> (RL), a pelagic piscivore (Rhamphochromis group); <italic>Diplotaxodon limnothrissa</italic> (DL), <italic>a</italic> deep-water pelagic carnivore (Diplotaxodon group); <italic>Maylandia zebra</italic> (MZ) and <italic>Petrotilapia genalutea</italic> (PG), two rock-dwelling algae eaters (Mbuna group); <italic>Aulonocara stuartgranti</italic> (AS), a benthic invertebrate-eating sand/rock-dweller that is genetically part of the deep-benthic group; <italic>Astatotilapia calliptera</italic> (AC), a species of rivers and lake margins<sup><xref ref-type="bibr" rid="CR40">40</xref></sup> (Fig. <xref rid="Fig1" ref-type="fig">1b</xref>).<fig id="Fig1"><label>Fig. 1</label><caption xml:lang="en"><title>The methylome of Lake Malawi cichlids.</title><p><bold>a</bold> Map of Africa (main river systems are highlighted in white) and magnification of Lake Malawi (scale bar: 40 km). <bold>b</bold> Photographs (not to scale) of the six Lake Malawi cichlid species part of this study spanning five of the seven described eco-morphological groups. The symbols represent the different habitats (pelagic/benthic [wave symbol], rock/sand-dwelling/littoral [rock symbol] and adjacent rivers part of Lake Malawi catchment), and the type of diet (fish, fish/zooplankton, algae, invertebrates) for each group. The species representing each group are indicated by their initials (see below). <bold>c</bold> Diagram summarising the sampling and sequencing strategies for liver and muscle methylome (whole-genome bisulfite sequencing, WGBS) and whole transcriptome (RNAseq) datasets. See “Methods”, Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">1</xref> and Supplementary Table <xref ref-type="supplementary-material" rid="MOESM1">1</xref>. <bold>d</bold> Violin plots showing the distribution of liver DNA methylation levels in CG sequence context (averaged mCG/CG levels over 50 bp-long bins genome-wide) in different genomic regions: overall, gene bodies, exons, promoter regions (TSS ± 500 bp), CpG-islands in promoters and outside (orphan) and in repeat/transposon regions. mC levels for two different repeat classes are given: DNA transposon superfamily Tc2-Mariner (<italic>n</italic> = 5,378) and LINE I (<italic>n</italic> = 407). <bold>e</bold> Average liver mCG profiles across genes differ depending on their transcriptional activity in liver: from non-expressed (0) to genes showing low (1), intermediate (2), high (3) and highest (4) expression levels (“Methods”). Results shown in (<bold>d,</bold><bold>e</bold>) are for Mbuna MZ (liver, <italic>n</italic> = 3) and are representative of the results for all other species, and are based on average mC/C in 50 bp non-overlapping windows. <italic>RL, Rhamphochromis longiceps; DL, Diplotaxodon limnothrissa; MZ, Maylandia zebra; PG, Petrotilapia genalutea; AS, Aulonocara stuartgranti; AC, Astatotilapia calliptera</italic>. Credits—Fish photographs: Hannes Svardal and M. Emília Santos. Geographical map modified from <ext-link xlink:href="http://www.d-maps.com/" ext-link-type="url">www.d-maps.com/</ext-link>.</p></caption><p><graphic specific-use="HTML" mime-subtype="PNG" xlink:href="MediaObjects/41467_2021_26166_Fig1_HTML.png"/></p></fig></p><p id="Par9">On average, 285.51 ± 55.6 million paired-end reads (see Supplementary Data <xref ref-type="supplementary-material" rid="MOESM4">1</xref>) for liver and muscle methylomes were generated with WGBS, yielding ~10−15x per-sample coverage at CG dinucleotide sites (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">2a−d</xref>; see “Methods” and <xref ref-type="supplementary-material" rid="MOESM1">Supplementary Notes</xref>). To account for species-specific genotype and avoid methylation biases due to species-specific single nucleotide polymorphism (SNP), WGBS reads were mapped to SNP-corrected versions of the <italic>Maylandia zebra</italic> reference genome (UMD2a; see Methods). Mapping rates were not significantly different among all WGBS samples (Dunn’s test with Bonferroni correction, <italic>p</italic> &gt; 0.05; Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">2e</xref>), reflecting the high level of conservation at the DNA sequence level across the Malawi radiation (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">3</xref>). In parallel, liver and muscle transcriptomes were generated for four species using the same specimens as used for WGBS, yielding on average 11.9 ± 0.7 million paired-end reads (mean ± sd; Fig. <xref rid="Fig1" ref-type="fig">1c</xref>, Supplementary Data <xref ref-type="supplementary-material" rid="MOESM4">1</xref> and “Methods”).</p><p id="Par10">We first characterised global features of the methylome of Lake Malawi cichlids. The genome of Lake Malawi cichlid was found to have copies of DNA methyltransferases (DNMTs) and ten-eleven translocation methylcytosine dioxygenases (TETs), the ‘readers’ and ‘erasers’ of DNA methylation respectively (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">4a−c</xref>). Like that of mammals and other teleost fish, the genomes of Lake Malawi cichlids have high levels of DNA methylation genome-wide in the CG dinucleotide sequence context, consistently across all samples in both tissues analysed (Fig. <xref rid="Fig1" ref-type="fig">1d</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">2a−c</xref>). Gene bodies generally show higher methylation levels than the genome-wide average, while the majority of promoter regions are unmethylated (Fig. <xref rid="Fig1" ref-type="fig">1d</xref>). CpG islands (CGIs; i.e., CpG-rich regions—abundant in Lake Malawi cichlid genomes; Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">5a−i</xref>, <xref ref-type="supplementary-material" rid="MOESM1">Supplementary Notes</xref> and Methods) are almost entirely devoid of methylation in promoters, while ‘orphan’ CGIs, residing outside promoters, are mostly highly methylated (Fig. <xref rid="Fig1" ref-type="fig">1d</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">5f, g</xref>). While 70% of mammalian promoters contain CGIs<sup><xref ref-type="bibr" rid="CR41">41</xref></sup>, only 15−20% of promoters in Lake Malawi cichlids harbour CGIs (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">5d</xref>), similar to frog and zebrafish genomes<sup><xref ref-type="bibr" rid="CR41">41</xref></sup>. Notably, orphan CGIs, which may have important <italic>cis</italic>-regulatory functions<sup><xref ref-type="bibr" rid="CR42">42</xref></sup>, compose up to 80% of all predicted CGIs in Lake Malawi cichlids (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">5e</xref>). Furthermore, repetitive regions, as well as transposable elements, are particularly enriched for cytosine methylation, suggesting a methylation-mediated silencing of their transcription (Fig. <xref rid="Fig1" ref-type="fig">1d</xref>, Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">6a−d</xref>), similar to that observed in zebrafish and other animals<sup><xref ref-type="bibr" rid="CR8">8</xref>,<xref ref-type="bibr" rid="CR18">18</xref></sup>. Interestingly, certain transposon families, such as LINE I and Tc2-<italic>Mariner</italic>, part of the DNA transposon family—the most abundant TE family predicted in Lake Malawi cichlid genome (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">6a, b</xref>, <xref ref-type="supplementary-material" rid="MOESM1">Supplementary Notes</xref>, and ref. <sup><xref ref-type="bibr" rid="CR38">38</xref></sup>)—have recently expanded considerably in the Mbuna genome (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">6c</xref> and refs. <sup><xref ref-type="bibr" rid="CR38">38</xref>,<xref ref-type="bibr" rid="CR43">43</xref></sup>). While Tc2-<italic>Mar</italic> DNA transposons show the highest median methylation levels, LINE I elements have some of the lowest, yet most variable, methylation levels of all transposon families, which correlates with their evolutionary recent expansion in the genome (Fig. <xref rid="Fig1" ref-type="fig">1d, e</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">6d, e</xref>). Finally, transcriptional activity in liver and muscle tissues of Lake Malawi cichlids was negatively correlated with methylation in promoter regions (Spearman’s correlation test, <italic>ρ</italic> = −0.40, <italic>p</italic> &lt; 0.002), while being weakly positively correlated with methylation in gene bodies (<italic>ρ</italic> = 0.1, <italic>p</italic> &lt; 0.002; Fig. <xref rid="Fig1" ref-type="fig">1e</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">7a−d</xref> and Supplementary Table <xref ref-type="supplementary-material" rid="MOESM1">2</xref>). This is consistent with previous studies highlighting high methylation levels in bodies of active genes in plants and animals, and high levels of methylation at promoters of weakly expressed genes in vertebrates<sup><xref ref-type="bibr" rid="CR8">8</xref>,<xref ref-type="bibr" rid="CR24">24</xref></sup>. We conclude that the methylomes of Lake Malawi cichlids share many regulatory features, and possibly associated functions, with those of other vertebrates, which renders Lake Malawi cichlids a promising model system in this context.</p></sec><sec id="Sec4"><title>Methylome divergence in Lake Malawi cichlids</title><p id="Par11">To assess the possible role of DNA methylation in phenotypic diversification, we then sought to quantify and characterise the differences in liver and muscle methylomes across the genomes of Lake Malawi haplochromine cichlids. Despite overall very low sequence divergence<sup><xref ref-type="bibr" rid="CR36">36</xref></sup> (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">3</xref>), Lake Malawi cichlids were found to show substantial methylome divergence across species within each tissue type, while within-species biological replicates always clustered together (Fig. <xref rid="Fig2" ref-type="fig">2a</xref>). The species relationships inferred by clustering of the liver methylomes at conserved individual CG dinucleotides recapitulate some of the genetic relationship inferred from DNA sequence<sup><xref ref-type="bibr" rid="CR36">36</xref></sup>, with one exception—the methylome clusters <italic>A. calliptera</italic> samples as an outgroup, not a sister group to Mbuna (Fig. <xref rid="Fig2" ref-type="fig">2a</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">3a, b</xref>). This is consistent with its unique position as a riverine species, while all species are obligate lake dwellers (Fig. <xref rid="Fig1" ref-type="fig">1b</xref>).<fig id="Fig2"><label>Fig. 2</label><caption xml:lang="en"><title>Species-specific methylome divergence in Lake Malawi cichlids is enriched in promoters, CpG-islands, and young transposons.</title><p><bold>a</bold> Unbiased hierarchical clustering and heatmap of Spearman’s rank correlation scores for genome-wide methylome variation in Lake Malawi cichlids at conserved CG dinucleotides. Dotted boxes group samples by species within each tissue. <bold>b</bold> Observed/Expected ratios (O/E ratio, enrichment) for some genomic localisations of differentially methylated regions (DMRs) predicted between livers (green) and between muscles (purple) of three Lake Malawi cichlid species, and between tissues (within-species, grey); <italic>χ</italic><sup>2</sup> tests for between categories (<italic>p</italic> &lt; 0.0001), for O/E between liver and muscle DMRs (<italic>p</italic> = 0.99) and between Liver+Muscle vs Tissues <italic>(p</italic> = 0.04). Expected values were determined by randomly shuffling DMRs of each DMR type across the genome (1000 iterations). Categories are not mutually exclusive. <bold>c</bold> Gene ontology (GO) enrichment for DMRs found between liver methylomes localised in promoters. GO terms: Kyoto Encyclopaedia of Genes and Genomes (KEGG), molecular functions (MF), cellular component (CC), and biological processes (BP). Only GO terms with FDR &lt; 0.05 shown. <italic>N</italic> indicates the number of genes associated with each GO term. Only GO terms with <italic>p</italic> &lt; 0.05 (Benjamini−Hochberg false discovery rate [FDR]-corrected <italic>p</italic>-values) are shown. <bold>d</bold> Genomic localisation of liver DMRs containing repeats/transposons (TE-DMRs). <bold>e</bold>. O/E ratios for species TE-DMRs for each TE family. Only O/E ≥ 2 and ≤0.5 shown. <italic>χ</italic><sup>2</sup> tests, <italic>p</italic> &lt; 0.0001. <bold>f</bold> Violin plots showing TE sequence divergence (namely, CpG-adjusted Kimura substitution level as given by RepeatMasker) in <italic>M. zebra</italic> genome for species TE-DMRs, TEs outside species DMRs (‘outside’) and randomly shuffled TE-DMRs (500 iterations, ‘shuffle’). Mean values indicated by red dots, median values by black lines and shown above each graph. Total DMR counts indicated below each graph. Two-sided <italic>p</italic>-values for Kruskal–Wallis test are shown above the graph. DMR, differentially methylated region; TE, repeat/transposon regions; CGI, predicted CpG islands.</p></caption><p><graphic specific-use="HTML" mime-subtype="PNG" xlink:href="MediaObjects/41467_2021_26166_Fig2_HTML.png"/></p></fig></p><p id="Par12">As DNA methylation variation tends to correlate over genomic regions consisting of several neighbouring CG sites, we defined and sought to characterise differentially methylated regions (DMRs) among Lake Malawi cichlid species (≥50 bp-long, ≥4 CG dinucleotide, and ≥25% methylation difference across any pair of species, <italic>p</italic> &lt; 0.05; see Methods). In total, 13,331 between-species DMRs were found among the liver methylomes of the six cichlid species (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">8a</xref>). We then compared the three species for which liver and muscle WGBS data were available and found 5,875 and 4,290 DMRs among the liver and muscle methylomes, respectively. By contrast, 27,165 within-species DMRs were found in the between-tissue comparisons (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">8b</xref>). Overall, DMRs in Lake Malawi cichlids were predicted to be as long as 5,000 bp (95% CI of median size: 282−298 bp; Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">8c</xref>). While the methylation differences between liver and muscle were the most prominent at single CG dinucleotide resolution (Fig. <xref rid="Fig2" ref-type="fig">2a</xref>) and resulted in the highest number of DMRs, we found DMRs to be slightly larger and methylation differences within them substantially stronger among species than between tissues (Dunn’s test, <italic>p</italic> &lt; 2.2 × 10<sup>−16</sup>; Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">8c, d</xref>).</p><p id="Par13">Next, we characterised the genomic features enriched for between-species methylome divergence in the three cichlid species for which both muscle and liver WGBS data were available (i.e., RL, PG, DL; Fig. <xref rid="Fig1" ref-type="fig">1c</xref>). In the liver, promoter regions and orphan CGIs have 3.0- and 3.6-fold enrichment respectively for between-species liver DMRs over random expectation (<italic>χ</italic><sup>2</sup> test, <italic>p</italic> &lt; 0.0001; Fig. <xref rid="Fig2" ref-type="fig">2b</xref>)—between-species muscle DMRs show similar patterns as well (<italic>p</italic> = 0.99, compared to liver O/E ratios). Methylome variation at promoter regions has been shown to affect transcription activity via a number of mechanisms (e.g., transcription factor binding affinity, chromatin accessibility)<sup><xref ref-type="bibr" rid="CR21">21</xref>,<xref ref-type="bibr" rid="CR44">44</xref></sup> and, in this way, may participate in phenotypic adaptive diversification in Lake Malawi cichlids. In particular, genes with DMRs in their promoter regions show enrichment for enzymes involved in hepatic metabolic functions (Fig. <xref rid="Fig2" ref-type="fig">2c</xref>). Furthermore, the high enrichment of DMRs in intergenic orphan CGIs (Fig. <xref rid="Fig2" ref-type="fig">2b</xref>), accounting for <italic>n</italic> = 691 (11.94%) of total liver DMRs, suggests that intergenic CGIs may have DNA methylation-mediated regulatory functions.</p><p id="Par14">The majority of between-species liver DMRs (65.0%, <italic>n</italic> = 3,764) are within TE regions (TE-DMRs; Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">8a, b, e</xref>), approximately two-thirds of which are located in unannotated intergenic regions (Fig. <xref rid="Fig2" ref-type="fig">2d</xref>). However, a small fraction of TE-DMRs are located in gene promoters (12% of all TE-DMRs) and are significantly enriched in genes associated with metabolic pathways (Fig. <xref rid="Fig2" ref-type="fig">2d</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">8f</xref>). While there is only a 1.1-fold enrichment of DMRs globally across all TEs (Fig. <xref rid="Fig2" ref-type="fig">2b</xref>), some TE families are particularly enriched for DMRs, most notably the DNA transposons hAT (hAT6, 10.5-fold), LINE/l (&gt;3.7-fold) and the retrotransposons SINE/Alu (&gt;3.5-fold). On the other hand, the degree of methylation in a number of other TE families shows unexpected conservation among species, with substantial DMR depletion (e.g., LINE/R2-Hero, DNA/Maverick; Fig. <xref rid="Fig2" ref-type="fig">2e</xref>). Overall, we observe a pattern whereby between-species methylome differences are significantly localised in younger transposon sequences (Dunn’s test, <italic>p</italic> = 2.2 × 10<sup>−16</sup>; Fig. <xref rid="Fig2" ref-type="fig">2f</xref>). Differential methylation in TE sequences may affect their transcription and transposition activities, possibly altering or establishing new transcriptional activity networks via <italic>cis</italic>-regulatory functions<sup><xref ref-type="bibr" rid="CR45">45</xref>–<xref ref-type="bibr" rid="CR47">47</xref></sup>. Indeed, the movement of transposable elements has recently been shown to contribute to phenotypic diversification in Lake Malawi cichlids<sup><xref ref-type="bibr" rid="CR48">48</xref></sup>.</p><p id="Par15">In contrast to the between-species liver DMRs, within-species DMRs based on comparison of liver against muscle methylomes show much less variation in enrichment across genomic features. Only gene bodies show weak enrichment for methylome variation (Fig. <xref rid="Fig2" ref-type="fig">2b</xref>). Moreover, both CGI classes, as well as repetitive and intergenic regions show considerable tissue-DMR depletion, suggesting a smaller DNA methylation-related contribution of these elements to tissue differentiation (Fig. <xref rid="Fig2" ref-type="fig">2b</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">8e</xref>).</p></sec><sec id="Sec5"><title>Methylome divergence is associated with transcriptional changes in the livers</title><p id="Par16">We hypothesised that adaptation to different diets in Lake Malawi cichlids could be associated with distinct hepatic functions, manifesting as differences in transcriptional patterns which, in turn, could be influenced by divergent methylation patterns. To investigate this, we first performed differential gene expression analysis. In total, 3,437 genes were found to be differentially expressed between livers of the four Lake Malawi cichlid species investigated (RL, DL, MZ, and PG; Wald test, false discovery rate adjusted two sided <italic>p</italic>-value using Benjamini−Hochberg [FDR] &lt; 0.01; Fig. <xref rid="Fig3" ref-type="fig">3a</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">9a−c</xref>; see “Methods”). As with methylome variation, transcriptome variation clustered individuals by species (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">9d</xref>), consistent with species-specific functional liver transcriptome activity.<fig id="Fig3"><label>Fig. 3</label><caption xml:lang="en"><title>Methylome divergence is associated with differential transcriptional activity in Lake Malawi cichlids.</title><p><bold>a</bold> Heatmap and unsupervised hierarchical clustering of gene expression values (<italic>Z</italic>-score) of all differentially expressed genes (DEGs) found among livers of four Lake Malawi cichlid species (Wald tests corrected for multiple testing using false discovery rate FDR &lt; 1%). GO enrichment analysis for three DEG clusters are shown in Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">9c</xref>. <bold>b</bold> Significant overlap between DEG and differentially expressed regions (DMRs; <italic>p</italic> &lt; 0.05) linked to a gene (exact hypergeometric test, <italic>p</italic> = 4.71 × 10<sup>−5</sup>), highlighting putative functional DMRs (pfDMRs). <bold>c</bold> Bar plot showing the percentage of pfDMRs localised in either promoters, intergenic regions (0.5−4kbp away from genes), or in gene bodies, with the proportion of TE content for each group. <bold>d</bold> Heatmap representing significant GO terms for DEGs associated with pfDMRs for each genomic feature. GO categories: BP, Biological Process; MF, Molecular Function. Only GO terms with Benjamini−Hochberg FDR-corrected <italic>p</italic>-values &lt; 0.05 are shown. Examples of pfDMRs significantly associated with species-specific liver transcriptional changes for the genes thiosulfate:glutathione sulfurtransferase <italic>tstd1</italic>-like (LOC101468457; <italic>q</italic> = 6.82 × 10<sup>−16</sup>) (<bold>e</bold>), carbonyl reductase [NADPH]-1 <italic>cbr1</italic>-like (LOC101465189; MZ vs DL, <italic>q</italic> = 0.002; MZ vs RL, <italic>q</italic> = 1.18 × 10<sup>−7</sup>) (<bold>f</bold>) and perforin-1 <italic>prf1</italic>-like (LOC101465185; MZ vs DL, <italic>q</italic> = 3.68 × 10<sup>−</sup><sup>19</sup>; MZ vs RL, <italic>q</italic> = 0.00034) (<bold>g</bold>). Liver and muscle methylome profiles in green and purple, respectively (averaged mCG/CG levels [%] in 50 bp bins; <italic>n</italic> = 3 biological replicates for liver DL, PG, and MZ; <italic>n</italic> = 2 biological replicates for liver RL, AS, and AC, and muscle DL, RL, and PG). <bold>h</bold>−<bold>j</bold> Boxplots showing gene expression values (transcript per million) for the genes in (<bold>e</bold>−<bold>g</bold>). in livers (green) and muscle (pink). <italic>n</italic> = 3 biological replicates for liver DL, MZ, PG; <italic>n</italic> = 2 biological replicates for liver RL and muscle DL, MZ, PG, and RL. Two-sided <italic>q</italic> values for Wald tests corrected for multiple testing (Benjamini−Hochberg FDR) are shown in graphs. Box plots indicate median (middle line), 25th, 75th percentile (box), and 5th and 95th percentile (whiskers) as well as outliers (single points). CGI, CpG islands; Repeats, transposons and repetitive regions.</p></caption><p><graphic specific-use="HTML" mime-subtype="PNG" xlink:href="MediaObjects/41467_2021_26166_Fig3_HTML.png"/></p></fig></p><p id="Par17">Next, we checked for the association between liver DMRs and transcriptional changes. Of the 6,797 among-species DMRs that could be assigned to a specific gene (i.e., DMRs within promoters, gene bodies or located 0.5−4 kbp away from a gene; see “Methods”), 871 were associated with differentially expressed genes, which is greater than expected by chance (Fig. <xref rid="Fig3" ref-type="fig">3b</xref>; <italic>p</italic> &lt; 4.7 × 10<sup>−5</sup>), suggesting that DMRs are significantly associated with liver gene expression. Of these 871 putative functional DMRs (pfDMRs), the majority (42.8%) are localised over gene bodies, hinting at possible intronic <italic>cis</italic>-regulatory elements or alternative splicing<sup><xref ref-type="bibr" rid="CR49">49</xref></sup>. The remaining pfDMRs are in intergenic (30.2%) or promoters (27%) (Fig. <xref rid="Fig3" ref-type="fig">3c</xref>). The majority of pfDMRs contain younger TE sequences, in particular in intronic regions, while only few contain CGIs (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">10a−c</xref>). In promoters and intergenic regions, ≥63% of pfDMR sequences contain TEs (Fig. <xref rid="Fig3" ref-type="fig">3c</xref>). As methylation levels at <italic>cis</italic>-regulatory regions may be associated with altered transcription factor (TF) activity<sup><xref ref-type="bibr" rid="CR22">22</xref>,<xref ref-type="bibr" rid="CR24">24</xref>,<xref ref-type="bibr" rid="CR25">25</xref></sup>, we performed TF binding motif enrichment analysis using between-species liver DMRs and found significant enrichment for specific TF recognition binding motifs. Several TF genes known to recognise some of the enriched binding motifs are differentially expressed among the livers of the three cichlid species and have liver-associated functions (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">10d, e</xref>). For example, the gene of the transcription factor hepatocyte nuclear factor 4 alpha (hnf4a), with important functions in lipid homeostasis regulation and in liver-specific gene expression<sup><xref ref-type="bibr" rid="CR50">50</xref></sup>, is &gt;2.5x-fold downregulated (<italic>q</italic> ≤ 9 × 10<sup>−</sup><sup>5</sup>) in the rock-dwelling algae-eater <italic>P. genalutea</italic> compared to the pelagic piscivores <italic>D. limnothrissa</italic> and <italic>R. longiceps</italic>, possibly in line with adaptation to different diets (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">10e</xref>).</p><p id="Par18">Furthermore, genomic regions containing pfDMRs are also significantly associated in the livers with altered transcription of many other genes involved in hepatic and metabolic oxidation-reduction processes (Fig. <xref rid="Fig3" ref-type="fig">3d</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">10f</xref>). These include genes encoding haem-containing cytochrome P450 enzymes (such as cyp3a4, cy7b1; Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">10f</xref>), which are important metabolic factors in steroid and fatty acid metabolism, as well as genes encoding other hepatic enzymes involved in energy balance processes. This enrichment is associated with significant methylome divergence among species, in particular in promoter regions and gene bodies (Fig. <xref rid="Fig3" ref-type="fig">3d</xref>). For example, the gene sulfurtransferase <italic>tstd1</italic>-like, an enzyme involved in energy balance and the mitochondrial metabolism, is expressed exclusively in the liver of the deep-water pelagic species <italic>D. limnothrissa,</italic> where it shows ~80% reduced methylation levels in a gene-body DMR compared to all the other species (Fig. <xref rid="Fig3" ref-type="fig">3e, h</xref>). Another example is the promoter of the enzyme carbonyl reductase [NADPH] 1 (<italic>cbr1</italic>) which shows significant hypomethylation (2.2kbp-long DMR) in the algae-eaters MZ and PG, associated with up to ~60-fold increased gene expression in their livers compared to the predatory <italic>Rhamphochromis</italic> and <italic>Diplotaxodon</italic> (Fig. <xref rid="Fig3" ref-type="fig">3f, i</xref>). Interestingly, <italic>cbr1</italic> is involved in the metabolism of various fatty acids in the liver and has been associated with fatty acid-mediated cellular signalling in response to environmental perturbation<sup><xref ref-type="bibr" rid="CR51">51</xref></sup>. As a final example, we highlight the cytotoxic effector perforin 1-like (<italic>prf1-</italic>like), an important player in liver-mediated energy balance and immune functions<sup><xref ref-type="bibr" rid="CR52">52</xref></sup>. Its promoter is hypermethylated (&gt;88% mCG/CG) exclusively in the liver of the deep-water species DL, while having low methylation levels (~25%) in the four other species (Fig. <xref rid="Fig3" ref-type="fig">3g</xref>). This gene is not expressed in DL livers but is highly expressed in the livers of the other species that all show low methylation levels at their promoters (Fig. <xref rid="Fig3" ref-type="fig">3j</xref>). Taken together, these results suggest that species-specific methylome divergence is associated with transcriptional remodelling of ecologically-relevant genes, which might facilitate phenotypic diversification associated with adaption to different diets.</p></sec><sec id="Sec6"><title>Multi-tissue methylome divergence is enriched in genes related to early development</title><p id="Par19">We further hypothesised that between-species DMRs that are found in both the liver and muscle methylomes could relate to functions associated with early development/embryogenesis. Given that liver is endoderm-derived and muscle mesoderm-derived, such shared multi-tissue DMRs could be involved in processes that find their origins prior to or early in gastrulation. Such DMRs could also have been established early on during embryogenesis and may have core cellular functions. Therefore, we focussed on the three species for which methylome data were available for both tissues (Fig. <xref rid="Fig1" ref-type="fig">1c</xref>) to explore the overlap between muscle and liver DMRs (Fig. <xref rid="Fig4" ref-type="fig">4a</xref>). Based on pairwise species comparisons (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">11a, b</xref>), we identified methylome patterns unique to one of the three species. We found that 40−48% of these were found in both tissues (‘multi-tissue’ DMRs), while 39−43% were liver-specific and only 13−18% were muscle-specific (Fig. <xref rid="Fig4" ref-type="fig">4b</xref>).<fig id="Fig4"><label>Fig. 4</label><caption xml:lang="en"><title>Multi-tissue methylome divergence in Lake Malawi cichlids is associated with early development/embryogenesis.</title><p><bold>a</bold> Distinct species-specific methylome patterns in Lake Malawi cichlids can be found in liver or muscle tissues, or in both tissues (‘multi-tissue’). <bold>b</bold> Histograms showing the total counts of ‘species’ DMRs that are either liver-, muscle-specific or present in both (multi). Only ‘species’ DMRs showing distinct DNA methylation patterns in one species are shown. <bold>c</bold> GO enrichment plots for each DMR class. Only GO terms with Benjamini−Hochberg FDR-corrected <italic>p</italic>-values &lt; 0.05 are shown. <bold>d</bold>−<bold>f</bold> Examples of ‘species’ multi-tissue DMRs in genes related to embryonic and developmental processes. Namely, in the genes coding for visual system homeobox 2 <italic>vsx2</italic> (LOC101486458), growth-associated protein 43 <italic>gap43</italic> (LOC101472990) and teneurin transmembrane protein 2 <italic>tenm2</italic> (LOC101470261). Liver and muscle methylome profiles shown in green and purple, respectively (averaged mCG/CG levels [%] in 50 bp bins for ≥2 samples per tissue per species; scale indicated below each graph).</p></caption><p><graphic specific-use="HTML" mime-subtype="PNG" xlink:href="MediaObjects/41467_2021_26166_Fig4_HTML.png"/></p></fig></p><p id="Par20">The relatively high proportion of multi-tissue DMRs suggests there may be extensive among-species divergence in core cellular or metabolic pathways. To investigate this further, we performed GO enrichment analysis. As expected, liver-specific DMRs are particularly enriched for hepatic metabolic functions, while muscle-specific DMRs are significantly associated with muscle-related functions, such as glycogen catabolic pathways (Fig. <xref rid="Fig4" ref-type="fig">4c</xref>). Multi-tissue DMRs, however, are significantly enriched for genes involved in development and embryonic processes, in particular related to cell differentiation and brain development (Fig. <xref rid="Fig4" ref-type="fig">4c–f</xref>), and show different properties from tissue-specific DMRs. Indeed, in all the three species, multi-tissue DMRs are three times longer on average (median length of multi-tissue DMRs: 726 bp; Dunn’s test, <italic>p</italic> &lt; 0.0001; Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">11c</xref>), are significantly enriched for TE sequences (Dunn’s test, <italic>p </italic> ≤ 0.03; Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">11d</xref>) and are more often localised in promoter regions (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">11e</xref>) compared to liver and muscle DMRs. Furthermore, multi-tissue species-specific methylome patterns show significant enrichment for specific TF binding motif sequences. These binding motifs are bound by TFs with functions related to embryogenesis and development, such as the transcription factors Forkhead box protein K1 (foxk1) and Forkhead box protein A2 (foxa2), with important roles during liver development<sup><xref ref-type="bibr" rid="CR53">53</xref></sup> (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">11f</xref>), possibly facilitating core phenotypic divergence early on during development.</p><p id="Par21">Several examples of multi-tissue DMRs are worth highlighting as generating hypotheses for potential future functional studies (Fig. <xref rid="Fig4" ref-type="fig">4d–f</xref>). The visual system homeobox 2 (<italic>vsx2</italic>) gene in the offshore deep-water species <italic>Diplotaxodon limnothrissa</italic> is almost devoid of methylation in both liver and muscle, in contrast to the other species (1.9 kbp-long DMR; Fig. <xref rid="Fig4" ref-type="fig">4d</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">11g</xref>). <italic>vsx2</italic> has been reported to play an essential role in the development of the eye and retina in zebrafish with embryonic and postnatal active transcription localised in bipolar cells and retinal progenitor cells<sup><xref ref-type="bibr" rid="CR54">54</xref></sup>. <italic>D. limnothrissa</italic> populates the deepest parts of the lake of all cichlid species (down to approximately 250 m, close to the limits of oxygenation) and features morphological adaptations to dimly-lit environments, such as larger eye size<sup><xref ref-type="bibr" rid="CR55">55</xref></sup>. <italic>vsx2</italic> may therefore participate in the visual adaptation of <italic>Diplotaxodon</italic> to the dimmer parts of the lake via DNA methylation-mediated gene regulation during development. Another example of a multi-tissue DMR specific to <italic>D. limnothrissa</italic> is located in the promoter of the gene coding for the growth-associated protein 43 (<italic>gap43</italic>) involved in neural development and plasticity, and also neuronal axon regeneration<sup><xref ref-type="bibr" rid="CR56">56</xref></sup>. The promoter of <italic>gap43</italic> is largely devoid of methylation (overall &lt;5% average mCG/CG levels over this 5.2 kbp-long DMR) in both muscle and liver tissues of <italic>D. limnothrissa</italic>, while being highly methylated (&gt;86% mCG/CG) in the other species (Fig. <xref rid="Fig4" ref-type="fig">4e</xref>). In <italic>A. calliptera</italic>, the transcription of <italic>gap43</italic> is restricted to the brain and embryo (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">11h</xref>), consistent with a role in neural development and in the adult brain. Finally, another multi-tissue DMR potentially involved in neural embryonic functions is located in the promoter region of the gene <italic>tenm2</italic>, coding for teneurin transmembrane protein (Fig. <xref rid="Fig4" ref-type="fig">4f</xref>). <italic>tenm2</italic> is a gene expressed early on during zebrafish embryogenesis as well as in cichlid brain and embryo (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">11i</xref>) and is involved in neurodevelopment and neuron migration-related cell signalling<sup><xref ref-type="bibr" rid="CR57">57</xref></sup>. This 2.7 kbp-long DMR is completely unmethylated in the algae-eating rock-dweller <italic>Petrotilapia genalutea</italic> (almost 80% reduction in methylation levels overall compared to the other species) and may mediate species-specific adaptive phenotypic plasticity related to synapse formation and neuronal networks.</p></sec></sec><sec id="Sec7" sec-type="discussion"><title>Discussion</title><p id="Par22">The molecular mechanisms underlying adaptive phenotypic diversification are subject of intense interest<sup><xref ref-type="bibr" rid="CR34">34</xref>,<xref ref-type="bibr" rid="CR36">36</xref>,<xref ref-type="bibr" rid="CR38">38</xref>,<xref ref-type="bibr" rid="CR58">58</xref>,<xref ref-type="bibr" rid="CR59">59</xref></sup> and the extent of the role of epigenetic processes is hotly debated<sup><xref ref-type="bibr" rid="CR2">2</xref>,<xref ref-type="bibr" rid="CR4">4</xref>,<xref ref-type="bibr" rid="CR60">60</xref></sup>. However, in-depth molecular epigenetic studies remain rare in evolutionary genomics and its key model systems<sup><xref ref-type="bibr" rid="CR2">2</xref>,<xref ref-type="bibr" rid="CR4">4</xref>,<xref ref-type="bibr" rid="CR29">29</xref>,<xref ref-type="bibr" rid="CR60">60</xref></sup>. Here, we focussed on the genetically closely related haplochromine cichlids of Lake Malawi, representing a unique system to investigate the epigenetic basis for phenotypic diversification<sup><xref ref-type="bibr" rid="CR36">36</xref>,<xref ref-type="bibr" rid="CR39">39</xref>,<xref ref-type="bibr" rid="CR61">61</xref></sup>. Specifically, we describe genome-wide methylome variation at a single CG dinucleotide resolution as well as transcriptomes of two adult tissues of different embryonic origins in eco-morphologically divergent species (Fig. <xref rid="Fig1" ref-type="fig">1b</xref>). This work investigates epigenetic marks in the context of rapid diversification in natural populations of cichlid fishes and provides evidence of substantial methylome divergence associated with ecologically-relevant genes and correlated with changes in the transcriptional network and in TF activity. Given the resemblances we found between cichlid methylomes and those of warm-blooded vertebrates (Fig. <xref rid="Fig1" ref-type="fig">1d, e</xref>), suggesting evolutionarily conserved functions, our findings are likely to be relevant to other vertebrate evolutionary model systems.</p><p id="Par23">Recent large-scale epigenetic studies in natural populations of <italic>Arabidopsis</italic> have highlighted a functional link between local environments and methylation divergence, with possible adaptive phenotypic functions<sup><xref ref-type="bibr" rid="CR11">11</xref>,<xref ref-type="bibr" rid="CR13">13</xref></sup>. Yet, epigenetic variation in natural populations of vertebrates and its possible functions in the context of adaptive phenotypic diversification have scarcely been studied. Our finding of considerable among-species methylome divergence at conserved underlying DNA sequences, despite overall low among-species genome differentiation, is suggestive of a functional link between DNA methylation and local environments, which may facilitate phenotypic plasticity and diversification. The methylome divergence we found may be driven directly by environmental differences but is also likely to have a genetic component. Our study lays the groundwork for deciphering any genetically encoded component underlying the epigenetic differences. Genetic differences in TF binding domains or in TF sequence recognition motifs, as well as in the proteins involved in the maintenance and deposition of new methyl groups, could for example lead to epigenetic divergence<sup><xref ref-type="bibr" rid="CR11">11</xref>,<xref ref-type="bibr" rid="CR24">24</xref></sup>. While this study provides evidence for species-specific methylome divergence associated with transcriptional changes of ecologically-relevant genes, further experimental work is required to examine the extent to which such species-specific patterns have an adaptive function in a natural context, as well as to determine the degree of plasticity and inheritance of such epigenetic patterns. Recent studies in three-spined stickleback fish have provided initial evidence for stable transmission of methylome patterns across generations associated with adaptation to salinity, some of which are inherited in a genetic-independent manner<sup><xref ref-type="bibr" rid="CR62">62</xref>,<xref ref-type="bibr" rid="CR63">63</xref></sup>. Moreover, epigenetic inheritance and reprogramming greatly vary among teleost fishes. Indeed, recent studies have highlighted important differences in the mechanisms of DNA methylation reprogramming during embryogenesis in teleost fishes. While the genome of the embryo in zebrafish retains the sperm methylome configuration with no global DNA methylation resetting, possibly allowing for the transgenerational inheritance of specific epigenetic states, extensive and global DNA methylation reprogramming instead occurs upon fertilisation in medaka embryos (similar to mammals)<sup><xref ref-type="bibr" rid="CR30">30</xref>,<xref ref-type="bibr" rid="CR64">64</xref>–<xref ref-type="bibr" rid="CR66">66</xref></sup>. Such DNA methylome reprogramming processes are currently unknown in cichlids, which warrants further research.</p><p id="Par24">We found that regions of methylome divergence between species (DMRs) were enriched in promoters and orphan CGIs (Fig. <xref rid="Fig2" ref-type="fig">2b</xref>). Methylation variation in promoter regions is known to have important <italic>cis</italic>-regulatory functions in vertebrates, in particular during development<sup><xref ref-type="bibr" rid="CR20">20</xref>,<xref ref-type="bibr" rid="CR21">21</xref>,<xref ref-type="bibr" rid="CR24">24</xref>,<xref ref-type="bibr" rid="CR29">29</xref>,<xref ref-type="bibr" rid="CR31">31</xref></sup>. Such <italic>cis</italic>-regulatory activity is also apparent in Lake Malawi cichlids, with methylation at promoters negatively correlated with transcriptional activity (Fig. <xref rid="Fig1" ref-type="fig">1e</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">7a−d</xref>). This is likely mediated by the tight interaction of DNA methylation with 5mC-sensitive DNA-binding proteins, such as many transcription factors<sup><xref ref-type="bibr" rid="CR22">22</xref></sup> (see below). On the other hand, the functional roles of orphan CGIs are less well understood<sup><xref ref-type="bibr" rid="CR42">42</xref></sup>. However, orphan CGIs have by far the highest enrichment for species methylome divergence (&gt;3-fold over chance; Fig. <xref rid="Fig2" ref-type="fig">2b</xref>)—most of which are located in unannotated genomic regions. Orphan CGIs, as well as intergenic TEs (Fig. <xref rid="Fig2" ref-type="fig">2d</xref>), might include ectopic promoters, enhancers and other distal regulatory elements<sup><xref ref-type="bibr" rid="CR41">41</xref>,<xref ref-type="bibr" rid="CR42">42</xref></sup> that may participate in phenotypic diversification by reshaping transcriptional network. Such putative <italic>cis</italic>-regulatory regions could be validated against a full functional annotation of the genome of Lake Malawi cichlid, which is currently lacking.</p><p id="Par25">We identified that in some species methylome divergence was significantly associated with differential liver transcriptome activity, especially pertaining to hepatic functions involved in steroid hormone and fatty acid metabolism (Fig. <xref rid="Fig3" ref-type="fig">3b, d−j</xref>). Consistent with a functional role of DNA methylation in <italic>cis</italic>-regulatory regions<sup><xref ref-type="bibr" rid="CR21">21</xref>,<xref ref-type="bibr" rid="CR44">44</xref></sup>, we revealed significant methylation divergence in the promoters of differentially transcribed genes involved in liver-mediated energy expenditure processes and metabolism, such as gene <italic>prf1</italic>-like (&gt;60-fold increase in expression; Fig. <xref rid="Fig3" ref-type="fig">3g, j</xref>), associated with obesity in mouse<sup><xref ref-type="bibr" rid="CR44">44</xref></sup>. Such a functional link may promote phenotypic diversification via adaptation to different diets. Our understanding of this would benefit from the knowledge of the extent to which environmental or diet perturbation might result in adaptation-associated functional methylome changes. Further work would also be required to assess the extent to which such changes may be stably inherited. Additionally, the characterisation of the methylomes of Lake Malawi cichlid species from different ecomorphological groups but sharing the same habitat/diet, would inform on the specificity and possible functions of methylome divergence at metabolic genes.</p><p id="Par26">We observed that methylome divergence associated with altered transcription in livers is enriched for binding motifs recognised by specific TFs. Some of those TFs are also differentially expressed in the livers and have important roles in lipid and energy homeostasis (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">10d, e</xref>). This suggests that altered activity of some TFs in livers can be associated with species-specific methylome patterns. Methylome variation in <italic>cis</italic>-regulatory regions is known to affect the binding affinity of methyl-sensitive DNA-binding regulatory factors (such as TFs)<sup><xref ref-type="bibr" rid="CR25">25</xref>,<xref ref-type="bibr" rid="CR44">44</xref>,<xref ref-type="bibr" rid="CR67">67</xref>,<xref ref-type="bibr" rid="CR68">68</xref></sup>. Furthermore, methylation-associated changes in chromatin accessibility may also impede the binding affinity of such factors and could be associated with altered TF activity and changes in transcription<sup><xref ref-type="bibr" rid="CR20">20</xref>,<xref ref-type="bibr" rid="CR67">67</xref></sup>. Alternatively, altered TF activity, arising from species-specific mutations within TF binding sequence motifs or in TF binding domains, has also been reported to generate methylome divergence in <italic>cis</italic> and <italic>trans</italic><sup><xref ref-type="bibr" rid="CR24">24</xref></sup>, and could also underlie species-specific epigenetic divergence. Our results suggest a tight link between TF activity and methylome divergence, that could participate in reshaping the transcriptional network of the livers in Lake Malawi cichlids.</p><p id="Par27">TE and repetitive sequences present on average higher methylation levels than the genome-wide average (Fig. <xref rid="Fig1" ref-type="fig">1d</xref>), although some specific TE classes show more variable and lower levels (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">6d, e</xref>). DNA methylation-mediated transcriptional repression of mostly deleterious TE elements is crucial to the integrity of most eukaryote genomes, from plants to fish and mammals, and can be mediated in both animals and plants by small non-coding RNAs, such as piwi-interacting RNAs (piRNAs) in zebrafish and mammals<sup><xref ref-type="bibr" rid="CR18">18</xref>,<xref ref-type="bibr" rid="CR19">19</xref>,<xref ref-type="bibr" rid="CR69">69</xref></sup>. Notably, the majority (~60%) of species differences in methylation patterns associated with transcriptional changes in liver was significantly localised in evolutionary young transposon/repeat regions, notably in intergenic retroposons in the vicinity of genes and in intronic DNA transposons (Dunn’s test <italic>p</italic> &lt; 10<sup>−10</sup>; Fig. <xref rid="Fig3" ref-type="fig">3c</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">10b</xref>). Even though most of TE activity is under tight cellular control to ensure genome stability, transposition events have also been associated with genome evolution and phenotypic diversification. Indeed, TE insertion may represent a source of functional genomic variation and novel <italic>cis</italic>-regulatory elements, underlying altered transcriptional network<sup><xref ref-type="bibr" rid="CR45">45</xref>,<xref ref-type="bibr" rid="CR47">47</xref>,<xref ref-type="bibr" rid="CR48">48</xref>,<xref ref-type="bibr" rid="CR70">70</xref></sup>. In haplochromine cichlids, variation in anal fin egg-spots patterns associated with courtship behaviour, has been linked to a novel <italic>cis</italic>-regulatory element, derived from TE sequences<sup><xref ref-type="bibr" rid="CR46">46</xref></sup>. Additionally, Brawand and colleagues have revealed that most TE insertions near genes in East African cichlids were associated with altered gene expression patterns<sup><xref ref-type="bibr" rid="CR38">38</xref></sup>. Moreover, genes in piRNA-related pathways have been reported to be under positive selection in Lake Malawi cichlid flock, in line with a fast evolving TE sequence landscape observed in cichlids<sup><xref ref-type="bibr" rid="CR36">36</xref></sup>, and these genes may also be associated with TE-related methylome variation, similar to <italic>Arabidopsis</italic><sup><xref ref-type="bibr" rid="CR11">11</xref>,<xref ref-type="bibr" rid="CR71">71</xref></sup>.</p><p id="Par28">Not only can novel TE insertions participate in genome evolution, DNA methylation at TE-derived <italic>cis</italic>-regulatory elements has been shown to affect transcriptional activity of nearby genes<sup><xref ref-type="bibr" rid="CR12">12</xref>,<xref ref-type="bibr" rid="CR45">45</xref></sup>. In rodents, the insertion of one IAP (intra-cisternal A particle) retrotransposon in the upstream <italic>cis</italic>-regulatory region of the agouti gene is associated with considerable phenotypic variation of coat colours and metabolic changes. Differential methylation levels at this TE-derived ectopic promoter directly impacts the activity of the agouti gene<sup><xref ref-type="bibr" rid="CR5">5</xref>,<xref ref-type="bibr" rid="CR28">28</xref></sup>, and such epigenetic patterns of methylation are transmitted to the offspring along with the altered phenotypes in a non-genetic manner<sup><xref ref-type="bibr" rid="CR2">2</xref></sup>. Similarly, in toadflax, the flower symmetry is associated with the variable and heritable methylation patterns in the TE-derived promoter of the <italic>Lcyc</italic> gene, resulting in symmetrical or asymmetrical flowers<sup><xref ref-type="bibr" rid="CR6">6</xref></sup>. Also, in a population-scale study of more than a thousand natural <italic>Arabidopsis</italic> accessions, epigenetic variation was found to be associated with phenotypes, mostly arising from methylation-mediated TE silencing that was significantly associated with altered transcription of adaptive genes such as those determining flowering time<sup><xref ref-type="bibr" rid="CR11">11</xref>,<xref ref-type="bibr" rid="CR71">71</xref></sup>. Our work adds to this by providing further evidence that interactions between TE sequences and between-species methylome divergence might have led to altered transcriptional networks. This lays the groundwork for further investigation of this issue in cichlid fishes.</p><p id="Par29">Finally, we revealed that between-species methylome differences in liver tissues were greater than differences between muscle tissues (Fig. <xref rid="Fig4" ref-type="fig">4b</xref>), possibly highlighting a higher dependence of hepatic functions on natural epigenetic divergence. This indicates that a significant portion of the between-species methylome divergence in the liver may be associated with phenotypic divergence, in particular by affecting genes involved in tissue-specific functions, such as hepatic metabolic processes (Fig. <xref rid="Fig3" ref-type="fig">3c, e–j</xref>). However, almost half of the methylome divergence we observed that was driven by a single species was consistently found in both liver and muscle (Fig. <xref rid="Fig4" ref-type="fig">4b</xref>). This multi-tissue methylome divergence is consistent with epigenetic influences on core cellular functions and may also be relevant to early-life biological processes such as development, cellular differentiation, and embryogenesis (Fig. <xref rid="Fig4" ref-type="fig">4c, d–f</xref>). For example, we identified a large hypomethylated region in the visual homeobox gene <italic>vsx2</italic> in both liver and muscle tissues in the deep-water <italic>Diplotaxodon</italic> (Fig. <xref rid="Fig4" ref-type="fig">4d</xref>). This gene is involved in eye differentiation and may participate in long-lasting visual phenotypic divergences required to populate dimly parts of the lake, similar to the DNA methylation-mediated adaptive eye degeneration in cavefish<sup><xref ref-type="bibr" rid="CR29">29</xref></sup>. Notably, recent studies have highlighted signatures of positive selection and functional substitutions in genes related to visual traits in <italic>D. limnothrissa</italic><sup><xref ref-type="bibr" rid="CR36">36</xref>,<xref ref-type="bibr" rid="CR55">55</xref></sup>. Furthermore, in regions showing multi-tissue species-specific methylome divergence, we identified significant enrichment for binding motifs of specific TFs whose functions are related to embryogenesis and liver development (such as foxa2 and foxk1). This suggests that altered TF activity during development could be associated with species-specific methylome patterns (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">11f</xref>). If multi-tissue methylome divergence has been established very early during differentiation, and has important regulatory functions pertaining to early developmental stages<sup><xref ref-type="bibr" rid="CR26">26</xref></sup> and possibly core cellular functions, then it may promote long-lasting phenotypic divergence unique to each species’ adaptions. Our observations suggest that further characterisation of the methylomes and transcriptomes of different cells of the developing embryo may be valuable to investigate when between-species methylome divergence is established, as well as any functional roles in early-life phenotypic diversification.</p><p id="Par30">To conclude, recent large-scale genomic studies have highlighted that several mechanisms may participate in the phenotypic diversification of Lake Malawi haplochromine cichlids, such as hybridisation and incomplete lineage sorting<sup><xref ref-type="bibr" rid="CR34">34</xref>,<xref ref-type="bibr" rid="CR36">36</xref>,<xref ref-type="bibr" rid="CR61">61</xref>,<xref ref-type="bibr" rid="CR72">72</xref></sup>. Our study adds to these observations by providing initial evidence of substantial methylome divergence associated with altered transcriptome activity of ecologically-relevant genes among closely related Lake Malawi cichlid fish species. This raises the possibility that variation in methylation patterns could facilitate phenotypic divergence in these rapidly evolving species through different mechanisms (such as altered TF binding affinity, gene expression, and TE activity, all possibly associated with methylome divergence at <italic>cis</italic>-regulatory regions). Further work is required to elucidate the extent to which this might result from plastic responses to the environment and the degree of inheritance of such patterns, as well the adaptive role and any genetic basis associated with epigenetic divergence. This study represents an epigenomic study investigating natural methylome variation in the context of phenotypic diversification in genetically similar but ecomorphologically divergent cichlid species part of a massive vertebrate radiation and provides an important resource for further experimental work.</p></sec><sec id="Sec8" sec-type="methods"><title>Methods</title><sec id="Sec9"><title>Sampling overview</title><p id="Par31">All cichlid specimens were bought dead from local fishermen by G.F. Turner, M. Malinsky, H. Svardal, A.M. Tyers, M. Mulumpwa, and M. Du in 2016 in Malawi in collaboration with the Fisheries Research Unit of the Government of Malawi), or in 2015 in Tanzania in collaboration with the Tanzania Fisheries Research Institute (various collaborative projects). Sampling collection and shipping were approved by permits issued to G.F. Turner, M.J. Genner R. Durbin, E.A. Miska by the Fisheries Research Unit of the Government of Malawi and the Tanzania Fisheries Research Institute, and were approved and in accordance with the ethical regulations of the Wellcome Sanger Institute, the University of Cambridge and the University of Bangor (UK). Upon collection, tissues were immediately placed in RNA<italic>later</italic> (Sigma) and were then stored at −80 °C upon return. Information about the collection type, species IDs, and the GPS coordinates for each sample in Supplementary Data <xref ref-type="supplementary-material" rid="MOESM4">1</xref>.</p></sec><sec id="Sec10"><title>SNP-corrected genomes</title><p id="Par32">Because real C &gt; T (or G &gt; A on the reverse strand) mutations are indistinguishable from C &gt; T SNPs generated by the bisulfite treatment, they can add some bias to comparative methylome analyses. To account for this, we used SNP data from Malinsky et al. (2018) (ref. <sup><xref ref-type="bibr" rid="CR36">36</xref></sup>) and, using the <italic>Maylandia zebra</italic> UMD2a reference genome (NCBI_Assembly: GCF_000238955.4) as the template, we substituted C &gt; T (or G &gt; A) SNPs for each of the six species analysed before re-mapping the bisulfite reads onto these ‘updated’ reference genomes.</p><p id="Par33">To translate SNP coordinates from Malinsky et al. (2018) to the UMD2a assembly, we used the UCSC liftOver tool (version 418), based on a whole genome alignment between the original Brawand et al., 2014 (ref. <sup><xref ref-type="bibr" rid="CR38">38</xref></sup>) (<ext-link xlink:href="https://www.ncbi.nlm.nih.gov/assembly/GCF_000238955.1/" ext-link-type="url">https://www.ncbi.nlm.nih.gov/assembly/GCF_000238955.1/</ext-link>) and the UMD2a <italic>M. zebra</italic> genome assemblies. The pairwise whole genome alignment was generated using lastz v1.02<sup><xref ref-type="bibr" rid="CR73">73</xref></sup>, with the following parameters: “B = 2 C = 0 E = 150 H = 0 K = 4500 L = 3000 M = 254 O = 600 Q = human_chimp.v2.q <italic>T</italic> = 2 <italic>Y</italic> = 15000”. This was followed by using USCS genome utilities (<ext-link xlink:href="https://genome.ucsc.edu/util.html" ext-link-type="url">https://genome.ucsc.edu/util.html</ext-link>) axtChain (kent source version 418) tool with -minScore=5000. Additional tools with default parameters were then used following the UCSC whole-genome alignment paradigm (<ext-link xlink:href="http://genomewiki.ucsc.edu/index.php/Whole_genome_alignment_howto" ext-link-type="url">http://genomewiki.ucsc.edu/index.php/Whole_genome_alignment_howto</ext-link>) in order to obtain a contiguous pairwise alignment and the ‘chain’ file input for liftOver (kent source version 418).</p><p id="Par34">The ‘lifted over’ C &gt; T (or G &gt; A) SNPs were then substituted into the UMD2a genome using the evo getWGSeq command with the–whole-genome and–methylome options. The code used is available as a part of the Evo package (<ext-link xlink:href="https://github.com/millanek/evo" ext-link-type="url">https://github.com/millanek/evo</ext-link>; v.0.1 r24, commit99d5b22).</p></sec><sec id="Sec11"><title>Extraction of high-molecular-weight genomic DNA (HMW-gDNA)</title><p id="Par35">The main method to generate WGBS data is summarised in Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">1</xref>. In detail, high-molecular-weight genomic DNA (HMW-gDNA) was extracted from homogenised liver and muscle tissues (&lt;25 mg) using QIAamp DNA Mini Kit (Qiagen 51304) according to the manufacturer’s instructions. Before sonication, unmethylated lambda DNA (Promega, D1521) was spiked in (0.5% w/w) to assess bisulfite conversion efficiency. HMW-gDNA was then fragmented to the target size of ~400 bp (Covaris, S2, and E220). Fragments were then purified with PureLink PCR Purification kit (ThermoFisher). Before any downstream experiments, quality and quantity of gDNA fragments were both assessed using NanoDrop, Qubit, and Tapestation (Agilent).</p></sec><sec id="Sec12"><title>Sequencing library preparation—whole-genome bisulfite sequencing</title><p id="Par36">For each sample, 200 ng of sonicated fragments were used to make NGS (next-generation sequencing) libraries using NEBNext Ultra II DNA Library Prep (New England BioLabs, E7645S) in combination with methylated adaptors (NEB, E7535S), following the manufacturer’s instructions. Adaptor-ligated fragments were then purified with 1.0x Agencourt AMPure Beads (Beckman Coulter, Inc). Libraries were then treated with sodium bisulfite according to the manufacturer’s instructions (Imprint DNA Modification Kit; Sigma, MOD50) and amplified by PCR (10 cycles) using KAPA HiFi HS Uracil+ RM (KAPA Biosystems) and NEBNext Multiplex Oligos for Illumina (NEB E7335S). Bisulfite-converted libraries were finally size-selected and purified using 0.7x Agencourt AMPure Beads. The size and purity of libraries were determined using Tapestation and quantified using Qubit (Agilent). Whole-genome bisulfite sequencing (WGBS) libraries were sequenced on HiSeq 4000 (High Output mode, v.4 SBS chemistry) to generate paired-end 150 bp-long reads. <italic>A. stuartgranti</italic> samples were sequenced on HiSeq 2500 to generate paired-end 125 bp-long reads.</p></sec><sec id="Sec13"><title>Mapping of WGBS reads</title><p id="Par37">TrimGalore (options: --paired --fastqc --illumina; v0.6.2; github.com/FelixKrueger/TrimGalore) was used to determine the quality of sequenced read pairs and to remove Illumina adaptor sequences and low-quality reads/bases (Phred quality score &lt; 20). All adaptor-trimmed paired reads from each species were then aligned to the respective species-specific SNP-corrected <italic>M.zebra</italic> genomes (see above and Supplementary Data <xref ref-type="supplementary-material" rid="MOESM4">1</xref>) and to the lambda genome (to determine bisulfite non-conversion rate) using Bismark<sup><xref ref-type="bibr" rid="CR74">74</xref></sup> (v0.20.0). The alignment parameters were as follows: 0 mismatch allowed with a maximum insert size for valid paired-end alignments of 500 bp (options: -p5 -N 0 –X 500). Clonal mapped reads (i.e., PCR duplicates) were removed using Bismark’s deduplicate_bismark (see Supplementary Data <xref ref-type="supplementary-material" rid="MOESM4">1</xref>). Mapped reads for the same samples generated on multiple HiSeq runs were also merged.</p></sec><sec id="Sec14"><title>Differentially methylated regions (DMR) and comparative analysis</title><p id="Par38">Methylation at CpG sites was called using Bismark’s bismark_methylation_extractor (options: -p --multicore 9 --comprehensive --no_overlap --merge_non_CpG). DMRs (&gt;25% methylation difference, ≥50 bp, ≥4 CG and <italic>p</italic> &lt; 0.05) were predicted using DSS<sup><xref ref-type="bibr" rid="CR75">75</xref></sup> (v2.32.0). samtools (v1.9) and bedtools (v2.27.1) were used to generate averaged methylation levels across non-overlapping windows of various sizes genome-wide. ggplot2 (v3.3.0) and pheatmap (v1.0.12) were used to visualise methylome data and to produce unbiased hierarchal clustering (Euclidean’s distances and complete-linkage clustering). Spearman’s correlation matrices, Euclidean distances, and principal component analyses (scaled and centred) were produced using R (v3.6.0) functions cor, dist, and prcom, respectively. The minimum read overage requirement at any CpG sites for all analyses—except for DSS-predicted DMRs, for which all read coverage was used—was as follows: &gt;4 and ≤100 non-PCR-duplicate mapped paired-end reads. mCG % levels over 50 bp-long non-overlapping windows for all annotations were averaged for each tissue of each sample. The genome browser IGV (v2.5.2) was used to visualise DNA methylation levels genome-wide (% mCG/CG in 50 bp windows; bigwig format).</p></sec><sec id="Sec15"><title>Additional statistics</title><p id="Par39">Kruskal−Wallis H and Dunn’s multiple comparisons tests (using Benjamini−Hochberg correction, unless otherwise specified) were performed using FSA (v0.8.25). Box plots indicate median (middle line), 25th, 75th percentile (box), and 5th and 95th percentile (whiskers) as well as outliers (single points). Violin plots were generated using ggplot2 and represent rotated and mirrored kernel density plots.</p></sec><sec id="Sec16"><title>Genomic annotations</title><p id="Par40">The reference genome of <italic>M. zebra</italic> (UMD2a; NCBI genome build: GCF_000238955.4 and NCBI annotation release 104) was used to generate all annotations. Custom annotation files were generated and were defined as follows: promoter regions, TSS ± 500 bp unless otherwise indicated; gene bodies included both exons and introns and other intronic regions, and excluded the first 500 bp regions downstream of TSS to avoid any overlap with promoter regions; transposable elements and repetitive elements (TE<underline>)</underline> were modelled and annotated, as well as their sequence divergence analysed, using RepeatModeler (v1.0.11) and RepeatMasker (v4.0.9.p2), respectively. Intergenic regions were defined as genomic regions more than 0.5 kbp away from any gene. CpG-rich regions, or CpG islands (CGI), were predicted and annotated using makeCGI (v1.3.4)<sup><xref ref-type="bibr" rid="CR76">76</xref></sup>. The following genomes were used to compare genomic CG contents across different organisms (Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">5a</xref>): honey bee (<italic>A. melifera</italic>, Amel_4.5), nematode (<italic>C. elegans</italic>, WBcel235), <italic>Arabidopsis</italic> (<italic>A. thaliana</italic>, TAIR10), zebrafish (<italic>D. rerio</italic>, GRCz10), Mbuna cichlid <italic>Maylandia zebra</italic> (<italic>M. zebra</italic>, UMD1), West Indian Ocean coelacanth (<italic>L. chalumnae</italic>, LatCha.1), red junglefowl (<italic>G. gallus</italic>, Gall_5), grey whale (<italic>E. robustus</italic>, v1), human (<italic>H. sapiens</italic>, GRCh38.p10), mouse (<italic>M. musculus</italic>, GRCm38.p5), tammar wallaby (<italic>N. eugenii</italic>, Meug1.1). pfDMRs and transposon/repeat elements were assigned to a gene when they were located within gene bodies (from 0.5 kbp downstream TSS), within promoter regions (TSS ± 500 bp) and in the vicinity of genes (0.5−4 kbp away from genes).</p></sec><sec id="Sec17"><title>Enrichment analysis</title><p id="Par41">Enrichment analysis was calculated by shuffling each type of DMRs (liver, muscle, tissue) across the <italic>M.zebra</italic> UMD2a genome (accounting for the number of DMRs and length; 1000 iterations). The expected values were determined by intersecting shuffled DMRs with each genomic category. Chi-square tests were then performed for each Observed/Expected (O/E) distribution. The same process was performed for TE enrichment analysis.</p></sec><sec id="Sec18"><title>Gene Ontology (GO) enrichment analysis</title><p id="Par42">All GO enrichment analyses were performed using g:Profiler (<ext-link xlink:href="https://biit.cs.ut.ee/gprofiler/gost" ext-link-type="url">https://biit.cs.ut.ee/gprofiler/gost</ext-link>; version: e104_eg51_p15_3922dba [September 2020]). Only annotated genes for <italic>Maylandia zebra</italic> were used with a statistical cut-off of FDR &lt; 0.05 (unless otherwise specified).</p></sec><sec id="Sec19"><title>Sequence divergence</title><p id="Par43">A pairwise sequence divergence matrix was generated using a published dataset<sup><xref ref-type="bibr" rid="CR36">36</xref></sup>. Unrooted phylogenetic trees and heatmap were generated using the following R packages: phangorn (v.2.5.5), ape_5.4-1 and pheatmap (v.1.0.12).</p></sec><sec id="Sec20"><title>Total RNA extraction and RNA sequencing</title><p id="Par44">In brief, for each species, 2-3 biological replicates of liver and muscle tissues were used to sequence total RNA (see Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">1</xref> for a summary of the method and Supplementary Table <xref ref-type="supplementary-material" rid="MOESM1">1</xref> for sampling size). The same specimens were used for both RNAseq and WGBS.</p><p id="Par45">RNAseq libraries for both liver and muscle tissues were prepared using ~5−10 mg of RNA<italic>later</italic>-preserved homogenised liver and muscle tissues. Total RNA was isolated using a phenol/chloroform method following the manufacturer’s instructions (TRIzol, ThermoFisher). RNA samples were treated with DNase (TURBO DNase, ThermoFisher) to remove any DNA contamination. The quality and quantity of total RNA extracts were determined using NanoDrop spectrophotometer (ThermoFisher), Qubit (ThermoFisher), and BioAnalyser (Agilent). Following ribosomal RNA depletion (RiboZero, Illumina), stranded rRNA-depleted RNA libraries (Illumina) were prepped according to the manufacturer’s instructions and sequenced (paired-end 75bp-long reads) on HiSeq2500 V4 (Illumina) by the sequencing facility of the Wellcome Sanger Institute. Published RNAseq dataset<sup><xref ref-type="bibr" rid="CR36">36</xref></sup> for all <italic>A. calliptera</italic> sp. Itupi tissues were used (NCBI Short Read Archive BioProjects <ext-link xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/?term=PRJEB1254" ext-link-type="url">PRJEB1254</ext-link> and <ext-link xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/?term=PRJEB15289" ext-link-type="url">PRJEB15289</ext-link>).</p></sec><sec id="Sec21"><title>RNAseq reads mapping and gene quantification</title><p id="Par46">TrimGalore (options: --paired --fastqc --illumina; v0.6.2; <ext-link xlink:href="https://github.com/FelixKrueger/TrimGalore" ext-link-type="url">https://github.com/FelixKrueger/TrimGalore</ext-link>) was used to determine the quality of sequenced read pairs and to remove Illumina adaptor sequences and low-quality reads/bases (Phred quality score &lt;20). Reads were then aligned to the <italic>M. zebra</italic> transcriptome (UMD2a; NCBI genome build: GCF_000238955.4 and NCBI annotation release 104) and the expression value for each transcript was quantified in transcripts per million (TPM) using kallisto<sup><xref ref-type="bibr" rid="CR77">77</xref></sup> (options: quant --bias -b 100 -t 1; v0.46.0). For all downstream analyses, gene expression values for each tissue were averaged for each species.</p><p id="Par47">To assess transcription variation across samples, a Spearman’s rank correlation matrix using overall gene expression values was produced with the R function cor. Unsupervised clustering and heatmaps were produced with R packages ggplot2 (v3.3.0) and pheatmap (v1.0.12; see above). Heatmaps of gene expression show scaled TPM values (<italic>Z</italic>-score).</p></sec><sec id="Sec22"><title>Differential gene expression (DEG) analysis</title><p id="Par48">Differential gene expression analysis was performed using sleuth<sup><xref ref-type="bibr" rid="CR78">78</xref></sup> (v0.30.0; Wald test, false discovery rate adjusted two-sided <italic>p</italic>-value, using Benjamini−Hochberg &lt;0.01). Only DEGs with gene expression difference of ≥50 TPM between at least one species pairwise comparison were analysed further.</p></sec><sec id="Sec23"><title>Correlation between methylation variation and differential transcriptional activity</title><p id="Par49">To study the correlation between methylome and gene expression levels (Fig. <xref rid="Fig1" ref-type="fig">1e</xref> and Supplementary Fig. <xref ref-type="supplementary-material" rid="MOESM1">7</xref>), genes were binned into 11 categories based on their expression levels (increasing gene expression levels, from category 1 to 10); cat “OFF” grouped silent/not expressed genes, i.e., TPM = 0 in all replicates for a particular species. RL liver (<italic>n</italic> = 2 biological replicates): 10 ‘ON’ categories, <italic>n</italic> = 2,129 each; 1 ‘OFF’ category, <italic>n</italic> = 5,331. MZ liver (<italic>n</italic> = 3 biological replicates): 10 ‘ON’ categories, <italic>n</italic> = 2,199 each; 1 ‘OFF’ category, <italic>n</italic> = 4,704. RL muscle (<italic>n</italic> = 2 biological replicates): 10 ‘ON’ categories, <italic>n</italic> = 2,101 each; 1 ‘OFF’ category, <italic>n</italic> = 4,622. Promoters (500 bp ± TSS) and gene bodies were also binned into 10 categories according to methylation levels (0−100% average methylation levels, by 10% DNA methylation increment); RL liver (<italic>n</italic> = 2 biological replicates), 11 categories, <italic>n</italic> ranging from 34 to 11,202 per category. MZ liver (<italic>n</italic> = 3 biological replicates), 11 categories, <italic>n</italic> ranging from 28 to 11,192 per category. RL muscle (<italic>n</italic> = 2 biological replicates), 11 categories, <italic>n</italic> ranging from 60 to 9,946 per category. Categories were generated using the R script tidyverse (v1.3.0) and graphs were generated using deepTools v.3.2.1. TPM values and methylation levels were averaged for each tissue and each species.</p></sec><sec id="Sec24"><title>Reporting summary</title><p id="Par50">Further information on research design is available in the <xref ref-type="supplementary-material" rid="MOESM5">Nature Research Reporting Summary</xref> linked to this article.</p></sec></sec></body><back><ack><title>Acknowledgements</title><p>We would like to thank S.M. Grant’s diving team for collecting some of the fish specimens, as well as the Fisheries Research Unit of the Government of Malawi, and the Tanzania Fisheries Research Institute, for their assistance and support. We would like to thank the staff at the Gurdon Institute and the sequencing facilities at CRUK Cambridge Institute, Gurdon, and Sanger Institutes for their expertise and support. We would like to thank the members of the Miska Lab as well as the Cambridge Cichlid community for fruitful discussions. We thank Navin B. Ramakrishna for critical comments on the manuscript, as well as David Jordan, Tomás di Domenico and Konrad L.M. Rudolph for their support with data analysis. We are grateful to Ole Seehausen and Marcel Häsler (University of Bern, Switzerland) for providing PN tissues. We thank Alan Hudson for help with sample collection. The map of Africa (Fig. 1a) was downloaded and modified from <ext-link xlink:href="https://www.d-maps.com/carte.php?num_car=733&amp;lang=en" ext-link-type="url">https://www.d-maps.com/carte.php?num_car=733&amp;lang=en</ext-link>. This work was supported by the following grants to E.A.M.: Wellcome Trust Senior Investigator Award (104640/Z/14/Z and 219475/Z/19/Z) and CRUK award (C13474/A27826); to R.D.: Wellcome award (WT207492); to G.F.T. and M.J.G., the Leverhulme Trust—Royal Society Africa Awards (AA100023 and AA130107), and NERC award (NE/S001794/1). G.V. thanks Wolfson College, University of Cambridge, and the Genetics Society, London for financial support. The authors also acknowledge core funding to the Gurdon Institute from Wellcome (092096/Z/10/Z, 203144/Z/16/Z) and CRUK (C6946/A24843). For Open Access, the author has applied a CC BY public copyright licence to any Author Accepted Manuscript version arising from this submission.</p></ack><sec sec-type="author-contribution"><title>Author contributions</title><p>G.V. and E.A.M. devised and supervised the study; G.V. and E.A.M. interpreted the results with contributions from G.F.T., M.J.G, M.E.S., M.M. and R.D.; G.V. performed all experiments and analyses with contribution from M.M. (SNP-corrected genomes); M.D., H.S., M.M., R.D., M.J.G., G.F.T., and A.M.T. collected and provided tissues from wild-caught cichlid specimens; M.D. extracted total RNA samples; G.V. and E.A.M. wrote the paper with comments and contribution from all authors.</p></sec><sec sec-type="data-availability"><title>Data availability</title><p>The data that support this study are available from the corresponding authors upon reasonable request. All raw sequencing reads (WGBS, RNAseq, and SNP-corrected genomes), and processed data generated in the course of this study have been deposited in the Gene Expression Omnibus (GEO) database under the accession number <ext-link xlink:href="https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE158514" ext-link-type="url">GSE158514</ext-link>. Sample accessions are listed in Supplementary Data <xref ref-type="supplementary-material" rid="MOESM4">1</xref>. In addition, variant call files (for SNP-corrected genomes and pairwise whole-genome sequence divergence), as well as RNAseq for <italic>A. calliptera</italic> tissues were downloaded from NCBI Short Read Archive BioProjects <ext-link xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/?term=PRJEB1254" ext-link-type="url">PRJEB1254</ext-link> and <ext-link xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/?term=PRJEB15289" ext-link-type="url">PRJEB15289</ext-link>. The source data are provided with this paper.</p></sec><sec sec-type="data-availability"><title>Code availability</title><p>The code used to generate SNP-substituted genomes is available as a part of the Evo package (<ext-link xlink:href="https://github.com/millanek/evo" ext-link-type="url">https://github.com/millanek/evo</ext-link>; v.0.1 r24, commit99d5b22).</p></sec><sec sec-type="ethics-statement"><sec id="FPar1" sec-type="COI-statement"><title>Competing interests</title><p id="Par51">The authors declare no competing interests.</p></sec></sec><ref-list id="Bib1"><title>References</title><ref-list><ref id="CR1"><label>1.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jablonka</surname><given-names>E</given-names></name><name><surname>Raz</surname><given-names>G</given-names></name></person-group><article-title xml:lang="en">Transgenerational epigenetic inheritance: prevalence, mechanisms, and implications for the study of heredity and evolution</article-title><source>Q. Rev. Biol.</source><year>2009</year><volume>84</volume><fpage>131</fpage><lpage>176</lpage><pub-id pub-id-type="pmid">19606595</pub-id><pub-id pub-id-type="doi">10.1086/598822</pub-id><pub-id pub-id-type="pmcid">19606595</pub-id></mixed-citation></ref><ref id="CR2"><label>2.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Miska</surname><given-names>EA</given-names></name><name><surname>Ferguson-Smith</surname><given-names>AC</given-names></name></person-group><article-title xml:lang="en">Transgenerational inheritance: models and mechanisms of non-DNA sequence-based inheritance</article-title><source>Science</source><year>2016</year><volume>354</volume><fpage>59</fpage><lpage>63</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC28Xhs1SktrjJ</pub-id><pub-id pub-id-type="pmid">27846492</pub-id><pub-id pub-id-type="doi">10.1126/science.aaf4945</pub-id><pub-id pub-id-type="bibcode">2016Sci...354...59M</pub-id><pub-id pub-id-type="pmcid">27846492</pub-id></mixed-citation></ref><ref id="CR3"><label>3.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cavalli</surname><given-names>G</given-names></name><name><surname>Heard</surname><given-names>E</given-names></name></person-group><article-title xml:lang="en">Advances in epigenetics link genetics to the environment and disease</article-title><source>Nature</source><year>2019</year><volume>571</volume><fpage>489</fpage><lpage>499</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC1MXhsVeqs7rO</pub-id><pub-id pub-id-type="pmid">31341302</pub-id><pub-id pub-id-type="doi">10.1038/s41586-019-1411-0</pub-id><pub-id pub-id-type="bibcode">2019Natur.571..489C</pub-id><pub-id pub-id-type="pmcid">31341302</pub-id></mixed-citation></ref><ref id="CR4"><label>4.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Heard</surname><given-names>E</given-names></name><name><surname>Martienssen</surname><given-names>RA</given-names></name></person-group><article-title xml:lang="en">Transgenerational epigenetic inheritance: myths and mechanisms</article-title><source>Cell</source><year>2014</year><volume>157</volume><fpage>95</fpage><lpage>109</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2cXmtVCnurs%3D</pub-id><pub-id pub-id-type="pmid">24679529</pub-id><pub-id pub-id-type="pmcid">4020004</pub-id><pub-id pub-id-type="doi">10.1016/j.cell.2014.02.045</pub-id></mixed-citation></ref><ref id="CR5"><label>5.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Morgan</surname><given-names>HD</given-names></name><name><surname>Sutherland</surname><given-names>HGE</given-names></name><name><surname>Martin</surname><given-names>DIK</given-names></name><name><surname>Whitelaw</surname><given-names>E</given-names></name></person-group><article-title xml:lang="en">Epigenetic inheritance at the agouti locus in the mouse</article-title><source>Nat. Genet.</source><year>1999</year><volume>23</volume><fpage>314</fpage><lpage>318</lpage><pub-id pub-id-type="coi">1:CAS:528:DyaK1MXnt1Gns7w%3D</pub-id><pub-id pub-id-type="pmid">10545949</pub-id><pub-id pub-id-type="doi">10.1038/15490</pub-id><pub-id pub-id-type="pmcid">10545949</pub-id></mixed-citation></ref><ref id="CR6"><label>6.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cubas</surname><given-names>P</given-names></name><name><surname>Vincent</surname><given-names>C</given-names></name><name><surname>Coen</surname><given-names>E</given-names></name></person-group><article-title xml:lang="en">An epigenetic mutation responsible for natural variation in floral symmetry</article-title><source>Nature</source><year>1999</year><volume>401</volume><fpage>157</fpage><lpage>161</lpage><pub-id pub-id-type="coi">1:CAS:528:DyaK1MXlvFKhu7Y%3D</pub-id><pub-id pub-id-type="pmid">10490023</pub-id><pub-id pub-id-type="doi">10.1038/43657</pub-id><pub-id pub-id-type="bibcode">1999Natur.401..157C</pub-id><pub-id pub-id-type="pmcid">10490023</pub-id></mixed-citation></ref><ref id="CR7"><label>7.</label><mixed-citation publication-type="other">Vernaz, G. et al. Epigenetic divergence during early stages of speciation in an African crater lake cichlid fish. Preprint at <italic>bioRxiv</italic><ext-link xlink:href="https://doi.org/10.1101/2021.07.30.435319" ext-link-type="doi">https://doi.org/10.1101/2021.07.30.435319</ext-link> (2021).</mixed-citation></ref><ref id="CR8"><label>8.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zemach</surname><given-names>A</given-names></name><name><surname>McDaniel</surname><given-names>IE</given-names></name><name><surname>Silva</surname><given-names>P</given-names></name><name><surname>Zilberman</surname><given-names>D</given-names></name></person-group><article-title xml:lang="en">Genome-wide evolutionary analysis of eukaryotic DNA methylation</article-title><source>Science</source><year>2010</year><volume>328</volume><fpage>916</fpage><lpage>919</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC3cXlvVelt7o%3D</pub-id><pub-id pub-id-type="pmid">20395474</pub-id><pub-id pub-id-type="doi">10.1126/science.1186366</pub-id><pub-id pub-id-type="bibcode">2010Sci...328..916Z</pub-id><pub-id pub-id-type="pmcid">20395474</pub-id></mixed-citation></ref><ref id="CR9"><label>9.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Feng</surname><given-names>S</given-names></name><etal/></person-group><article-title xml:lang="en">Conservation and divergence of methylation patterning in plants and animals</article-title><source>Proc. Natl Acad. Sci. USA</source><year>2010</year><volume>107</volume><fpage>8689</fpage><lpage>8694</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC3cXmsVOrsbo%3D</pub-id><pub-id pub-id-type="pmid">20395551</pub-id><pub-id pub-id-type="pmcid">2889301</pub-id><pub-id pub-id-type="doi">10.1073/pnas.1002720107</pub-id><pub-id pub-id-type="bibcode">2010PNAS..107.8689F</pub-id></mixed-citation></ref><ref id="CR10"><label>10.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Suzuki</surname><given-names>MM</given-names></name><name><surname>Bird</surname><given-names>A</given-names></name></person-group><article-title xml:lang="en">DNA methylation landscapes: provocative insights from epigenomics</article-title><source>Nat. Rev. Genet.</source><year>2008</year><volume>9</volume><fpage>465</fpage><lpage>476</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BD1cXlvFKrtL0%3D</pub-id><pub-id pub-id-type="pmid">18463664</pub-id><pub-id pub-id-type="doi">10.1038/nrg2341</pub-id></mixed-citation></ref><ref id="CR11"><label>11.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kawakatsu</surname><given-names>T</given-names></name><etal/></person-group><article-title xml:lang="en">Epigenomic diversity in a global collection of Arabidopsis thaliana accessions</article-title><source>Cell</source><year>2016</year><volume>166</volume><fpage>492</fpage><lpage>505</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC28XhtFynu7bO</pub-id><pub-id pub-id-type="pmid">27419873</pub-id><pub-id pub-id-type="pmcid">5172462</pub-id><pub-id pub-id-type="doi">10.1016/j.cell.2016.06.044</pub-id></mixed-citation></ref><ref id="CR12"><label>12.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Quadrana</surname><given-names>L</given-names></name><name><surname>Colot</surname><given-names>V</given-names></name></person-group><article-title xml:lang="en">Plant transgenerational epigenetics</article-title><source>Annu. Rev. Genet.</source><year>2016</year><volume>50</volume><fpage>467</fpage><lpage>491</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC28Xhs1ykt7zF</pub-id><pub-id pub-id-type="pmid">27732791</pub-id><pub-id pub-id-type="doi">10.1146/annurev-genet-120215-035254</pub-id></mixed-citation></ref><ref id="CR13"><label>13.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cortijo</surname><given-names>S</given-names></name><etal/></person-group><article-title xml:lang="en">Mapping the epigenetic basis of complex traits</article-title><source>Science</source><year>2014</year><volume>343</volume><fpage>1145</fpage><lpage>1148</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2cXjsVegs7k%3D</pub-id><pub-id pub-id-type="pmid">24505129</pub-id><pub-id pub-id-type="doi">10.1126/science.1248127</pub-id><pub-id pub-id-type="bibcode">2014Sci...343.1145C</pub-id></mixed-citation></ref><ref id="CR14"><label>14.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Best</surname><given-names>C</given-names></name><etal/></person-group><article-title xml:lang="en">Epigenetics in teleost fish: from molecular mechanisms to physiological phenotypes</article-title><source>Comp. Biochem. Physiol. Part B Biochem. Mol. Biol.</source><year>2018</year><volume>224</volume><fpage>210</fpage><lpage>244</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC1cXitl2qs7s%3D</pub-id><pub-id pub-id-type="doi">10.1016/j.cbpb.2018.01.006</pub-id></mixed-citation></ref><ref id="CR15"><label>15.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Seritrakul</surname><given-names>P</given-names></name><name><surname>Gross</surname><given-names>JM</given-names></name></person-group><article-title xml:lang="en">Expression of the de novo DNA methyltransferases (dnmt3 - dnmt8) during zebrafish lens development</article-title><source>Dev. Dyn.</source><year>2014</year><volume>243</volume><fpage>350</fpage><lpage>356</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2cXht1ehsbw%3D</pub-id><pub-id pub-id-type="pmid">24123478</pub-id><pub-id pub-id-type="doi">10.1002/dvdy.24077</pub-id></mixed-citation></ref><ref id="CR16"><label>16.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rai</surname><given-names>K</given-names></name><etal/></person-group><article-title xml:lang="en">Zebra fish Dnmt1 and Suv39h1 regulate organ-specific terminal differentiation during development</article-title><source>Mol. Cell. Biol.</source><year>2006</year><volume>26</volume><fpage>7077</fpage><lpage>7085</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BD28XhtVCltbnF</pub-id><pub-id pub-id-type="pmid">16980612</pub-id><pub-id pub-id-type="pmcid">1592902</pub-id><pub-id pub-id-type="doi">10.1128/MCB.00312-06</pub-id></mixed-citation></ref><ref id="CR17"><label>17.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Law</surname><given-names>JA</given-names></name><name><surname>Jacobsen</surname><given-names>SE</given-names></name></person-group><article-title xml:lang="en">Establishing, maintaining and modifying DNA methylation patterns in plants and animals</article-title><source>Nat. Rev. Genet.</source><year>2010</year><volume>11</volume><fpage>204</fpage><lpage>220</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC3cXitFCrsLk%3D</pub-id><pub-id pub-id-type="pmid">20142834</pub-id><pub-id pub-id-type="pmcid">3034103</pub-id><pub-id pub-id-type="doi">10.1038/nrg2719</pub-id></mixed-citation></ref><ref id="CR18"><label>18.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Deniz</surname><given-names>Ö</given-names></name><name><surname>Frost</surname><given-names>JM</given-names></name><name><surname>Branco</surname><given-names>MR</given-names></name></person-group><article-title xml:lang="en">Regulation of transposable elements by DNA modifications</article-title><source>Nat. Rev. Genet.</source><year>2019</year><volume>20</volume><fpage>417</fpage><lpage>431</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC1MXmslKhurk%3D</pub-id><pub-id pub-id-type="pmid">30867571</pub-id><pub-id pub-id-type="doi">10.1038/s41576-019-0117-3</pub-id><pub-id pub-id-type="pmcid">30867571</pub-id></mixed-citation></ref><ref id="CR19"><label>19.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bestor</surname><given-names>TH</given-names></name></person-group><article-title xml:lang="en">DNA methylation: evolution of a bacterial immune function into a regulator of gene expression and genome structure in higher eukaryotes</article-title><source>Phil. Trans. R. Soc. Lond. B, Biol. Sci.</source><year>1990</year><volume>326</volume><fpage>179</fpage><lpage>187</lpage><pub-id pub-id-type="coi">1:STN:280:DyaK3c7nsFKntg%3D%3D</pub-id><pub-id pub-id-type="doi">10.1098/rstb.1990.0002</pub-id><pub-id pub-id-type="bibcode">1990RSPTB.326..179B</pub-id></mixed-citation></ref><ref id="CR20"><label>20.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Greenberg</surname><given-names>MVC</given-names></name><name><surname>Bourc’his</surname><given-names>D</given-names></name></person-group><article-title xml:lang="en">The diverse roles of DNA methylation in mammalian development and disease</article-title><source>Nat. Rev. Mol. Cell Biol.</source><year>2019</year><volume>20</volume><fpage>590</fpage><lpage>607</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC1MXhsFGjtbfO</pub-id><pub-id pub-id-type="pmid">31399642</pub-id><pub-id pub-id-type="doi">10.1038/s41580-019-0159-6</pub-id></mixed-citation></ref><ref id="CR21"><label>21.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname><given-names>ZD</given-names></name><name><surname>Meissner</surname><given-names>A</given-names></name></person-group><article-title xml:lang="en">DNA methylation: roles in mammalian development</article-title><source>Nat. Rev. Genet.</source><year>2013</year><volume>14</volume><fpage>204</fpage><lpage>220</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC3sXitlaku7Y%3D</pub-id><pub-id pub-id-type="pmid">23400093</pub-id><pub-id pub-id-type="doi">10.1038/nrg3354</pub-id></mixed-citation></ref><ref id="CR22"><label>22.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yin</surname><given-names>Y</given-names></name><etal/></person-group><article-title xml:lang="en">Impact of cytosine methylation on DNA binding specificities of human transcription factors</article-title><source>Science</source><year>2017</year><volume>356</volume><fpage>eaaj2239</fpage><pub-id pub-id-type="pmid">28473536</pub-id><pub-id pub-id-type="pmcid">8009048</pub-id><pub-id pub-id-type="doi">10.1126/science.aaj2239</pub-id><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2sXmvVGnsb8%3D</pub-id></mixed-citation></ref><ref id="CR23"><label>23.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Du</surname><given-names>J</given-names></name><name><surname>Johnson</surname><given-names>LM</given-names></name><name><surname>Jacobsen</surname><given-names>SE</given-names></name><name><surname>Patel</surname><given-names>DJ</given-names></name></person-group><article-title xml:lang="en">DNA methylation pathways and their crosstalk with histone methylation</article-title><source>Nat. Rev. Mol. Cell Biol.</source><year>2015</year><volume>16</volume><fpage>519</fpage><lpage>532</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2MXhtlOrtrvO</pub-id><pub-id pub-id-type="pmid">26296162</pub-id><pub-id pub-id-type="pmcid">4672940</pub-id><pub-id pub-id-type="doi">10.1038/nrm4043</pub-id></mixed-citation></ref><ref id="CR24"><label>24.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schübeler</surname><given-names>D</given-names></name></person-group><article-title xml:lang="en">Function and information content of DNA methylation</article-title><source>Nature</source><year>2015</year><volume>517</volume><fpage>321</fpage><lpage>326</lpage><pub-id pub-id-type="pmid">25592537</pub-id><pub-id pub-id-type="doi">10.1038/nature14192</pub-id><pub-id pub-id-type="bibcode">2015Natur.517..321S</pub-id><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2MXpvV2mtw%3D%3D</pub-id></mixed-citation></ref><ref id="CR25"><label>25.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname><given-names>H</given-names></name><name><surname>Wang</surname><given-names>G</given-names></name><name><surname>Qian</surname><given-names>J</given-names></name></person-group><article-title xml:lang="en">Transcription factors as readers and effectors of DNA methylation</article-title><source>Nat. Rev. Genet.</source><year>2016</year><volume>17</volume><fpage>551</fpage><lpage>565</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC28Xht1GrtLvJ</pub-id><pub-id pub-id-type="pmid">27479905</pub-id><pub-id pub-id-type="pmcid">5559737</pub-id><pub-id pub-id-type="doi">10.1038/nrg.2016.83</pub-id></mixed-citation></ref><ref id="CR26"><label>26.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hon</surname><given-names>GC</given-names></name><etal/></person-group><article-title xml:lang="en">Epigenetic memory at embryonic enhancers identified in DNA methylation maps from adult mouse tissues</article-title><source>Nat. Genet.</source><year>2013</year><volume>45</volume><fpage>1198</fpage><lpage>1206</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC3sXhtlGltL7P</pub-id><pub-id pub-id-type="pmid">23995138</pub-id><pub-id pub-id-type="pmcid">4095776</pub-id><pub-id pub-id-type="doi">10.1038/ng.2746</pub-id></mixed-citation></ref><ref id="CR27"><label>27.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>West-Eberhard</surname><given-names>MJ</given-names></name></person-group><article-title xml:lang="en">Developmental plasticity and the origin of species differences</article-title><source>Proc. Natl Acad. Sci. USA</source><year>2005</year><volume>102</volume><fpage>6543</fpage><lpage>6549</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BD2MXktlais7g%3D</pub-id><pub-id pub-id-type="pmid">15851679</pub-id><pub-id pub-id-type="pmcid">1131862</pub-id><pub-id pub-id-type="doi">10.1073/pnas.0501844102</pub-id><pub-id pub-id-type="bibcode">2005PNAS..102.6543W</pub-id></mixed-citation></ref><ref id="CR28"><label>28.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kazachenka</surname><given-names>A</given-names></name><etal/></person-group><article-title xml:lang="en">Identification, characterization, and heritability of murine metastable epialleles: implications for non-genetic inheritance</article-title><source>Cell</source><year>2018</year><volume>175</volume><fpage>1259</fpage><lpage>1271.e13</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC1cXitVWju7zN</pub-id><pub-id pub-id-type="pmid">30454646</pub-id><pub-id pub-id-type="pmcid">6242299</pub-id><pub-id pub-id-type="doi">10.1016/j.cell.2018.09.043</pub-id></mixed-citation></ref><ref id="CR29"><label>29.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gore</surname><given-names>AV</given-names></name><etal/></person-group><article-title xml:lang="en">An epigenetic mechanism for cavefish eye degeneration</article-title><source>Nat. Ecol. Evol.</source><year>2018</year><volume>2</volume><fpage>1155</fpage><lpage>1160</lpage><pub-id pub-id-type="pmid">29807993</pub-id><pub-id pub-id-type="pmcid">6023768</pub-id><pub-id pub-id-type="doi">10.1038/s41559-018-0569-4</pub-id></mixed-citation></ref><ref id="CR30"><label>30.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Skvortsova</surname><given-names>K</given-names></name><name><surname>Iovino</surname><given-names>N</given-names></name><name><surname>Bogdanović</surname><given-names>O</given-names></name></person-group><article-title xml:lang="en">Functions and mechanisms of epigenetic inheritance in animals</article-title><source>Nat. Rev. Mol. Cell Biol.</source><year>2018</year><volume>19</volume><fpage>774</fpage><lpage>790</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC1cXit1Sgur3O</pub-id><pub-id pub-id-type="pmid">30425324</pub-id><pub-id pub-id-type="doi">10.1038/s41580-018-0074-2</pub-id></mixed-citation></ref><ref id="CR31"><label>31.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ryu</surname><given-names>T</given-names></name><name><surname>Veilleux</surname><given-names>HD</given-names></name><name><surname>Donelson</surname><given-names>JM</given-names></name><name><surname>Munday</surname><given-names>PL</given-names></name><name><surname>Ravasi</surname><given-names>T</given-names></name></person-group><article-title xml:lang="en">The epigenetic landscape of transgenerational acclimation to ocean warming</article-title><source>Nat. Clim. Chang.</source><year>2018</year><volume>8</volume><fpage>504</fpage><lpage>509</lpage><pub-id pub-id-type="doi">10.1038/s41558-018-0159-0</pub-id><pub-id pub-id-type="bibcode">2018NatCC...8..504R</pub-id></mixed-citation></ref><ref id="CR32"><label>32.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Moran</surname><given-names>D</given-names></name><name><surname>Softley</surname><given-names>R</given-names></name><name><surname>Warrant</surname><given-names>EJ</given-names></name></person-group><article-title xml:lang="en">The energetic cost of vision and the evolution of eyeless Mexican cavefish</article-title><source>Sci. Adv.</source><year>2015</year><volume>1</volume><fpage>e1500363</fpage><pub-id pub-id-type="pmid">26601263</pub-id><pub-id pub-id-type="pmcid">4643782</pub-id><pub-id pub-id-type="doi">10.1126/sciadv.1500363</pub-id><pub-id pub-id-type="bibcode">2015SciA....1E0363M</pub-id></mixed-citation></ref><ref id="CR33"><label>33.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Turner</surname><given-names>GF</given-names></name></person-group><article-title xml:lang="en">Adaptive radiation of cichlid fish</article-title><source>Curr. Biol.</source><year>2007</year><volume>17</volume><fpage>R827</fpage><lpage>R831</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BD2sXhtFCjtL3L</pub-id><pub-id pub-id-type="pmid">17925206</pub-id><pub-id pub-id-type="doi">10.1016/j.cub.2007.07.026</pub-id></mixed-citation></ref><ref id="CR34"><label>34.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Salzburger</surname><given-names>W</given-names></name></person-group><article-title xml:lang="en">Understanding explosive diversification through cichlid fish genomics</article-title><source>Nat. Rev. Genet.</source><year>2018</year><volume>19</volume><fpage>705</fpage><lpage>717</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC1cXhsFahsb3M</pub-id><pub-id pub-id-type="pmid">30111830</pub-id><pub-id pub-id-type="doi">10.1038/s41576-018-0043-9</pub-id></mixed-citation></ref><ref id="CR35"><label>35.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Malinsky</surname><given-names>M</given-names></name><name><surname>Salzburger</surname><given-names>W</given-names></name></person-group><article-title xml:lang="en">Environmental context for understanding the iconic adaptive radiation of cichlid fishes in Lake Malawi</article-title><source>Proc. Natl Acad. Sci. USA</source><year>2016</year><volume>113</volume><fpage>11654</fpage><lpage>11656</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC28XhslSqtrrL</pub-id><pub-id pub-id-type="pmid">27791049</pub-id><pub-id pub-id-type="pmcid">5081610</pub-id><pub-id pub-id-type="doi">10.1073/pnas.1614272113</pub-id><pub-id pub-id-type="bibcode">2016PNAS..11311654M</pub-id></mixed-citation></ref><ref id="CR36"><label>36.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Malinsky</surname><given-names>M</given-names></name><etal/></person-group><article-title xml:lang="en">Whole-genome sequences of Malawi cichlids reveal multiple radiations interconnected by gene flow</article-title><source>Nat. Ecol. Evol.</source><year>2018</year><volume>2</volume><fpage>1940</fpage><lpage>1955</lpage><pub-id pub-id-type="pmid">30455444</pub-id><pub-id pub-id-type="pmcid">6443041</pub-id><pub-id pub-id-type="doi">10.1038/s41559-018-0717-x</pub-id></mixed-citation></ref><ref id="CR37"><label>37.</label><mixed-citation publication-type="other">Konings, A. <italic>Malawi Cichlids in their Natural Habitat</italic> (Cichlid Press, 2016).</mixed-citation></ref><ref id="CR38"><label>38.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Brawand</surname><given-names>D</given-names></name><etal/></person-group><article-title xml:lang="en">The genomic substrate for adaptive radiation in African cichlid fish</article-title><source>Nature</source><year>2014</year><volume>513</volume><fpage>375</fpage><lpage>381</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2cXhsFOlu7bM</pub-id><pub-id pub-id-type="pmid">25186727</pub-id><pub-id pub-id-type="pmcid">4353498</pub-id><pub-id pub-id-type="doi">10.1038/nature13726</pub-id><pub-id pub-id-type="bibcode">2014Natur.513..375B</pub-id></mixed-citation></ref><ref id="CR39"><label>39.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Genner</surname><given-names>MJ</given-names></name><name><surname>Turner</surname><given-names>GF</given-names></name></person-group><article-title xml:lang="en">Ancient hybridization and phenotypic novelty within Lake Malawi’s cichlid fish radiation</article-title><source>Mol. Biol. Evol.</source><year>2012</year><volume>29</volume><fpage>195</fpage><lpage>206</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC3MXhs1ynurnE</pub-id><pub-id pub-id-type="pmid">22114359</pub-id><pub-id pub-id-type="doi">10.1093/molbev/msr183</pub-id></mixed-citation></ref><ref id="CR40"><label>40.</label><mixed-citation publication-type="other">Turner, G. F., Ngatunga, B. P. &amp; Genner, M. J. The natural history of the satellite lakes of Lake Malawi. <italic>EcoEvoRxiv</italic>. <ext-link xlink:href="https://doi.org/10.32942/osf.io/sehdq" ext-link-type="doi">https://doi.org/10.32942/osf.io/sehdq</ext-link> (2019).</mixed-citation></ref><ref id="CR41"><label>41.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Long</surname><given-names>HK</given-names></name><etal/></person-group><article-title xml:lang="en">Epigenetic conservation at gene regulatory elements revealed by non-methylated DNA profiling in seven vertebrates</article-title><source>Elife</source><year>2013</year><volume>2013</volume><fpage>1</fpage><lpage>19</lpage><pub-id pub-id-type="bibcode">2013lds..book.....L</pub-id></mixed-citation></ref><ref id="CR42"><label>42.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Deaton</surname><given-names>AM</given-names></name><name><surname>Bird</surname><given-names>A</given-names></name></person-group><article-title xml:lang="en">CpG islands and the regulation of transcription</article-title><source>Genes Dev.</source><year>2011</year><volume>25</volume><fpage>1010</fpage><lpage>1022</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC3MXmslOgsLY%3D</pub-id><pub-id pub-id-type="pmid">3093116</pub-id><pub-id pub-id-type="pmcid">3093116</pub-id><pub-id pub-id-type="doi">10.1101/gad.2037511</pub-id></mixed-citation></ref><ref id="CR43"><label>43.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Conte</surname><given-names>MA</given-names></name><etal/></person-group><article-title xml:lang="en">Chromosome-scale assemblies reveal the structural evolution of African cichlid genomes</article-title><source>Gigascience</source><year>2019</year><volume>8</volume><fpage>1</fpage><lpage>20</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BB3cXotlOisw%3D%3D</pub-id><pub-id pub-id-type="doi">10.1093/gigascience/giz030</pub-id></mixed-citation></ref><ref id="CR44"><label>44.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yin</surname><given-names>Y</given-names></name><etal/></person-group><article-title xml:lang="en">Impact of cytosine methylation on DNA binding specificities of human transcription factors</article-title><source>Science</source><year>2017</year><volume>356</volume><fpage>eaaj2239</fpage><pub-id pub-id-type="pmid">28473536</pub-id><pub-id pub-id-type="pmcid">8009048</pub-id><pub-id pub-id-type="doi">10.1126/science.aaj2239</pub-id><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2sXmvVGnsb8%3D</pub-id></mixed-citation></ref><ref id="CR45"><label>45.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chuong</surname><given-names>EB</given-names></name><name><surname>Elde</surname><given-names>NC</given-names></name><name><surname>Feschotte</surname><given-names>C</given-names></name></person-group><article-title xml:lang="en">Regulatory activities of transposable elements: from conflicts to benefits</article-title><source>Nat. Rev. Genet.</source><year>2017</year><volume>18</volume><fpage>71</fpage><lpage>86</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC28XhvV2iur7P</pub-id><pub-id pub-id-type="pmid">27867194</pub-id><pub-id pub-id-type="doi">10.1038/nrg.2016.139</pub-id><pub-id pub-id-type="pmcid">27867194</pub-id></mixed-citation></ref><ref id="CR46"><label>46.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Santos</surname><given-names>ME</given-names></name><etal/></person-group><article-title xml:lang="en">The evolution of cichlid fish egg-spots is linked with a cis-regulatory change</article-title><source>Nat. Commun.</source><year>2014</year><volume>5</volume><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2cXitVaksLfP</pub-id><pub-id pub-id-type="pmid">25296686</pub-id><pub-id pub-id-type="doi">10.1038/ncomms6149</pub-id><pub-id pub-id-type="bibcode">2014NatCo...5.5149S</pub-id><pub-id pub-id-type="pmcid">25296686</pub-id></mixed-citation></ref><ref id="CR47"><label>47.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fedoroff</surname><given-names>NV</given-names></name></person-group><article-title xml:lang="en">Transposable elements, epigenetics, and genome evolution</article-title><source>Science</source><year>2012</year><volume>338</volume><fpage>758</fpage><lpage>767</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC38Xhslagt7%2FO</pub-id><pub-id pub-id-type="pmid">23145453</pub-id><pub-id pub-id-type="pmcid">23145453</pub-id><pub-id pub-id-type="doi">10.1126/science.338.6108.758</pub-id><pub-id pub-id-type="bibcode">2012Sci...338..758F</pub-id></mixed-citation></ref><ref id="CR48"><label>48.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Carleton</surname><given-names>KL</given-names></name><etal/></person-group><article-title xml:lang="en">Movement of transposable elements contributes to cichlid diversity</article-title><source>Mol. Ecol.</source><year>2020</year><volume>29</volume><fpage>4956</fpage><lpage>4969</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BB3MXotlCmtQ%3D%3D</pub-id><pub-id pub-id-type="pmid">33049090</pub-id><pub-id pub-id-type="doi">10.1111/mec.15685</pub-id><pub-id pub-id-type="pmcid">33049090</pub-id></mixed-citation></ref><ref id="CR49"><label>49.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lev Maor</surname><given-names>G</given-names></name><name><surname>Yearim</surname><given-names>A</given-names></name><name><surname>Ast</surname><given-names>G</given-names></name></person-group><article-title xml:lang="en">The alternative role of DNA methylation in splicing regulation</article-title><source>Trends Genet.</source><year>2015</year><volume>31</volume><fpage>274</fpage><lpage>280</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2MXltFWiu7o%3D</pub-id><pub-id pub-id-type="pmid">25837375</pub-id><pub-id pub-id-type="doi">10.1016/j.tig.2015.03.002</pub-id><pub-id pub-id-type="pmcid">25837375</pub-id></mixed-citation></ref><ref id="CR50"><label>50.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hayhurst</surname><given-names>GP</given-names></name><name><surname>Lee</surname><given-names>Y-H</given-names></name><name><surname>Lambert</surname><given-names>G</given-names></name><name><surname>Ward</surname><given-names>JM</given-names></name><name><surname>Gonzalez</surname><given-names>FJ</given-names></name></person-group><article-title xml:lang="en">Hepatocyte nuclear factor 4α (nuclear receptor 2A1) is essential for maintenance of hepatic gene expression and lipid homeostasis</article-title><source>Mol. Cell. Biol.</source><year>2001</year><volume>21</volume><fpage>1393</fpage><lpage>1403</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BD3MXovVCmuw%3D%3D</pub-id><pub-id pub-id-type="pmid">11158324</pub-id><pub-id pub-id-type="pmcid">99591</pub-id><pub-id pub-id-type="doi">10.1128/MCB.21.4.1393-1403.2001</pub-id></mixed-citation></ref><ref id="CR51"><label>51.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Albertsson</surname><given-names>E</given-names></name><name><surname>Rad</surname><given-names>A</given-names></name><name><surname>Sturve</surname><given-names>J</given-names></name><name><surname>Larsson</surname><given-names>DGJ</given-names></name><name><surname>Förlin</surname><given-names>L</given-names></name></person-group><article-title xml:lang="en">Carbonyl reductase mRNA abundance and enzymatic activity as potential biomarkers of oxidative stress in marine fish</article-title><source>Mar. Environ. Res.</source><year>2012</year><volume>80</volume><fpage>56</fpage><lpage>61</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC38Xht1KjsLvP</pub-id><pub-id pub-id-type="pmid">22819450</pub-id><pub-id pub-id-type="doi">10.1016/j.marenvres.2012.07.001</pub-id></mixed-citation></ref><ref id="CR52"><label>52.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Revelo</surname><given-names>XS</given-names></name><etal/></person-group><article-title xml:lang="en">Perforin is a novel immune regulator of obesity-related insulin resistance</article-title><source>Diabetes</source><year>2015</year><volume>64</volume><fpage>90</fpage><lpage>103</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2MXktVOlsw%3D%3D</pub-id><pub-id pub-id-type="pmid">25048196</pub-id><pub-id pub-id-type="doi">10.2337/db13-1524</pub-id></mixed-citation></ref><ref id="CR53"><label>53.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>CS</given-names></name><name><surname>Friedman</surname><given-names>JR</given-names></name><name><surname>Fulmer</surname><given-names>JT</given-names></name><name><surname>Kaestner</surname><given-names>KH</given-names></name></person-group><article-title xml:lang="en">The initiation of liver development is dependent on Foxa transcription factors</article-title><source>Nature</source><year>2005</year><volume>435</volume><fpage>944</fpage><lpage>947</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BD2MXltFeltb8%3D</pub-id><pub-id pub-id-type="pmid">15959514</pub-id><pub-id pub-id-type="doi">10.1038/nature03649</pub-id><pub-id pub-id-type="bibcode">2005Natur.435..944L</pub-id></mixed-citation></ref><ref id="CR54"><label>54.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bassett</surname><given-names>EA</given-names></name><name><surname>Wallace</surname><given-names>VA</given-names></name></person-group><article-title xml:lang="en">Cell fate determination in the vertebrate retina</article-title><source>Trends Neurosci.</source><year>2012</year><volume>35</volume><fpage>565</fpage><lpage>573</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC38XoslKitr0%3D</pub-id><pub-id pub-id-type="pmid">22704732</pub-id><pub-id pub-id-type="doi">10.1016/j.tins.2012.05.004</pub-id></mixed-citation></ref><ref id="CR55"><label>55.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hahn</surname><given-names>C</given-names></name><name><surname>Genner</surname><given-names>MJ</given-names></name><name><surname>Turner</surname><given-names>GF</given-names></name><name><surname>Joyce</surname><given-names>DA</given-names></name></person-group><article-title xml:lang="en">The genomic basis of cichlid fish adaptation within the deepwater “twilight zone” of Lake Malawi</article-title><source>Evol. Lett.</source><year>2017</year><volume>1</volume><fpage>184</fpage><lpage>198</lpage><pub-id pub-id-type="pmid">30283648</pub-id><pub-id pub-id-type="pmcid">6124600</pub-id><pub-id pub-id-type="doi">10.1002/evl3.20</pub-id></mixed-citation></ref><ref id="CR56"><label>56.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Reinhard</surname><given-names>E</given-names></name><name><surname>Nedivi</surname><given-names>E</given-names></name><name><surname>Wegner</surname><given-names>J</given-names></name><name><surname>Skene</surname><given-names>JHP</given-names></name><name><surname>Westerfield</surname><given-names>M</given-names></name></person-group><article-title xml:lang="en">Neural selective activation and temporal regulation of a mammalian GAP-43 promoter in zebrafish</article-title><source>Development</source><year>1994</year><volume>120</volume><fpage>1767</fpage><lpage>1775</lpage><pub-id pub-id-type="coi">1:CAS:528:DyaK2MXivVWmtQ%3D%3D</pub-id><pub-id pub-id-type="pmid">7924984</pub-id><pub-id pub-id-type="doi">10.1242/dev.120.7.1767</pub-id></mixed-citation></ref><ref id="CR57"><label>57.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cheung</surname><given-names>A</given-names></name><name><surname>Trevers</surname><given-names>KE</given-names></name><name><surname>Reyes-Corral</surname><given-names>M</given-names></name><name><surname>Antinucci</surname><given-names>P</given-names></name><name><surname>Hindges</surname><given-names>R</given-names></name></person-group><article-title xml:lang="en">Expression and roles of teneurins in zebrafish</article-title><source>Front. Neurosci.</source><year>2019</year><volume>13</volume><fpage>1</fpage><lpage>13</lpage></mixed-citation></ref><ref id="CR58"><label>58.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nadeau</surname><given-names>NJ</given-names></name><etal/></person-group><article-title xml:lang="en">The gene cortex controls mimicry and crypsis in butterflies and moths</article-title><source>Nature</source><year>2016</year><volume>534</volume><fpage>106</fpage><lpage>110</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC28XptV2jurY%3D</pub-id><pub-id pub-id-type="pmid">27251285</pub-id><pub-id pub-id-type="pmcid">5094491</pub-id><pub-id pub-id-type="doi">10.1038/nature17961</pub-id><pub-id pub-id-type="bibcode">2016Natur.534..106N</pub-id></mixed-citation></ref><ref id="CR59"><label>59.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Marques</surname><given-names>DA</given-names></name><name><surname>Meier</surname><given-names>JI</given-names></name><name><surname>Seehausen</surname><given-names>O</given-names></name></person-group><article-title xml:lang="en">A combinatorial view on speciation and adaptive radiation</article-title><source>Trends Ecol. Evol.</source><year>2019</year><volume>34</volume><fpage>531</fpage><lpage>544</lpage><pub-id pub-id-type="pmid">30885412</pub-id><pub-id pub-id-type="doi">10.1016/j.tree.2019.02.008</pub-id></mixed-citation></ref><ref id="CR60"><label>60.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Colot</surname><given-names>V</given-names></name><name><surname>Rossignol</surname><given-names>J-L</given-names></name></person-group><article-title xml:lang="en">Eukaryotic DNA methylation as an evolutionary device</article-title><source>BioEssays</source><year>1999</year><volume>21</volume><fpage>402</fpage><lpage>411</lpage><pub-id pub-id-type="coi">1:STN:280:DyaK1MzgsVaquw%3D%3D</pub-id><pub-id pub-id-type="pmid">10376011</pub-id><pub-id pub-id-type="doi">10.1002/(SICI)1521-1878(199905)21:5&lt;402::AID-BIES7&gt;3.0.CO;2-B</pub-id></mixed-citation></ref><ref id="CR61"><label>61.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Svardal</surname><given-names>H</given-names></name><etal/></person-group><article-title xml:lang="en">Ancestral hybridization facilitated species diversification in the Lake Malawi Cichlid fish adaptive radiation</article-title><source>Mol. Biol. Evol.</source><year>2020</year><volume>37</volume><fpage>1100</fpage><lpage>1113</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BB3MXht12htL3K</pub-id><pub-id pub-id-type="pmid">31821500</pub-id><pub-id pub-id-type="doi">10.1093/molbev/msz294</pub-id></mixed-citation></ref><ref id="CR62"><label>62.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Heckwolf</surname><given-names>MJ</given-names></name><etal/></person-group><article-title xml:lang="en">Two different epigenetic information channels in wild three-spined sticklebacks are involved in salinity adaptation</article-title><source>Sci. Adv.</source><year>2020</year><volume>6</volume><fpage>eaaz1138</fpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BB3cXitFGntr7N</pub-id><pub-id pub-id-type="pmid">32219167</pub-id><pub-id pub-id-type="pmcid">7083608</pub-id><pub-id pub-id-type="doi">10.1126/sciadv.aaz1138</pub-id><pub-id pub-id-type="bibcode">2020SciA....6.1138H</pub-id></mixed-citation></ref><ref id="CR63"><label>63.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname><given-names>J</given-names></name><etal/></person-group><article-title xml:lang="en">Heritability of DNA methylation in threespine stickleback (Gasterosteus aculeatus)</article-title><source>Genetics</source><year>2021</year><volume>217</volume><fpage>1</fpage><lpage>15</lpage><pub-id pub-id-type="pmid">33683369</pub-id><pub-id pub-id-type="doi">10.1093/genetics/iyab001</pub-id></mixed-citation></ref><ref id="CR64"><label>64.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>X</given-names></name><name><surname>Bhandari</surname><given-names>RK</given-names></name></person-group><article-title xml:lang="en">DNA methylation dynamics during epigenetic reprogramming of medaka embryo</article-title><source>Epigenetics</source><year>2019</year><volume>14</volume><fpage>611</fpage><lpage>622</lpage><pub-id pub-id-type="pmid">31010368</pub-id><pub-id pub-id-type="pmcid">6557613</pub-id><pub-id pub-id-type="doi">10.1080/15592294.2019.1605816</pub-id></mixed-citation></ref><ref id="CR65"><label>65.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Potok</surname><given-names>ME</given-names></name><name><surname>Nix</surname><given-names>DA</given-names></name><name><surname>Parnell</surname><given-names>TJ</given-names></name><name><surname>Cairns</surname><given-names>BR</given-names></name></person-group><article-title xml:lang="en">Reprogramming the maternal zebrafish genome after fertilization to match the paternal methylation pattern</article-title><source>Cell</source><year>2013</year><volume>153</volume><fpage>759</fpage><lpage>772</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC3sXnsFWjs7Y%3D</pub-id><pub-id pub-id-type="pmid">23663776</pub-id><pub-id pub-id-type="pmcid">4030421</pub-id><pub-id pub-id-type="doi">10.1016/j.cell.2013.04.030</pub-id></mixed-citation></ref><ref id="CR66"><label>66.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>HJ</given-names></name><name><surname>Hore</surname><given-names>TA</given-names></name><name><surname>Reik</surname><given-names>W</given-names></name></person-group><article-title xml:lang="en">Reprogramming the methylome: erasing memory and creating diversity</article-title><source>Cell Stem Cell</source><year>2014</year><volume>14</volume><fpage>710</fpage><lpage>719</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2cXpvFSktL8%3D</pub-id><pub-id pub-id-type="pmid">24905162</pub-id><pub-id pub-id-type="pmcid">4051243</pub-id><pub-id pub-id-type="doi">10.1016/j.stem.2014.05.008</pub-id></mixed-citation></ref><ref id="CR67"><label>67.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Thurman</surname><given-names>RE</given-names></name><etal/></person-group><article-title xml:lang="en">The accessible chromatin landscape of the human genome</article-title><source>Nature</source><year>2012</year><volume>489</volume><fpage>75</fpage><lpage>82</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC38XhtlGns7bL</pub-id><pub-id pub-id-type="pmid">22955617</pub-id><pub-id pub-id-type="pmcid">3721348</pub-id><pub-id pub-id-type="doi">10.1038/nature11232</pub-id><pub-id pub-id-type="bibcode">2012Natur.489...75T</pub-id></mixed-citation></ref><ref id="CR68"><label>68.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bogdanović</surname><given-names>O</given-names></name><name><surname>Veenstra</surname><given-names>GJC</given-names></name></person-group><article-title xml:lang="en">DNA methylation and methyl-CpG binding proteins: developmental requirements and function</article-title><source>Chromosoma</source><year>2009</year><volume>118</volume><fpage>549</fpage><lpage>565</lpage><pub-id pub-id-type="pmid">19506892</pub-id><pub-id pub-id-type="pmcid">2729420</pub-id><pub-id pub-id-type="doi">10.1007/s00412-009-0221-9</pub-id><pub-id pub-id-type="coi">1:CAS:528:DC%2BD1MXhtVarurfK</pub-id></mixed-citation></ref><ref id="CR69"><label>69.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Houwing</surname><given-names>S</given-names></name><etal/></person-group><article-title xml:lang="en">A role for piwi and piRNAs in germ cell maintenance and transposon silencing in Zebrafish</article-title><source>Cell</source><year>2007</year><volume>129</volume><fpage>69</fpage><lpage>82</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BD2sXkvVeltL0%3D</pub-id><pub-id pub-id-type="pmid">17418787</pub-id><pub-id pub-id-type="doi">10.1016/j.cell.2007.03.026</pub-id></mixed-citation></ref><ref id="CR70"><label>70.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cosby</surname><given-names>RL</given-names></name><name><surname>Chang</surname><given-names>N-C</given-names></name><name><surname>Feschotte</surname><given-names>C</given-names></name></person-group><article-title xml:lang="en">Host–transposon interactions: conflict, cooperation, and cooption</article-title><source>Genes Dev.</source><year>2019</year><volume>33</volume><fpage>1098</fpage><lpage>1116</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC1MXhvVahsrrJ</pub-id><pub-id pub-id-type="pmid">31481535</pub-id><pub-id pub-id-type="pmcid">6719617</pub-id><pub-id pub-id-type="doi">10.1101/gad.327312.119</pub-id></mixed-citation></ref><ref id="CR71"><label>71.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dubin</surname><given-names>MJ</given-names></name><etal/></person-group><article-title xml:lang="en">DNA methylation in Arabidopsis has a genetic basis and shows evidence of local adaptation</article-title><source>Elife</source><year>2015</year><volume>4</volume><fpage>e05255</fpage><pub-id pub-id-type="pmid">25939354</pub-id><pub-id pub-id-type="pmcid">4413256</pub-id><pub-id pub-id-type="doi">10.7554/eLife.05255</pub-id></mixed-citation></ref><ref id="CR72"><label>72.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>McGee</surname><given-names>MD</given-names></name><etal/></person-group><article-title xml:lang="en">The ecological and genomic basis of explosive adaptive radiation</article-title><source>Nature</source><year>2020</year><volume>586</volume><fpage>75</fpage><lpage>79</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BB3cXhs12jt7bM</pub-id><pub-id pub-id-type="pmid">32848251</pub-id><pub-id pub-id-type="doi">10.1038/s41586-020-2652-7</pub-id><pub-id pub-id-type="bibcode">2020Natur.586...75M</pub-id></mixed-citation></ref><ref id="CR73"><label>73.</label><mixed-citation publication-type="other">Harris, R. S. <italic>Improved Pairwise Alignment of Genomic DNA</italic> (The Pennsylvania State University, 2007).</mixed-citation></ref><ref id="CR74"><label>74.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Krueger</surname><given-names>F</given-names></name><name><surname>Andrews</surname><given-names>SR</given-names></name></person-group><article-title xml:lang="en">Bismark: a flexible aligner and methylation caller for Bisulfite-Seq applications</article-title><source>Bioinformatics</source><year>2011</year><volume>27</volume><fpage>1571</fpage><lpage>1572</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC3MXmvVWqurw%3D</pub-id><pub-id pub-id-type="pmid">21493656</pub-id><pub-id pub-id-type="pmcid">3102221</pub-id><pub-id pub-id-type="doi">10.1093/bioinformatics/btr167</pub-id></mixed-citation></ref><ref id="CR75"><label>75.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>H</given-names></name><etal/></person-group><article-title xml:lang="en">Detection of differentially methylated regions from whole-genome bisulfite sequencing data without replicates</article-title><source>Nucleic Acids Res.</source><year>2015</year><volume>43</volume><fpage>gkv715</fpage><pub-id pub-id-type="doi">10.1093/nar/gkv715</pub-id><pub-id pub-id-type="coi">1:CAS:528:DC%2BC28Xjt1Gru74%3D</pub-id></mixed-citation></ref><ref id="CR76"><label>76.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>H</given-names></name><name><surname>Caffo</surname><given-names>B</given-names></name><name><surname>Jaffee</surname><given-names>HA</given-names></name><name><surname>Irizarry</surname><given-names>RA</given-names></name><name><surname>Feinberg</surname><given-names>AP</given-names></name></person-group><article-title xml:lang="en">Redefining CpG islands using hidden Markov models</article-title><source>Biostatistics</source><year>2010</year><volume>11</volume><fpage>499</fpage><lpage>514</lpage><pub-id pub-id-type="pmid">20212320</pub-id><pub-id pub-id-type="pmcid">2883304</pub-id><pub-id pub-id-type="zbl">1437.62659</pub-id><pub-id pub-id-type="doi">10.1093/biostatistics/kxq005</pub-id></mixed-citation></ref><ref id="CR77"><label>77.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bray</surname><given-names>NL</given-names></name><name><surname>Pimentel</surname><given-names>H</given-names></name><name><surname>Melsted</surname><given-names>P</given-names></name><name><surname>Pachter</surname><given-names>L</given-names></name></person-group><article-title xml:lang="en">Near-optimal probabilistic RNA-seq quantification</article-title><source>Nat. Biotechnol.</source><year>2016</year><volume>34</volume><fpage>525</fpage><lpage>527</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC28XlsVansL8%3D</pub-id><pub-id pub-id-type="pmid">27043002</pub-id><pub-id pub-id-type="doi">10.1038/nbt.3519</pub-id></mixed-citation></ref><ref id="CR78"><label>78.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pimentel</surname><given-names>H</given-names></name><name><surname>Bray</surname><given-names>NL</given-names></name><name><surname>Puente</surname><given-names>S</given-names></name><name><surname>Melsted</surname><given-names>P</given-names></name><name><surname>Pachter</surname><given-names>L</given-names></name></person-group><article-title xml:lang="en">Differential analysis of RNA-seq incorporating quantification uncertainty</article-title><source>Nat. Methods</source><year>2017</year><volume>14</volume><fpage>687</fpage><lpage>690</lpage><pub-id pub-id-type="coi">1:CAS:528:DC%2BC2sXpt1OmtLk%3D</pub-id><pub-id pub-id-type="pmid">28581496</pub-id><pub-id pub-id-type="doi">10.1038/nmeth.4324</pub-id></mixed-citation></ref></ref-list></ref-list><app-group><app id="App1"><sec id="Sec25"><title>Supplementary information</title><p id="Par52"><supplementary-material content-type="local-data" id="MOESM1" xlink:title="Supplementary information"><media xlink:href="MediaObjects/41467_2021_26166_MOESM1_ESM.pdf" mimetype="application" mime-subtype="pdf"><caption xml:lang="en"><p>Supplementary Information</p></caption></media></supplementary-material><supplementary-material content-type="local-data" id="MOESM2" xlink:title="Supplementary information"><media xlink:href="MediaObjects/41467_2021_26166_MOESM2_ESM.pdf" mimetype="application" mime-subtype="pdf"><caption xml:lang="en"><p>Peer Review File</p></caption></media></supplementary-material><supplementary-material content-type="local-data" id="MOESM3" xlink:title="Supplementary information"><media xlink:href="MediaObjects/41467_2021_26166_MOESM3_ESM.pdf" mimetype="application" mime-subtype="pdf"><caption xml:lang="en"><p>Description of Additional Supplementary File</p></caption></media></supplementary-material><supplementary-material content-type="local-data" id="MOESM4" xlink:title="Supplementary information"><media xlink:href="MediaObjects/41467_2021_26166_MOESM4_ESM.xlsx" mimetype="application" mime-subtype="vnd.ms-excel"><caption xml:lang="en"><p>Supplementary Data 1</p></caption></media></supplementary-material><supplementary-material content-type="local-data" id="MOESM5" xlink:title="Supplementary information"><media xlink:href="MediaObjects/41467_2021_26166_MOESM5_ESM.pdf" mimetype="application" mime-subtype="pdf"><caption xml:lang="en"><p>Reporting Summary</p></caption></media></supplementary-material></p></sec></app></app-group><notes notes-type="ESMHint"><title>Supplementary information</title><p>The online version contains supplementary material available at <ext-link xlink:href="https://doi.org/10.1038/s41467-021-26166-2" ext-link-type="doi">https://doi.org/10.1038/s41467-021-26166-2</ext-link>.</p></notes><notes notes-type="Misc"><p><bold>Peer review information</bold><italic>Nature Communications</italic> thanks the anonymous reviewers for their contribution to the peer review of this work. Peer reviewer reports are available.</p></notes><notes notes-type="Misc"><p><bold>Publisher’s note</bold> Springer Nature remains neutral with regard to jurisdictional claims in published maps and institutional affiliations.</p></notes></back></article>