<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing with OASIS Tables v3.0 20080202//EN" "https://jats.nlm.nih.gov/nlm-dtd/publishing/3.0/journalpub-oasis3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:oasis="http://docs.oasis-open.org/ns/oasis-exchange/table" xml:lang="en" dtd-version="3.0" article-type="data-paper">
  <front>
    <journal-meta><journal-id journal-id-type="publisher">ESSD</journal-id><journal-title-group>
    <journal-title>Earth System Science Data</journal-title>
    <abbrev-journal-title abbrev-type="publisher">ESSD</abbrev-journal-title><abbrev-journal-title abbrev-type="nlm-ta">Earth Syst. Sci. Data</abbrev-journal-title>
  </journal-title-group><issn pub-type="epub">1866-3516</issn><publisher>
    <publisher-name>Copernicus Publications</publisher-name>
    <publisher-loc>Göttingen, Germany</publisher-loc>
  </publisher></journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.5194/essd-17-5165-2025</article-id><title-group><article-title>A database of glacier prokaryotic genomes  and genes for the Three Poles</article-title><alt-title>A database of glacier prokaryotic genomes and genes for the Three Poles</alt-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" corresp="yes" rid="aff1 aff2 aff3">
          <name><surname>Liu</surname><given-names>Yongqin</given-names></name>
          <email>yql@lzu.edu.cn</email>
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3 aff4">
          <name><surname>Hu</surname><given-names>Songnian</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1 aff3 aff4">
          <name><surname>Yu</surname><given-names>Tao</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff3 aff4">
          <name><surname>Luo</surname><given-names>Yingfeng</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2 aff3">
          <name><surname>Zhang</surname><given-names>Zhihao</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2 aff3">
          <name><surname>Chen</surname><given-names>Yuying</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4 aff5 aff6">
          <name><surname>Guo</surname><given-names>Shunchao</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4 aff5 aff6">
          <name><surname>Sun</surname><given-names>Qinglan</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4 aff5 aff6">
          <name><surname>Fan</surname><given-names>Guomei</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4 aff5 aff6">
          <name><surname>Wu</surname><given-names>Linhuan</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff4 aff5 aff6">
          <name><surname>Ma</surname><given-names>Juncai</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff2">
          <name><surname>Liu</surname><given-names>Keshao</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Liu</surname><given-names>Pengfei</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Liu</surname><given-names>Junzhi</given-names></name>
          
        <ext-link>https://orcid.org/0000-0002-7354-4207</ext-link></contrib>
        <contrib contrib-type="author" corresp="no" rid="aff1">
          <name><surname>Dong</surname><given-names>Ruyi</given-names></name>
          
        </contrib>
        <contrib contrib-type="author" corresp="yes" rid="aff1">
          <name><surname>Ji</surname><given-names>Mukan</given-names></name>
          <email>jimk@lzu.edu.cn</email>
        <ext-link>https://orcid.org/0000-0001-8139-2875</ext-link></contrib>
        <aff id="aff1"><label>1</label><institution>Center for Pan-third Pole Environment, Lanzhou University, Lanzhou, China</institution>
        </aff>
        <aff id="aff2"><label>2</label><institution>State Key Laboratory of Tibetan Plateau Earth System, Resources and Environment (TPESRE),  Institute of Tibetan Plateau Research, Chinese Academy of Sciences, Beijing, China</institution>
        </aff>
        <aff id="aff3"><label>3</label><institution>College of Earth and Planetary Sciences, University of Chinese Academy of Sciences, Beijing, China</institution>
        </aff>
        <aff id="aff4"><label>4</label><institution>State Key Laboratory of Microbial Resources, Institute of Microbiology,  Chinese Academy of Sciences, Beijing, China</institution>
        </aff>
        <aff id="aff5"><label>5</label><institution>Microbial Resource and Big Data Center, Institute of Microbiology,  Chinese Academy of Sciences, Beijing, China</institution>
        </aff>
        <aff id="aff6"><label>6</label><institution>Chinese National Microbiology Data Center (NMDC), Beijing, China</institution>
        </aff>
      </contrib-group>
      <author-notes><corresp id="corr1">Yongqin Liu (yql@lzu.edu.cn) and Mukan Ji (jimk@lzu.edu.cn)</corresp></author-notes><pub-date><day>7</day><month>October</month><year>2025</year></pub-date>
      
      <volume>17</volume>
      <issue>10</issue>
      <fpage>5165</fpage><lpage>5179</lpage>
      <history>
        <date date-type="received"><day>27</day><month>September</month><year>2023</year></date>
           <date date-type="rev-request"><day>1</day><month>December</month><year>2023</year></date>
           <date date-type="rev-recd"><day>25</day><month>May</month><year>2025</year></date>
           <date date-type="accepted"><day>8</day><month>July</month><year>2025</year></date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2025 Yongqin Liu et al.</copyright-statement>
        <copyright-year>2025</copyright-year>
      <license license-type="open-access"><license-p>This work is licensed under the Creative Commons Attribution 4.0 International License. To view a copy of this licence, visit <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></license-p></license></permissions><self-uri xlink:href="https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025.html">This article is available from https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025.html</self-uri><self-uri xlink:href="https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025.pdf">The full text article is available as a PDF file from https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025.pdf</self-uri>
      <abstract><title>Abstract</title>

      <p id="d2e262">Glaciers cover 10 % of Earth's land area and are a pool of carbon and nitrogen for downstream ecosystems. Microbes, including bacteria, fungi, algae, and other microeukaryotes, are the primary inhabitants of glacier ecosystems and are key drivers of carbon and nitrogen transformation. Among them, prokaryotes (including bacteria and archaea) are the most diverse and abundant. Here, we present a dataset of supraglacial bacterial and archaeal (referred to as prokaryotic hereafter) communities across the Antarctic, Arctic, Tibetan Plateau, and other alpine regions. The dataset comprises 2039 amplicon sequencing data points, 999 cultured bacterial genomes, and 208 metagenomes, covering ice, snow, and cryoconite habitats. The dataset contains 64 510 prokaryotic amplicon sequencing phylotypes, with a higher diversity in the Tibetan glaciers than in the Antarctic and Arctic glaciers, which were respectively enriched with Gammaproteobacteria, Bacteroidota, and Alphaproteobacteria. The dataset also contains 62 595 715 unique genes and 4501 prokaryotic genomes, a 35.5 % expansion from previous publications. Genes were annotated for those associated with carbohydrate-active enzymes, nitrogen cycling, methane cycling, antimicrobial resistance, and microbial virulence, revealing the dynamic microbial functions in glacial habitats. This comprehensive dataset provides standardized prokaryotic diversity, taxonomy, community structure, and genetic functions of glacial microbiomes. The data can be leveraged to elucidate ecological principles governing the distribution of prokaryotes, to gain insights into the key functional genes for supraglacial microbiomes, to build mechanistic models, and to identify any potential biohazards for policymakers to make informed decisions regarding climate change. The dataset is available at the Global Glacier Genome and Gene Database (<uri>https://nmdc.cn/4gdb/</uri>, last access: 11 July 2025; DOI: <ext-link xlink:href="https://doi.org/10.11888/Cryos.tpdc.300830" ext-link-type="DOI">10.11888/Cryos.tpdc.300830</ext-link>, Liu et al., 2023).</p>
  </abstract>
    
<funding-group>
<award-group id="gs1">
<funding-source>National Natural Science Foundation of China</funding-source>
<award-id>42421001</award-id>
<award-id>42425607</award-id>
</award-group>
<award-group id="gs2">
<funding-source>Science and Technology Department of Gansu Province</funding-source>
<award-id>25RCKA021</award-id>
</award-group>
</funding-group>
</article-meta>
  </front>
<body>
      

<sec id="Ch1.S1" sec-type="intro">
  <label>1</label><title>Introduction</title>
      <p id="d2e280">Glaciers cover 10 % of Earth's land area (Cauvy-Fraunié and Dangles, 2019) and are mainly distributed in the Antarctic, Arctic, and Tibetan Plateau (the Three Poles) (Qiu, 2008). Glaciers store approximately three-quarters of Earth's fresh water (Boetius et al., 2015) and are also a pool of carbon and nitrogen. It has been estimated that 6 Pg of carbon is stored in global glaciers. These carbon may be released into downstream ecosystems with glacier runoff (Hood et al., 2015), influencing key elemental cycling in downstream ecosystems. Before carbons and nitrogen are released, they undergo extensive biological transformation (Guo et al., 2022), primarily microbially driven. Microbes, including bacteria, fungi, algae, and other microeukaryotes, are the main inhabitants of glacier ecosystems (Cauvy-Fraunié and Dangles, 2019), while bacteria are the most abundant and diverse. These microorganisms employ strategies to survive the glacial conditions, such as strong UV radiation, low temperature, and low-carbon and low-nitrogen nutrients (Ciccazzo et al., 2016). As microorganisms are the key driver of carbon and nitrogen transformation in glacier ecosystems, knowledge of their biogeography and functions can greatly enhance our understanding of the biogeochemical cycling in glacial ecosystems and aid in predicting the impact of climate change.</p>
      <p id="d2e283">The glacier as a habitat is not homogeneous and is divided into supraglacial, englacial, and subglacial ecosystems. Compared with other glacier-related habitats, the microorganisms in supraglacial ecosystems are the most active due to their exposure to the external environment and ambient temperature. Supraglacial ecosystems can be further separated into snow, ice, and cryoconite holes (cylindrical depressions formed by the preferential melting of dark debris into the surface, typically comprising surface water and cryoconite at the bottom) (Cook et al., 2016), each of which has a distinct microbial composition (Anesio and Laybourn-Parry, 2012). Algae and Cyanobacteria are the primary producers in supraglacial ecosystems, with other heterotrophic microorganisms participating in the transformation and degradation of endogenous and exogenous nutrients (Hotaling et al., 2017; Anesio et al., 2017). Active metabolism is reported in glacial ecosystems; for instance, cryoconite is a source of methane but a sink of carbon dioxide, with a rate of 4.60 and <inline-formula><mml:math id="M1" display="inline"><mml:mo>-</mml:mo></mml:math></inline-formula>1.77 <inline-formula><mml:math id="M2" display="inline"><mml:mrow class="unit"><mml:mi mathvariant="normal">µ</mml:mi></mml:mrow></mml:math></inline-formula>mol m<sup>−2</sup> d<sup>−1</sup>, respectively (Zhang et al., 2021). Furthermore, organisms with photosynthesis, nitrification, and denitrification functions are also widespread in glacier cryoconite (Cameron et al., 2012; Stibal et al., 2020).</p>
      <p id="d2e325">It was estimated that the mean microbial abundance in glacier surface meltwater is 10<sup>4</sup> cells mL<sup>−1</sup> (Stevens et al., 2022); this quantity may further increase with enhanced climate warming (Segawa et al., 2005). Some of these naturally occurring microorganisms are known as emerging contaminants, which are not commonly monitored in the environment but have the potential to enter the environment and cause known or suspected adverse ecological and/or human health effects (Taheran et al., 2018). A previous study cultivated hemolytic bacteria from Spitsbergen glacier meltwater with potential pathogenicity (Mogrovejo-Arias et al., 2020). Other emerging contaminants in glaciers, such as antibiotic resistance genes and microbial virulence factors, have also received increased attention (Mao et al., 2023).</p>
      <p id="d2e349">Here, we present a glacier dataset of glacial prokaryotes (bacteria and archaea) across the Antarctic, Arctic, Tibetan Plateau, and other alpine regions. This dataset includes amplicon sequencing data from 2039 samples, 999 cultured bacterial genomes, and shotgun metagenomic sequencing from 224 samples (Fig. 1). From an ecological perspective, this dataset with standardized prokaryotic diversity, taxonomy, and community structure can improve understanding of the ecological principles governing the distribution of microorganisms across glaciers, as well as their partitioning across the various habitats in the supraglacial ecosystem. From a geochemical cycling perspective, the database can provide insights into the key functional genes for supraglacial microbiomes, which can be used to better comprehend carbon and nitrogen cycling and allow the building of a model to anticipate glacial carbon and nitrogen dynamics in the future. The dataset archives glacially specific microorganisms and unique genes in digital form, thus representing an invaluable resource for bioprospecting. Additionally, the dataset can be employed to identify any potential biohazards (pathogens and emerging contaminants) of glaciers and evaluate the impact of glacier melting on downstream ecosystems from a biosafety perspective, thereby assisting policymakers in making informed decisions regarding climate change.</p>

      <fig id="F1" specific-use="star"><label>Figure 1</label><caption><p id="d2e355">The location of glacier samples across the Antarctic, Arctic, and Tibetan glaciers.</p></caption>
        <graphic xlink:href="https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025-f01.jpg"/>

      </fig>

</sec>
<sec id="Ch1.S2">
  <label>2</label><title>Materials and methods</title>
<sec id="Ch1.S2.SS1">
  <label>2.1</label><title>Data acquisition</title>
      <p id="d2e379"><italic>Amplicon data.</italic> Based on the keywords of “glacier” OR “snow” OR “ice” OR “cryoconite” with sample type being DNA and instrument of Illumina, we retrieved 225 378 Short Read Archives (SRAs) initially. Then the results were filtered manually to remove non-supra-glacier habitats (such as glacier forefield, subglacial sediment, proglacial lakes, ice cave), metagenome data, and primers that do not amplify the V4 region of the 16S rRNA gene (i.e., those that amplify V3V4, V4, and V4V5 were retained) (Tables S1 and S2 in the Supplement).</p>
      <p id="d2e384"><italic>Metagenome data.</italic> All articles containing the keyword “glacier metagenome” were retrieved using the Web of Science (searched on the 1 December 2022). Only studies with sequenced ice, snow, or cryoconite samples with raw sequence data uploaded on the NCBI (National Center for Biotechnology Information) Short Read Archive were kept. Additionally, a small amount of metagenome data without published articles were added from the Integrated Microbial Genomes &amp; Microbiomes (IMG/M) database and the National Microbiology Data Center (NMDC) database based on a keyword search of the terms “ice”, “snow”, and “cryoconite”. In addition to metagenomes from the Antarctic, Arctic, and Tibetan Plateau, metagenomes from the Andes and Alps were also downloaded (Table S3).</p>
      <p id="d2e389"><italic>Cultivated bacterial genome data.</italic> A total of 883 isolate genome data points of Tibetan Plateau glaciers were obtained from the TG2G dataset (Liu et al., 2022), and another 116 genomes of bacterial isolates from glaciers beyond the Tibetan Plateau were downloaded from the NCBI genome database based on a keyword search of the terms “Antarctic” and “Arctic”. After careful manual curation, only samples from ice, snow, and cryoconite habitats were kept (Table S4).</p>
</sec>
<sec id="Ch1.S2.SS2">
  <label>2.2</label><title>Amplicon sequencing data processing</title>
      <p id="d2e402">Sequencing data were processed using the USEARCH v11 pipeline (Edgar, 2010) on a sequencing project basis. For each NCBI sequencing project, the reads associated with the project were first merged and quality-screened with a maximum expected error threshold of 0.5, while single-end reads were directly quality-screened using the same threshold. The quality-filtered reads from each bioproject were aligned with the SILVA reference alignment (release 128) to ensure that the V4 hypervariable region is covered, using the align.seqs command in mothur. After removing any sequences that do not cover the V4 region (using screen.seqs in mothur), the remaining sequences were dereplicated. After this pre-processing was completed for all bioprojects, the dereplicated sequences of different bioprojects were combined and dereplicated again. Then, these further dereplicated sequences were clustered with 97 % identity, and chimeric sequences were identified and removed using the cluster_otus command in USEARCH. The representative sequences were used as the references for operational taxonomic unit (OTU) table construction. Additionally, the representative sequences were taxonomically classified using the Bayesian classifier against the Silva database (release 132) (Quast et al., 2012). Then, mitochondria, chloroplast, and eukaryotic sequences were removed from the OTU table. After removing samples with fewer than 5000 reads, the final OTU table comprises 2039 samples and 64 510 OTUs. The sequencing depth (number of reads) ranges from 5036 to 1 492 659 per sample. We retained two datasets, one without rarefaction (Table S5) and another being subsampled (rarefied) to 5036 reads (Table S6).</p>
      <p id="d2e405">We calculated the Shannon diversity, richness (number of phylotypes), evenness, and Good's coverage indices for both original and subsampled data using R. The alpha diversity indices (richness, evenness, and Shannon diversity) and the relative abundance of dominant taxonomic lineages were compared by region (Antarctic, Arctic, Tibetan Plateau, and other alpine regions) and habitat (snow, ice, and cryoconite) using Kruskal–Wallis one-way ANOVA, and multiple testing was performed based on Dunn's post hoc test using the Fisheries Stock Assessment (FSA) package in the R environment (Ogle et al., 2022). The community structure variations were visualized using a non-metric multidimensional scaling (NMDS) ordination plot based on the Hellinger-transformed Bray–Curtis distance matrix. Permutational analysis of variance (PERMANOVA) was used to test the significance of community differences in samples by region and habitat (Anderson, 2017) using the “vegan” package in R with 999 permutations. PERMDISP analysis was performed using the betadisper command in the vegan package. Core phylotypes were defined as occurring in more than 55 % of the samples with an average relative abundance <inline-formula><mml:math id="M7" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">0.1</mml:mn></mml:mrow></mml:math></inline-formula> % in each habitat–region pair (Delgado-Baquerizo et al., 2018). If a phylotype was identified as a core phylotype for all habitats of a region, then it was designated as the core phylotype for the region.</p>
</sec>
<sec id="Ch1.S2.SS3">
  <label>2.3</label><title>Metagenome data processing</title>
      <p id="d2e426">Metagenome data processing has been described previously (Liu et al., 2022). Briefly, it includes raw data quality-filtering, assembly, open reading frame prediction, and genome binning. Gene open reading frames (ORFs) for the metagenomic assemblies were predicted using Prodigal (Hyatt et al., 2010) and dereplicated by clustering in the 80 % aligned region with 95 % nucleotide identity using MMseqs2 (Steinegger and Söding, 2017) with the following parameters: easy-linclust -<inline-formula><mml:math id="M8" display="inline"><mml:mi>e</mml:mi></mml:math></inline-formula> 0.001, –min-seq-id 0.95, -<inline-formula><mml:math id="M9" display="inline"><mml:mi>c</mml:mi></mml:math></inline-formula> 0.80.</p>
      <p id="d2e443">Metagenomic assemblies were binned using MetaBAT 2 (v2.12.1) (Kang et al., 2019), MaxBin 2 (v2.2.7) (Wu et al., 2016), and VAMB (v2.0.1) (Nissen et al., 2021) separately. The resulting bins (or MAGs) were then refined using RefineM (v0.0.20) (Parks et al., 2017) by removing contigs with divergent guanine–cytosine (GC) content, coverage, or tetranucleotide signatures. Then only MAGs meeting the medium and higher quality of MIMAG (Bowers et al., 2017a) were retained (completeness <inline-formula><mml:math id="M10" display="inline"><mml:mrow><mml:mo>&gt;</mml:mo><mml:mn mathvariant="normal">50</mml:mn></mml:mrow></mml:math></inline-formula> %, contamination <inline-formula><mml:math id="M11" display="inline"><mml:mrow><mml:mo>&lt;</mml:mo><mml:mn mathvariant="normal">10</mml:mn></mml:mrow></mml:math></inline-formula> %). The obtained MAGs were combined with the cultured bacterial genomes, and these genomes were dereplicated using the thresholds of 10 % aligned fraction and a genome-wide average nucleotide identity (ANI) threshold of 95 %. They were then taxonomically annotated using the Genome Taxonomy Database Toolkit (GTDB-Tk, v2.4) (Chaumeil et al., 2019) against the GTDB release R220.</p>
</sec>
<sec id="Ch1.S2.SS4">
  <label>2.4</label><title>Gene function annotation</title>
      <p id="d2e474">The functions of the dereplicated genes were annotated using eggNOG-mapper (Huerta-Cepas et al., 2017) against the eggNOG orthologous groups (OGs) database (v5.0) (Huerta-Cepas et al., 2019). This includes the Kyoto Encyclopedia of Genes and Genomes (KEGG) functional orthologs (Kanehisa et al., 2017), the carbohydrate-active enzyme database (CAZy) (Levasseur et al., 2013), and the COG categories (Tatusov et al., 2003). Antibiotic resistance genes (ARGs) were annotated against the Comprehensive Antibiotic Resistance Database (CARD) (Jia et al., 2017) and Resistance Gene Identifier (RGI v3.1.4) (Alcock et al., 2020) with the loose model (–include_loose). Virulence factors were annotated by aligning gene sequences against the Virulence Factors Database (VFDB 2019) (Liu et al., 2019) with DIAMOND blastp (Buchfink et al., 2021) (<inline-formula><mml:math id="M12" display="inline"><mml:mi>e</mml:mi></mml:math></inline-formula>-value threshold of <inline-formula><mml:math id="M13" display="inline"><mml:mrow><mml:mn mathvariant="normal">1</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mn mathvariant="normal">10</mml:mn><mml:mrow><mml:mo>-</mml:mo><mml:mn mathvariant="normal">5</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></inline-formula>).</p>
</sec>
</sec>
<sec id="Ch1.S3">
  <label>3</label><title>Data availability</title>
      <p id="d2e511">The data introduced here are the first step in archiving global glacier microbial data. For this purpose, the data are deposited into the Global Glacier Genome and Gene Database (4GDB, <uri>https://nmdc.cn/4gdb/</uri>) and the National Tibetan Plateau Data Center (<ext-link xlink:href="https://doi.org/10.11888/Cryos.tpdc.300830" ext-link-type="DOI">10.11888/Cryos.tpdc.300830</ext-link>, Liu et al., 2023), which provides a comprehensive solution for glacier microbial studies, featuring an amplicon-sequencing phylotype table, representative sequences, taxonomic annotations, metagenomic raw sequences, assembled contigs, annotated gene sequences, sequences of metagenome-assembled genomes, and the growth characteristics of cultivated microorganisms, on a user-friendly website. The website is constructed under the OSI-approved CC BY 4.0 Open Source license (<uri>https://creativecommons.org/licenses/by/4.0/</uri>, last access: 11 July 2025), and all data can be accessed and reused freely, without any restrictions, for both academic and commercial purposes.</p>
      <p id="d2e523">The 4GDB website is structured into three main sections, comprising amplicon sequencing, metagenome/genome sequences, and function prediction. The user-friendly web interface allows data filtering based on sample type, sample location, habitat type, gene type, and taxonomy, enabling seamless download of the filtered results. In conclusion, 4GDB (<uri>https://nmdc.cn/4gdb/downloadtemp</uri>, last access: 11 July 2025) provides an open-access genome- and gene-oriented resource platform that is regularly updated to include newly published and in-house-generated sequence data.</p>
      <p id="d2e529">Tables S5 and S6 are deposited at <uri>https://figshare.com</uri> (last access: 11 July 2025; DOI: <ext-link xlink:href="https://doi.org/10.6084/m9.figshare.28423781.v2" ext-link-type="DOI">10.6084/m9.figshare.28423781.v2</ext-link>, Ji, 2025).</p>
</sec>
<sec id="Ch1.S4" sec-type="conclusions">
  <label>4</label><title>Results</title>
<sec id="Ch1.S4.SS1">
  <label>4.1</label><title>Amplicon-based dataset</title>
      <p id="d2e553">A total of 2039 glacier-related samples were retained after quality-filtering, comprising 1077 from cryoconite sediments, 601 from snow or ice, 216 from glacial melting water (including cryoconite hole meltwater and supraglacial melting water), 79 from ice core, 34 from snow during algal blooming (algal material), and 32 from subglacial basal ice (Table 1). Spatially, 29 % of all samples (<inline-formula><mml:math id="M14" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M15" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 574) were from the Antarctic, 28 % (<inline-formula><mml:math id="M16" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M17" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 574) from Arctic glaciers, 16 % (<inline-formula><mml:math id="M18" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M19" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 335) from the Tibetan Plateau (<inline-formula><mml:math id="M20" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M21" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 335), and 27 % from other alpine regions (<inline-formula><mml:math id="M22" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M23" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 545; the Alps, Kenya, Japan, and Montana Glacier National Park).</p>
      <p id="d2e627">The retained datasets originate from 66 bioprojects, 8 of which missed sequencing platform information and 2 of which missed primer information (Table S2). Most of these bioprojects do not have environmental metadata and are therefore not included in the dataset. A variety of primers were used by these projects, amplifying the hypervariable regions V3V4, V4, and V4V5. These data were harmonized by retaining only the V4 region (sequence trimming). Surprisingly, four bioprojects that used primers 783F and 1046R (V5V6 region) were also retained. We speculate that incorrect primers may have been provided in the NCBI.</p>

<table-wrap id="T1" specific-use="star"><label>Table 1</label><caption><p id="d2e633">Number of samples by habitat and region.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="8">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="right"/>
     <oasis:colspec colnum="3" colname="col3" align="right"/>
     <oasis:colspec colnum="4" colname="col4" align="right"/>
     <oasis:colspec colnum="5" colname="col5" align="right"/>
     <oasis:colspec colnum="6" colname="col6" align="right"/>
     <oasis:colspec colnum="7" colname="col7" align="right"/>
     <oasis:colspec colnum="8" colname="col8" align="right"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2">Snow</oasis:entry>
         <oasis:entry colname="col3">Ice</oasis:entry>
         <oasis:entry colname="col4">Cryoconite</oasis:entry>
         <oasis:entry colname="col5">Supraglacial</oasis:entry>
         <oasis:entry colname="col6">Ice</oasis:entry>
         <oasis:entry colname="col7">Algal</oasis:entry>
         <oasis:entry colname="col8">Basal</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5">meltwater</oasis:entry>
         <oasis:entry colname="col6">core</oasis:entry>
         <oasis:entry colname="col7">material</oasis:entry>
         <oasis:entry colname="col8">ice</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row>
         <oasis:entry colname="col1">Antarctic</oasis:entry>
         <oasis:entry colname="col2">119</oasis:entry>
         <oasis:entry colname="col3">58</oasis:entry>
         <oasis:entry colname="col4">335</oasis:entry>
         <oasis:entry colname="col5">59</oasis:entry>
         <oasis:entry colname="col6">0</oasis:entry>
         <oasis:entry colname="col7">1</oasis:entry>
         <oasis:entry colname="col8">13</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Arctic</oasis:entry>
         <oasis:entry colname="col2">107</oasis:entry>
         <oasis:entry colname="col3">74</oasis:entry>
         <oasis:entry colname="col4">286</oasis:entry>
         <oasis:entry colname="col5">59</oasis:entry>
         <oasis:entry colname="col6">6</oasis:entry>
         <oasis:entry colname="col7">23</oasis:entry>
         <oasis:entry colname="col8">19</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Tibetan Plateau</oasis:entry>
         <oasis:entry colname="col2">67</oasis:entry>
         <oasis:entry colname="col3">8</oasis:entry>
         <oasis:entry colname="col4">172</oasis:entry>
         <oasis:entry colname="col5">30</oasis:entry>
         <oasis:entry colname="col6">58</oasis:entry>
         <oasis:entry colname="col7">0</oasis:entry>
         <oasis:entry colname="col8">0</oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Other non-polar regions</oasis:entry>
         <oasis:entry colname="col2">89</oasis:entry>
         <oasis:entry colname="col3">79</oasis:entry>
         <oasis:entry colname="col4">284</oasis:entry>
         <oasis:entry colname="col5">68</oasis:entry>
         <oasis:entry colname="col6">15</oasis:entry>
         <oasis:entry colname="col7">10</oasis:entry>
         <oasis:entry colname="col8">0</oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table></table-wrap>

<sec id="Ch1.S4.SS1.SSS1">
  <label>4.1.1</label><title>Prokaryotic diversity</title>
      <p id="d2e835">Good's coverage index provides an estimation for the number of singletons in a sample, reflecting the coverage of the sequencing. The values of the index were 0.98 <inline-formula><mml:math id="M24" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 0.02 and 0.96 <inline-formula><mml:math id="M25" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 0.02 for the datasets without and with subsampling, respectively (Table S7). This indicates that the majority of the OTUs were identified. The amplicon sequencing dataset comprised 64 510 phylotypes. Due to the large variation in sequencing depth among samples, here we only presented patterns that are consistently observed in the original and subsampled OTU tables (Tables 2, 3, and S7). Across all habitats, the number of OTUs observed (prokaryotic richness) was significantly lower in other non-polar regions than those in the Three Poles (Antarctic, Arctic, and Tibetan Plateau). This pattern is also significantly observed for the alpha diversity indices, including the Chao1, ACE, and Gini Simpson, but not in the Shannon diversity. Specifically, the prokaryotic Shannon diversity of the Arctic glaciers was not significantly different from that of other non-polar glaciers. Across habitats (Table 3), supraglacial meltwater had the highest prokaryotic diversity compared with other habitats (except the ice core). The alpha diversity indices typically follow the order of supraglacial meltwater <inline-formula><mml:math id="M26" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> snow <inline-formula><mml:math id="M27" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> ice core <inline-formula><mml:math id="M28" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> ice <inline-formula><mml:math id="M29" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> cryoconite <inline-formula><mml:math id="M30" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> algae-influenced snow <inline-formula><mml:math id="M31" display="inline"><mml:mo>&gt;</mml:mo></mml:math></inline-formula> basal ice. This may reflect the strength of environmental filtering among the habitats.</p>
      <p id="d2e895">We further compared the alpha diversity indices of the same habitats across different regions (Table S8). Due to the bias in the number of samples across habitats, here we only compared the diversity indices in cryoconite, snow, ice, and supraglacial water. For cryoconites, their prokaryotic diversity (Shannon diversity and Gini Simpson indices) was the highest in the Antarctic, which was followed by the Arctic, Tibetan Plateau, and other non-polar glaciers. For snow, its prokaryotic diversity (Richness, Chao1, and ACE indices) was the highest in Tibetan glaciers, followed by Antarctic, Arctic, and other non-polar glaciers. For ice, the diversity indices were not significantly different across all regions, with only significantly higher values of diversity than in the Arctic and Tibetan Plateau being observed in the Antarctic. For supraglacial meltwater, other non-polar glaciers demonstrated the highest diversity (Shannon diversity and Gini Simpson diversity indices, all <inline-formula><mml:math id="M32" display="inline"><mml:mi>P</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M33" display="inline"><mml:mo>&lt;</mml:mo></mml:math></inline-formula> 0.05), while the Antarctic had the lowest values. In summary, the biogeographic pattern for prokaryotic diversity in the same habitat differed among regions.</p>
      <p id="d2e912">We further assessed the influence of the region amplified on the validity of the results. For each region–habitat pair, the alpha diversity indices were significantly different to a certain extent. However, those from Arctic basal ice, other non-polar glacier ice, and Tibetan Plateau supraglacial meltwater were less affected (Table S9). Nevertheless, the influence may be explained by the different sampling locations, which have distinct microbial compositions. We further tested the validity of the diversity comparison results using the data that were generated using the same primer set (Table S10). The influence of primer selection on prokaryotic diversity was inconsistent. For instance, primers targeting the V4 region resulted in a higher richness in supraglacial ice than primers targeting the V3V4 region in other alpine glaciers. In contrast, the primers targeting the V3V4 region resulted in a higher richness in the Antarctic and Arctic. Such inconsistency in microbial community assessment by different primers and platforms has been reported previously (Fredriksson et al., 2013; Tremblay et al., 2015). Thus, the homogenization method may not fully overcome the bias caused by primer selection. Nevertheless, we provided comprehensive information on the primer and regions amplified; thus users may choose to use the entire dataset or only those using the same primer for analysis.</p>

<table-wrap id="T2" specific-use="star"><label>Table 2</label><caption><p id="d2e919">Diversity metrics of the bacterial community in glacier microbiomes of global glaciers.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="5">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:colspec colnum="4" colname="col4" align="left"/>
     <oasis:colspec colnum="5" colname="col5" align="left"/>
     <oasis:thead>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Region</oasis:entry>
         <oasis:entry colname="col2">Antarctic</oasis:entry>
         <oasis:entry colname="col3">Arctic</oasis:entry>
         <oasis:entry colname="col4">Non-polar glacier</oasis:entry>
         <oasis:entry colname="col5">Tibetan Plateau</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry namest="col1" nameend="col2">Original dataset </oasis:entry>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Species observed</oasis:entry>
         <oasis:entry colname="col2">1025.1 <inline-formula><mml:math id="M36" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 722.5<sup>b</sup></oasis:entry>
         <oasis:entry colname="col3">981.4 <inline-formula><mml:math id="M38" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 784.4<sup>b</sup></oasis:entry>
         <oasis:entry colname="col4">868 <inline-formula><mml:math id="M40" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 676.3<sup>c</sup></oasis:entry>
         <oasis:entry colname="col5">1185 <inline-formula><mml:math id="M42" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 825.9<sup>a</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Chao1</oasis:entry>
         <oasis:entry colname="col2">1400 <inline-formula><mml:math id="M44" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 912.5<sup>b</sup></oasis:entry>
         <oasis:entry colname="col3">1492.4 <inline-formula><mml:math id="M46" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1308.7<sup>b</sup></oasis:entry>
         <oasis:entry colname="col4">1223.2 <inline-formula><mml:math id="M48" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 941.8<sup>c</sup></oasis:entry>
         <oasis:entry colname="col5">1768.2 <inline-formula><mml:math id="M50" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1279.3<sup>a</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">ACE</oasis:entry>
         <oasis:entry colname="col2">1422.5 <inline-formula><mml:math id="M52" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 948.1<sup>b</sup></oasis:entry>
         <oasis:entry colname="col3">1526.9 <inline-formula><mml:math id="M54" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1340.8<sup>ab</sup></oasis:entry>
         <oasis:entry colname="col4">1232.3 <inline-formula><mml:math id="M56" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 959.5<sup>c</sup></oasis:entry>
         <oasis:entry colname="col5">1767.5 <inline-formula><mml:math id="M58" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1295.4<sup>a</sup></oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Shannon diversity</oasis:entry>
         <oasis:entry colname="col2">4.3 <inline-formula><mml:math id="M60" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.03<sup>a</sup></oasis:entry>
         <oasis:entry colname="col3">3.97 <inline-formula><mml:math id="M62" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.05<sup>b</sup></oasis:entry>
         <oasis:entry colname="col4">4.17 <inline-formula><mml:math id="M64" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.19<sup>b</sup></oasis:entry>
         <oasis:entry colname="col5">4.2 <inline-formula><mml:math id="M66" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.3<sup>a</sup></oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry namest="col1" nameend="col2">Subsampled dataset </oasis:entry>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Species observed</oasis:entry>
         <oasis:entry colname="col2">475.7 <inline-formula><mml:math id="M68" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 232<sup>a</sup></oasis:entry>
         <oasis:entry colname="col3">467.9 <inline-formula><mml:math id="M70" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 275.9<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">468.1 <inline-formula><mml:math id="M72" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 384.2<sup>b</sup></oasis:entry>
         <oasis:entry colname="col5">507.1 <inline-formula><mml:math id="M74" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 317.3<sup>a</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Chao1</oasis:entry>
         <oasis:entry colname="col2">809.6 <inline-formula><mml:math id="M76" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 458.3<sup>a</sup></oasis:entry>
         <oasis:entry colname="col3">847.9 <inline-formula><mml:math id="M78" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 575.3<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">777.5 <inline-formula><mml:math id="M80" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 679.4<sup>b</sup></oasis:entry>
         <oasis:entry colname="col5">884.4 <inline-formula><mml:math id="M82" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 622<sup>a</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">ACE</oasis:entry>
         <oasis:entry colname="col2">825.7 <inline-formula><mml:math id="M84" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 482.6<sup>b</sup></oasis:entry>
         <oasis:entry colname="col3">881.6 <inline-formula><mml:math id="M86" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 619.9<sup>ab</sup></oasis:entry>
         <oasis:entry colname="col4">796.6 <inline-formula><mml:math id="M88" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 715.3<sup>c</sup></oasis:entry>
         <oasis:entry colname="col5">903.4 <inline-formula><mml:math id="M90" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 651.8<sup>a</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Shannon diversity</oasis:entry>
         <oasis:entry colname="col2">4.23 <inline-formula><mml:math id="M92" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1<sup>a</sup></oasis:entry>
         <oasis:entry colname="col3">3.9 <inline-formula><mml:math id="M94" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.02<sup>b</sup></oasis:entry>
         <oasis:entry colname="col4">4.1 <inline-formula><mml:math id="M96" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.16<sup>b</sup></oasis:entry>
         <oasis:entry colname="col5">4.11 <inline-formula><mml:math id="M98" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.25<sup>a</sup></oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table><table-wrap-foot><p id="d2e922">Statistical test is based on Kruskal–Wallis one-way ANOVA; multiple testing is performed based on Dunn's post hoc test. Different superscript letters within each row indicate significant pairwise differences between regions at <inline-formula><mml:math id="M34" display="inline"><mml:mi>P</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M35" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 0.05, based on Kruskal–Wallis one-way ANOVA followed by Dunn's post hoc test (with Bonferroni correction). Values sharing the same letter are not significantly different.</p></table-wrap-foot></table-wrap>

<table-wrap id="T3" specific-use="star"><label>Table 3</label><caption><p id="d2e1631">Diversity metrics of the bacterial community in glacier microbiomes of different habitats.</p></caption><oasis:table frame="topbot"><oasis:tgroup cols="8">
     <oasis:colspec colnum="1" colname="col1" align="left"/>
     <oasis:colspec colnum="2" colname="col2" align="left"/>
     <oasis:colspec colnum="3" colname="col3" align="left"/>
     <oasis:colspec colnum="4" colname="col4" align="left"/>
     <oasis:colspec colnum="5" colname="col5" align="left"/>
     <oasis:colspec colnum="6" colname="col6" align="left"/>
     <oasis:colspec colnum="7" colname="col7" align="left"/>
     <oasis:colspec colnum="8" colname="col8" align="left"/>
     <oasis:thead>
       <oasis:row>
         <oasis:entry colname="col1">Habitats</oasis:entry>
         <oasis:entry colname="col2">Algal material</oasis:entry>
         <oasis:entry colname="col3">Basal ice</oasis:entry>
         <oasis:entry colname="col4">Cryoconite</oasis:entry>
         <oasis:entry colname="col5">Supraglacial ice</oasis:entry>
         <oasis:entry colname="col6">Ice core</oasis:entry>
         <oasis:entry colname="col7">Snow</oasis:entry>
         <oasis:entry colname="col8">Supraglacial</oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1"/>
         <oasis:entry colname="col2"/>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
         <oasis:entry colname="col6"/>
         <oasis:entry colname="col7"/>
         <oasis:entry colname="col8">meltwater</oasis:entry>
       </oasis:row>
     </oasis:thead>
     <oasis:tbody>
       <oasis:row rowsep="1">
         <oasis:entry namest="col1" nameend="col2">Original dataset </oasis:entry>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
         <oasis:entry colname="col6"/>
         <oasis:entry colname="col7"/>
         <oasis:entry colname="col8"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Species observed</oasis:entry>
         <oasis:entry colname="col2">596.3 <inline-formula><mml:math id="M102" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 451.7<sup>ab</sup></oasis:entry>
         <oasis:entry colname="col3">489.6 <inline-formula><mml:math id="M104" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 306.3<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">904.4 <inline-formula><mml:math id="M106" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 532.6<sup>c</sup></oasis:entry>
         <oasis:entry colname="col5">929.2 <inline-formula><mml:math id="M108" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 695.9<sup>bc</sup></oasis:entry>
         <oasis:entry colname="col6">999.9 <inline-formula><mml:math id="M110" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 438.3<sup>cd</sup></oasis:entry>
         <oasis:entry colname="col7">1178.8 <inline-formula><mml:math id="M112" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1121.6<sup>c</sup></oasis:entry>
         <oasis:entry colname="col8">1344.3 <inline-formula><mml:math id="M114" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 910.3<sup>d</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Chao1</oasis:entry>
         <oasis:entry colname="col2">873.5 <inline-formula><mml:math id="M116" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 648.2<sup>ab</sup></oasis:entry>
         <oasis:entry colname="col3">646.8 <inline-formula><mml:math id="M118" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 379.1<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">1316.9 <inline-formula><mml:math id="M120" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 786.1<sup>c</sup></oasis:entry>
         <oasis:entry colname="col5">1285.8 <inline-formula><mml:math id="M122" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 962.3<sup>bc</sup></oasis:entry>
         <oasis:entry colname="col6">1452.8 <inline-formula><mml:math id="M124" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 618.7<sup>cd</sup></oasis:entry>
         <oasis:entry colname="col7">1726.4 <inline-formula><mml:math id="M126" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1736.5<sup>bc</sup></oasis:entry>
         <oasis:entry colname="col8">1898.4 <inline-formula><mml:math id="M128" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1307.7<sup>d</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">ACE</oasis:entry>
         <oasis:entry colname="col2">905.1 <inline-formula><mml:math id="M130" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 682.1<sup>ab</sup></oasis:entry>
         <oasis:entry colname="col3">641.8 <inline-formula><mml:math id="M132" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 388.3<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">1335.5 <inline-formula><mml:math id="M134" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 806.4<sup>c</sup></oasis:entry>
         <oasis:entry colname="col5">1296 <inline-formula><mml:math id="M136" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 979<sup>bc</sup></oasis:entry>
         <oasis:entry colname="col6">1430.8 <inline-formula><mml:math id="M138" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 599<sup>cd</sup></oasis:entry>
         <oasis:entry colname="col7">1760.1 <inline-formula><mml:math id="M140" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1777.7<sup>bc</sup></oasis:entry>
         <oasis:entry colname="col8">1914.2 <inline-formula><mml:math id="M142" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1339.1<sup>d</sup></oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry colname="col1">Shannon diversity</oasis:entry>
         <oasis:entry colname="col2">3.18 <inline-formula><mml:math id="M144" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.38<sup>a</sup></oasis:entry>
         <oasis:entry colname="col3">3.4 <inline-formula><mml:math id="M146" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 0.99<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">4.21 <inline-formula><mml:math id="M148" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 0.84<sup>b</sup></oasis:entry>
         <oasis:entry colname="col5">3.67 <inline-formula><mml:math id="M150" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.09<sup>a</sup></oasis:entry>
         <oasis:entry colname="col6">4.6 <inline-formula><mml:math id="M152" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 0.8<sup>c</sup></oasis:entry>
         <oasis:entry colname="col7">3.8 <inline-formula><mml:math id="M154" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.5<sup>a</sup></oasis:entry>
         <oasis:entry colname="col8">5 <inline-formula><mml:math id="M156" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.2<sup>c</sup></oasis:entry>
       </oasis:row>
       <oasis:row rowsep="1">
         <oasis:entry namest="col1" nameend="col2">Subsampled dataset </oasis:entry>
         <oasis:entry colname="col3"/>
         <oasis:entry colname="col4"/>
         <oasis:entry colname="col5"/>
         <oasis:entry colname="col6"/>
         <oasis:entry colname="col7"/>
         <oasis:entry colname="col8"/>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Species observed</oasis:entry>
         <oasis:entry colname="col2">317.5 <inline-formula><mml:math id="M158" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 293<sup>ab</sup></oasis:entry>
         <oasis:entry colname="col3">239.2 <inline-formula><mml:math id="M160" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 129.5<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">464.8 <inline-formula><mml:math id="M162" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 223<sup>c</sup></oasis:entry>
         <oasis:entry colname="col5">356.1 <inline-formula><mml:math id="M164" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 205.1<sup>ab</sup></oasis:entry>
         <oasis:entry colname="col6">521.7 <inline-formula><mml:math id="M166" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 207.9<sup>cd</sup></oasis:entry>
         <oasis:entry colname="col7">471.9 <inline-formula><mml:math id="M168" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 386.5<sup>bc</sup></oasis:entry>
         <oasis:entry colname="col8">710.1 <inline-formula><mml:math id="M170" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 458.2<sup>d</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Chao1</oasis:entry>
         <oasis:entry colname="col2">568.6 <inline-formula><mml:math id="M172" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 544.6<sup>abc</sup></oasis:entry>
         <oasis:entry colname="col3">357.4 <inline-formula><mml:math id="M174" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 201.4<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">798.9 <inline-formula><mml:math id="M176" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 424.1<sup>d</sup></oasis:entry>
         <oasis:entry colname="col5">613.7 <inline-formula><mml:math id="M178" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 405.5<sup>b</sup></oasis:entry>
         <oasis:entry colname="col6">799.5 <inline-formula><mml:math id="M180" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 325.4<sup>de</sup></oasis:entry>
         <oasis:entry colname="col7">883.2 <inline-formula><mml:math id="M182" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 807.7<sup>cd</sup></oasis:entry>
         <oasis:entry colname="col8">1176.4 <inline-formula><mml:math id="M184" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 836.6<sup>e</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">ACE</oasis:entry>
         <oasis:entry colname="col2">588.9 <inline-formula><mml:math id="M186" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 581.2<sup>abc</sup></oasis:entry>
         <oasis:entry colname="col3">353.4 <inline-formula><mml:math id="M188" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 207.7<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">818.5 <inline-formula><mml:math id="M190" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 442.6<sup>d</sup></oasis:entry>
         <oasis:entry colname="col5">626.1 <inline-formula><mml:math id="M192" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 419.2<sup>b</sup></oasis:entry>
         <oasis:entry colname="col6">795.6 <inline-formula><mml:math id="M194" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 339.9<sup>de</sup></oasis:entry>
         <oasis:entry colname="col7">921.9 <inline-formula><mml:math id="M196" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 868.7<sup>cd</sup></oasis:entry>
         <oasis:entry colname="col8">1207.6 <inline-formula><mml:math id="M198" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 888.5<sup>e</sup></oasis:entry>
       </oasis:row>
       <oasis:row>
         <oasis:entry colname="col1">Shannon diversity</oasis:entry>
         <oasis:entry colname="col2">3.14 <inline-formula><mml:math id="M200" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.35<sup>a</sup></oasis:entry>
         <oasis:entry colname="col3">3.37 <inline-formula><mml:math id="M202" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 0.99<sup>a</sup></oasis:entry>
         <oasis:entry colname="col4">4.14 <inline-formula><mml:math id="M204" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 0.82<sup>b</sup></oasis:entry>
         <oasis:entry colname="col5">3.6 <inline-formula><mml:math id="M206" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.06<sup>a</sup></oasis:entry>
         <oasis:entry colname="col6">4.5 <inline-formula><mml:math id="M208" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 0.8<sup>c</sup></oasis:entry>
         <oasis:entry colname="col7">3.7 <inline-formula><mml:math id="M210" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.4<sup>a</sup></oasis:entry>
         <oasis:entry colname="col8">4.9 <inline-formula><mml:math id="M212" display="inline"><mml:mo>±</mml:mo></mml:math></inline-formula> 1.1<sup>c</sup></oasis:entry>
       </oasis:row>
     </oasis:tbody>
   </oasis:tgroup></oasis:table><table-wrap-foot><p id="d2e1634">Statistical test is based on Kruskal–Wallis one-way ANOVA; multiple testing is performed based on Dunn's post hoc test. Different superscript letters within each row indicate significant pairwise differences between habitats at <inline-formula><mml:math id="M100" display="inline"><mml:mi>P</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M101" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 0.05, based on Kruskal–Wallis one-way ANOVA followed by Dunn's post hoc test (with Bonferroni correction). Values sharing the same letter are not significantly different.</p></table-wrap-foot></table-wrap>

</sec>
<sec id="Ch1.S4.SS1.SSS2">
  <label>4.1.2</label><title>Prokaryotic taxonomy composition in the glaciers of the Three Poles</title>
      <p id="d2e2839">We identified 53 bacterial and archaeal phyla across the dataset. The glacier microbiomes had similar taxonomic composition, dominated by Proteobacteria (averaged 37.8 %), Cyanobacteria (22.2 %), Bacteroidetes (20.3 %), and Actinobacteria (9.2 %) (Fig. 2 and Tables S11). At the class level (Tables S12), the microbiome was dominated by Gammaproteobacteria (22.7 %, Proteobacteria), Oxyphotobacteria (22.1 %, Cyanobacteria), Bacteroidia (22.2 %, Bacteroidetes), Alphaproteobacteria (13 %, Proteobacteria), and Actinobacteria (class) (8.1 %, Actinobacteria).</p>

      <fig id="F2" specific-use="star"><label>Figure 2</label><caption><p id="d2e2844">Taxonomy composition of supraglacial ecosystems in glaciers of the Antarctic, Arctic, Tibetan Plateau, and other alpine regions. Taxonomy is inferred based on amplicon sequencing results.</p></caption>
            <graphic xlink:href="https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025-f02.png"/>

          </fig>

</sec>
<sec id="Ch1.S4.SS1.SSS3">
  <label>4.1.3</label><title>Bacterial community structure in the glaciers of the Three Poles</title>
      <p id="d2e2861">The NMDS ordination plot revealed distinct prokaryotic communities among habitats (Fig. 3a). PERMANOVA analysis showed significantly different prokaryotic community structures among Antarctic, Arctic, Tibetan Plateau, and other non-polar glaciers (<inline-formula><mml:math id="M214" display="inline"><mml:mi>P</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M215" display="inline"><mml:mo>&lt;</mml:mo></mml:math></inline-formula> 0.001). The influence of location exhibited a higher <inline-formula><mml:math id="M216" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup></mml:mrow></mml:math></inline-formula> value (0.10535) than the influence of habitat (<inline-formula><mml:math id="M217" display="inline"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn mathvariant="normal">2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.06299</mml:mn></mml:mrow></mml:math></inline-formula>), suggesting that spatial location may have a greater influence in shaping glacier microbiomes. PERMDISP analysis showed that snow samples exhibited a significantly (at the threshold of <inline-formula><mml:math id="M218" display="inline"><mml:mi>P</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M219" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 0.05) higher dispersal from the centroid (67.4 %) compared to cryoconite (65.1 %). Comparatively, those of ice core and algae were lower (57.9 % and 58.9 %, respectively), possibly due to the low sample numbers.</p>

      <fig id="F3" specific-use="star"><label>Figure 3</label><caption><p id="d2e2921">The community structure of glacier microbiomes across the Antarctic, Arctic, and Tibetan Plateau. <bold>(a)</bold> Microbial community structure differences visualized using the non-metric multidimensional scaling ordination plot. <bold>(b)</bold> The heatmap highlights the distribution pattern of dominant phylotypes for each habitat–region pair.</p></caption>
            <graphic xlink:href="https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025-f03.png"/>

          </fig>

      <p id="d2e2936">We identified the top three most abundant phylotypes for each habitat–region pair (Fig. 3b and Table S13). These abundant phylotypes were mainly affiliated with Proteobacteria, Cyanobacteria, and Bacteroidetes. The distribution of these abundant phylotypes was clustered predominantly by geographical location, reflecting strong spatial effects. We then attempted to identify ubiquitous phylotypes for each region–habitat pair, defined as those present in more than 55 % of samples with a relative abundance greater than 0.1 %. However, we found no phylotypes that were common across any regions or habitats (Table S14). The number of ubiquitous phylotypes varied among region–habitat pairs, ranging from 9 in Arctic ice to 129 in Tibetan supraglacial meltwater. Notably, we did not identify any ubiquitous phylotypes in Arctic snow or other non-polar snow. Most of the ubiquitous phylotypes were classified as Gammaproteobacteria (29 % of the total), followed by Bacteroidetes (19 %), Alphaproteobacteria (16 %), Cyanobacteria (13 %), and Actinobacteria (11 %). This distribution may indicate their ability to disperse and adapt to different environmental conditions.</p>
</sec>
</sec>
<sec id="Ch1.S4.SS2">
  <label>4.2</label><title>Metagenome and genome dataset</title>
      <p id="d2e2948">We acquired 226 glacier metagenome data points (Table S3) and 999 bacterial genomes from glacial environments (Table S4). After quality-filtering, assembly, gene prediction, and dereplication, 63 294 073 unique open reading frames (ORFs) were obtained. Of these dereplicated ORFs, 47.8 % (29 947 128) can be functionally annotated using eggNOG.</p>
<sec id="Ch1.S4.SS2.SSS1">
  <label>4.2.1</label><title>Overall features of glacier metagenome-assembled genomes</title>
      <p id="d2e2958">After binning, the dataset generated 3502 metagenome-assembled genomes of medium quality (genome completion <inline-formula><mml:math id="M220" display="inline"><mml:mo>≥</mml:mo></mml:math></inline-formula> 50 %, contamination <inline-formula><mml:math id="M221" display="inline"><mml:mo>&lt;</mml:mo></mml:math></inline-formula> 10 %) and higher (Bowers et al., 2017b). After combining the genomes of cultivated glacier bacteria (999), this expanded the total genome number to 4501 from the previously published 3322 (Liu et al., 2022) (Table S15), a 35.5 % increase. The median genome size was 3.46 Mb, ranging from 0.42 to 10.49 Mb; the GC percentage was 60 %, ranging from 30 % to 76 %. The MAGs were taxonomically affiliated with 33 phyla, 79 classes, 154 orders, 271 families, and 549 genera (Fig. 4a). Additionally, 3470 (77.1 % of all MAGs) were unable to be classified at the species level (Fig. 4b), reflecting substantial genomic novelty in the glacier microbiome. These genomes were dereplicated into 1400 genomic OTUs (gOTUs), which are typically considered species.</p>

      <fig id="F4" specific-use="star"><label>Figure 4</label><caption><p id="d2e2977">Taxonomy classification of the obtained prokaryotic genomes. <bold>(a)</bold> The phylogenetic tree contains the representative bacterial genomic OTUs with genome size and GC percentage being shown. <bold>(b)</bold> The taxonomic classification of the obtained genomes. Classified refers to valid taxonomic classification, placeholders are genomes that have been deposited in the GTDB R220 database, and unclassified refers to genomes that have not been deposited in the GTDB database.</p></caption>
            <graphic xlink:href="https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025-f04.png"/>

          </fig>

</sec>
<sec id="Ch1.S4.SS2.SSS2">
  <label>4.2.2</label><title>Key functional genes</title>
      <p id="d2e3000"><italic>Carbohydrate-active enzymes.</italic> The dataset contains 1 082 125 genes encoding carbohydrate-active enzymes (CAZymes; Fig. 5a), i.e., those enzymes involved in the metabolism of glycoconjugates, oligosaccharides, and polysaccharides (Zerillo et al., 2013). Genes associated with carbohydrate hydrolysis (GH) and biosynthesis (GT) were the most abundant, accounting for 45.2 % and 44.4 %, respectively. In contrast, those genes associated with non-hydrolytic cleavage of glycosidic bonds (PL), hydrolysis of carbohydrate esters (CEW), and assisting in degrading biomass substrates (AA) were relatively scarce, accounting for 0.8 %, 3.1 %, and 0.2 % of the predicted CAZymes, respectively. This indicates that the glacier microbiome is competent in a diverse range of carbon transformation processes, mediating the delivery of carbon to downstream ecosystems.</p>

      <fig id="F5" specific-use="star"><label>Figure 5</label><caption><p id="d2e3007">The distribution of genes associated with carbohydrate-active enzymes (CAZymes) in glaciers. <bold>(a)</bold> The relative contributions of genes associated with different CAZymes in each habitat (GH: glycoside hydrolases; GT: glycosyl transferases; PL: polysaccharide lyases; CE: carbohydrate esterases; AA: auxiliary activities). <bold>(b)</bold> The most diverse CAZymes in each habitat–region combination. <bold>(c)</bold> PCA plots show the distribution of CAZymes across habitats and regions. <bold>(d)</bold> The selective enrichment of CAZymes between cryoconite and snow and between cryoconite and ice.</p></caption>
            <graphic xlink:href="https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025-f05.png"/>

          </fig>

      <p id="d2e3028">We further examined the distribution of CAZyme genes across different glaciers. At the CAZY family level, GT2, GT4, GH13, and GT51 were the most diverse across all habitats (Fig. 5b). PERMANOVA tests revealed significant composition differences by both habitat (pseudo-<inline-formula><mml:math id="M222" display="inline"><mml:mi>F</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M223" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 10.014, <inline-formula><mml:math id="M224" display="inline"><mml:mi>P</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M225" display="inline"><mml:mo>&lt;</mml:mo></mml:math></inline-formula> 0.001) and region (pseudo-<inline-formula><mml:math id="M226" display="inline"><mml:mi>F</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M227" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 5.038, <inline-formula><mml:math id="M228" display="inline"><mml:mrow><mml:mi>P</mml:mi><mml:mo>=</mml:mo><mml:mn mathvariant="normal">0.002</mml:mn></mml:mrow></mml:math></inline-formula>), with habitat exhibiting a greater influence on CAZY composition. Specifically, the principal component analysis (PCA) plot revealed that cryoconites harbor a greater number of genes classified as GH5 and GH9 (Fig. 5c). Furthermore, 30 GHs and 20 GTs exhibited a significantly higher contribution in cryoconites than in ice or snow (Fig. 5d). Comparatively, 15 GHs and 27 GTs exhibited a significantly higher contribution in ice or snow than in cryoconites. Thus, cryoconites exhibited higher capacity in the catabolism of organic carbon, whereas snow and ice are more prevalent in anabolism.</p>
      <p id="d2e3087"><italic>Nitrogen cycling.</italic> The dataset contained 138 421 unique genes associated with nitrogen cycling, most of which (99.3 %) were associated with nitrate reduction and/or denitrification pathways (Fig. 6a). These genes included the <italic>nirB</italic> gene responsible for the nitrite reduction to ammonia in the assimilatory nitrate reduction pathway, the <italic>narB</italic> and <italic>nirA</italic> genes responsible for sequential nitrate reduction to ammonia in dissimilatory nitrate reduction pathways, and the <italic>nirK</italic> gene responsible for nitrite reduction to nitric oxide in the denitrification pathway. This suggests that microbially driven nitrate reduction is widespread in glacial habitats for both nitrogen assimilation and energy supply, highlighting their potential roles in NO<sub><italic>x</italic></sub> formation. In comparison, genes involved in nitrogen fixation (<italic>nifH</italic>) and nitrification (<italic>hao</italic>) were relatively rare, with only 678 (0.49 % of the nitrogen cycling-related genes) and 240 (0.17 %) unique genes identified, respectively. This suggests that microorganisms capable of these high-energy demand processes only account for a small fraction of the glacial microbiome, which is consistent with the low nitrogen fixation rates reported in glacier-related habitats (Telling et al., 2011).</p>

      <fig id="F6" specific-use="star"><label>Figure 6</label><caption><p id="d2e3122">Features of the functional genes across the glacier metagenomes from the Antarctic, Arctic, and Tibetan Plateau. <bold>(a)</bold> Nitrogen cycling (the numbers indicate the number of genes identified; genes of the anaerobic ammonium oxidation pathway are not identified in the glacier metagenomes), <bold>(b)</bold> methane cycling (the <italic>mcrA</italic> gene is responsible for methanogenesis, the <italic>mmoX</italic> gene is the soluble-form methane oxidation gene, and <italic>pmoA</italic> is the particulate-form methane oxidation gene, both of which are associated with methane oxidation), <bold>(c)</bold> genes associated with antibiotic resistance, and <bold>(d)</bold> the number of genes associated with virulence factors (the numbers have been square root-transformed).</p></caption>
            <graphic xlink:href="https://essd.copernicus.org/articles/17/5165/2025/essd-17-5165-2025-f06.png"/>

          </fig>

      <p id="d2e3153">The differences in gene distributions are apparent among habitats. Specifically, the genes associated with nitrogen fixation and denitrification were mainly present in cryoconites. The former could be explained by the high abundance of Cyanobacteria (Fig. 2), while the latter could be attributed to its anaerobic conditions. Thus, the cryoconite could be a potential source of N<sub>2</sub>O. Comparatively, <italic>amoA</italic> (in nitrification) was mainly identified from ice, while <italic>norB</italic> and <italic>nosZ</italic> (in denitrification) were also abundant. This suggests that ice could harbor greater functional diversity than snow, with the capacity for nitrogen transformation and influencing the nutrients discharged to downstream ecosystems.</p>
      <p id="d2e3174"><italic>Methane cycling.</italic> The dataset contained 154 methane cycling-related genes. Of these, 93 were the soluble form of methane oxidase (<italic>mmoX</italic>), accounting for 61 % of the total methane-cycling genes identified (Fig. 6b). More <italic>mmoX</italic> genes were identified from cryoconite (34.4 % of the total methane-cycling genes identified) than from ice (20.8 %) or snow (5.2 %). Conversely, genes associated with the particulate form of methane oxidation (<italic>pmoA</italic>, <italic>pmoB</italic>, and <italic>pmoC</italic>) were more frequently identified from ice (21.4 %) than from cryoconite (5.8 %) and snow (3.2 %). The two forms of methane monooxygenase (sMMO and pMMO) have distinct enzymatic characteristics and are expressed under different growth conditions. Specifically, sMMO is expressed under low-copper conditions (<inline-formula><mml:math id="M231" display="inline"><mml:mo lspace="0mm">≤</mml:mo></mml:math></inline-formula> 0.9 nmol Cu per mg of cell protein), while pMMO is expressed under relatively high copper–biomass ratios (Zhang et al., 2017). Furthermore, sMMO has a broader substrate range and can oxidize methane, short-chain alkane, alkene, and aromatic compounds, while pMMO can only oxidize alkanes of less than five carbons (Trotsenko and Murrell, 2008). Despite not being empirically measured, the cryoconite is expected to contain a higher concentration of copper than the ice, as the former is precipitated dust. Thus, the higher diversity of sMMO in the cryoconite could be associated with its ability to oxidize diverse alkanes, which may be present in soils. In comparison, high-affinity pMMO could oxidize methane at atmospheric levels, which may support microbial communities in the oligotrophic ice habitat. Only six unique methanogenesis-related genes (<italic>mcrA</italic>) were identified, almost exclusively in cryoconite metagenomes. This is consistent with the cryoconite as a methane source in the literature (Zhang et al., 2021).</p>
      <p id="d2e3205"><italic>Antimicrobial resistance genes.</italic> Using thresholds of 80 % identity and 80 % sequence coverage, we identified 1166 ORFs that exhibited high sequence similarity to 224 antibiotic resistance genes (ARG). Of these identified ARGs, <italic>MexF</italic>, beta-lactamase, and <italic>mexK</italic> were the most abundant, accounting for 8.1 %, 4.2 %, and 3.7 % of the ARGs identified, respectively (Table S16). The predominant antibiotic resistance mechanisms were antibiotic efflux and antibiotic inactivation, accounting for 44 % and 41 % of the total ARGs identified, respectively. These ARGs were predicted to confer resistance against 30 different antibiotics, with penam, tetracycline, and macrolide being the most commonly encountered resistant targets. Additionally, 54 % of the identified ARGs provided multiple-drug resistance, with the <italic>OprM</italic>, <italic>CpxR</italic>, and <italic>tolC</italic> genes conferring resistance to 16, 15, and 15 types of antibiotics, respectively. ARGs were identified in 566 genomes (13 % of the total genomes obtained). This low proportion of ARG-bearing genomes suggests that the glacier habitats are only weakly affected by antibiotic contamination. Of the genomes containing ARGs, 48.6 % and 34.1 % were affiliated with Proteobacteria and Firmicutes, respectively (Fig. 6c). However, the resistance mechanisms exhibited by these two bacterial phyla were markedly distinct, with antibiotic efflux (<italic>MexF</italic>) and antibiotic target alternation (<italic>vanZf</italic>)/inactivation (<italic>FosB</italic>) being the most common mechanisms for Proteobacteria and Firmicutes, respectively. Most of the genomes (<inline-formula><mml:math id="M232" display="inline"><mml:mi>n</mml:mi></mml:math></inline-formula> <inline-formula><mml:math id="M233" display="inline"><mml:mo>=</mml:mo></mml:math></inline-formula> 224) carried only a single ARG, while 7 genomes possessed more than 10 ARG genes, with <italic>Pseudomonas aeruginosa</italic> genomes hosting up to 48 ARGs.</p>
      <p id="d2e3253"><italic>Virulence factors.</italic> Using thresholds of 80 % identity and 80 % coverage, the dataset contains 66 822 virulence factor genes, accounting for 0.11 % of the total ORFs identified (Table S17). Virulence factors were predominately associated with adherence, motility, and immune modulation functions, while those associated with toxin production accounted for only 0.48 % (Fig. 6d). We did not detect any toxin genes from the genomes obtained using the same thresholds, with only those associated with regulation, effector delivery systems, and metabolic factors being identified from Proteobacteria, Actinobacteria, and Deinococcota genomes. Nevertheless, 878 potential toxin genes were identified from the genomes if the criteria were loosened, with sequence identity ranging from 20.1 % to 67.8 %, which may represent novel toxins without references in the dataset or non-toxin genes that are homologous to known toxin genes. These candidate toxin genes were most abundantly identified in Gammaproteobacteria, followed by Bacteroides (15.9 %) and Alphaproteobacteria (10.0 %).</p>
</sec>
</sec>
</sec>

      
      </body>
    <back><app-group>
        <supplementary-material position="anchor"><p id="d2e3257">The supplement related to this article is available online at <inline-supplementary-material xlink:href="https://doi.org/10.5194/essd-17-5165-2025-supplement" xlink:title="zip">https://doi.org/10.5194/essd-17-5165-2025-supplement</inline-supplementary-material>.</p></supplementary-material>
        </app-group><notes notes-type="authorcontribution"><title>Author contributions</title>

      <p id="d2e3271">YL conceptualized the paper; SH, YL, TY, ZZ, YC, KL, PL, JL, RD, and MJ analyzed the data; TY, SG, QS, GF, LW, and JM developed the website; MJ and YL prepared the manuscript with contributions from all authors.</p>
  </notes><notes notes-type="competinginterests"><title>Competing interests</title>

      <p id="d2e3277">The contact author has declared that none of the authors has any competing interests.</p>
  </notes><notes notes-type="disclaimer"><title>Disclaimer</title>

      <p id="d2e3283">Publisher's note: Copernicus Publications remains neutral with regard to jurisdictional claims made in the text, published maps, institutional affiliations, or any other geographical representation in this paper. While Copernicus Publications makes every effort to include appropriate place names, the final responsibility lies with the authors.</p>
  </notes><notes notes-type="financialsupport"><title>Financial support</title>

      <p id="d2e3289">This study was supported by the National Natural Science Foundation of China (42421001, Yongqin Liu; 42425607, Mukan Ji) and the Department of Science and Technology, Gansu, China (25RCKA021, Mukan Ji).</p>
  </notes><notes notes-type="reviewstatement"><title>Review statement</title>

      <p id="d2e3295">This paper was edited by Dalei Hao and reviewed by four anonymous referees.</p>
  </notes><ref-list>
    <title>References</title>

      <ref id="bib1.bib1"><label>1</label><mixed-citation>Alcock, B. P., Raphenya, A. R., Lau, T. T. Y., Tsang, K. K., Bouchard, M., Edalatmand, A., Huynh, W., Nguyen, A. V., Cheng, A. A., Liu, S., Min, S. Y., Miroshnichenko, A., Tran, H. K., Werfalli, R. E., Nasir, J. A., Oloni, M., Speicher, D. J., Florescu, A., Singh, B., Faltyn, M., Hernandez-Koutoucheva, A., Sharma, A. N., Bordeleau, E., Pawlowski, A. C., Zubyk, H. L., Dooley, D., Griffiths, E., Maguire, F., Winsor, G. L., Beiko, R. G., Brinkman, F. S. L., Hsiao, W. W. L., Domselaar, G. V., and McArthur, A. G.: CARD 2020: antibiotic resistome surveillance with the comprehensive antibiotic resistance database, Nucleic Acids Res., 48, D517–D525, <ext-link xlink:href="https://doi.org/10.1093/nar/gkz935" ext-link-type="DOI">10.1093/nar/gkz935</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib2"><label>2</label><mixed-citation>Anderson, M. J.: Permutational Multivariate Analysis of Variance (PERMANOVA), Wiley StatsRef: Statistics Reference Online, <ext-link xlink:href="https://doi.org/10.1002/9781118445112.stat07841" ext-link-type="DOI">10.1002/9781118445112.stat07841</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib3"><label>3</label><mixed-citation>Anesio, A. M. and Laybourn-Parry, J.: Glaciers and ice sheets as a biome, Trends Ecol. Evol., 27, 219–225, <ext-link xlink:href="https://doi.org/10.1016/j.tree.2011.09.012" ext-link-type="DOI">10.1016/j.tree.2011.09.012</ext-link>, 2012.</mixed-citation></ref>
      <ref id="bib1.bib4"><label>4</label><mixed-citation>Anesio, A. M., Lutz, S., Chrismas, N. A. M., and Benning, L. G.: The microbiome of glaciers and ice sheets, NPJ Biofilms Microbi., 3, 10, <ext-link xlink:href="https://doi.org/10.1038/s41522-017-0019-0" ext-link-type="DOI">10.1038/s41522-017-0019-0</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib5"><label>5</label><mixed-citation>Boetius, A., Anesio, A. M., Deming, J. W., Mikucki, J. A., and Rapp, J. Z.: Microbial ecology of the cryosphere: sea ice and glacial habitats, Nat. Rev. Microbiol., 13, 677–690, <ext-link xlink:href="https://doi.org/10.1038/nrmicro3522" ext-link-type="DOI">10.1038/nrmicro3522</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib6"><label>6</label><mixed-citation>Bowers, R. M., Kyrpides, N. C., Stepanauskas, R., Harmon-Smith, M., Doud, D., Reddy, T. B. K., Schulz, F., Jarett, J., Rivers, A. R., Eloe-Fadrosh, E. A., Tringe, S. G., Ivanova, N. N., Copeland, A., Clum, A., Becraft, E. D., Malmstrom, R. R., Birren, B., Podar, M., Bork, P., Weinstock, G. M., Garrity, G. M., Dodsworth, J. A., Yooseph, S., Sutton, G., Glöckner, F. O., Gilbert, J. A., Nelson, W. C., Hallam, S. J., Jungbluth, S. P., Ettema, T. J. G., Tighe, S., Konstantinidis, K. T., Liu, W. T., Baker, B. J., Rattei, T., Eisen, J. A., Hedlund, B., McMahon, K. D., Fierer, N., Knight, R., Finn, R., Cochrane, G., Karsch-Mizrachi, I., Tyson, G. W., Rinke, C., Lapidus, A., Meyer, F., Yilmaz, P., Parks, D. H., Eren, A. M., Schriml, L., Banfield, J. F., Hugenholtz, P., and Woyke, T.: Minimum information about a single amplified genome (MISAG) and a metagenome-assembled genome (MIMAG) of bacteria and archaea, Nat. Biotechnol., 35, 725–731, <ext-link xlink:href="https://doi.org/10.1038/nbt.3893" ext-link-type="DOI">10.1038/nbt.3893</ext-link>, 2017a.</mixed-citation></ref>
      <ref id="bib1.bib7"><label>7</label><mixed-citation>Bowers, R. M., Kyrpides, N. C., Stepanauskas, R., Harmon-Smith, M., Doud, D., Reddy, T. B. K., Schulz, F., Jarett, J., Rivers, A. R., Eloe-Fadrosh, E. A., Tringe, S. G., Ivanova, N. N., Copeland, A., Clum, A., Becraft, E. D., Malmstrom, R. R., Birren, B., Podar, M., Bork, P., Weinstock, G. M., Garrity, G. M., Dodsworth, J. A., Yooseph, S., Sutton, G., Glöckner, F. O., Gilbert, J. A., Nelson, W. C., Hallam, S. J., Jungbluth, S. P., Ettema, T. J. G., Tighe, S., Konstantinidis, K. T., Liu, W.-T., Baker, B. J., Rattei, T., Eisen, J. A., Hedlund, B., McMahon, K. D., Fierer, N., Knight, R., Finn, R., Cochrane, G., Karsch-Mizrachi, I., Tyson, G. W., Rinke, C., Kyrpides, N. C., Schriml, L., Garrity, G. M., Hugenholtz, P., Sutton, G., Yilmaz, P., Meyer, F., Glöckner, F. O., Gilbert, J. A., Knight, R., Finn, R., Cochrane, G., Karsch-Mizrachi, I., Lapidus, A., Meyer, F., Yilmaz, P., Parks, D. H., Murat Eren, A., Schriml, L., Banfield, J. F., Hugenholtz, P., Woyke, T., and The Genome Standards, C.: Minimum information about a single amplified genome (MISAG) and a metagenome-assembled genome (MIMAG) of bacteria and archaea, Nat. Biotechnol., 35, 725–731, <ext-link xlink:href="https://doi.org/10.1038/nbt.3893" ext-link-type="DOI">10.1038/nbt.3893</ext-link>, 2017b.</mixed-citation></ref>
      <ref id="bib1.bib8"><label>8</label><mixed-citation>Buchfink, B., Reuter, K., and Drost, H. G.: Sensitive protein alignments at tree-of-life scale using DIAMOND, Nat. Methods, 18, 366–368, <ext-link xlink:href="https://doi.org/10.1038/s41592-021-01101-x" ext-link-type="DOI">10.1038/s41592-021-01101-x</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib9"><label>9</label><mixed-citation>Cameron, K. A., Hodson, A. J., and Osborn, A. M.: Carbon and nitrogen biogeochemical cycling potentials of supraglacial cryoconite communities, Polar Biol., 35, 1375–1393, <ext-link xlink:href="https://doi.org/10.1007/s00300-012-1178-3" ext-link-type="DOI">10.1007/s00300-012-1178-3</ext-link>, 2012.</mixed-citation></ref>
      <ref id="bib1.bib10"><label>10</label><mixed-citation>Cauvy-Fraunié, S. and Dangles, O.: A global synthesis of biodiversity responses to glacier retreat, Nat. Ecol. Evol., 3, 1675–1685, <ext-link xlink:href="https://doi.org/10.1038/s41559-019-1042-8" ext-link-type="DOI">10.1038/s41559-019-1042-8</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib11"><label>11</label><mixed-citation>Chaumeil, P. A., Mussig, A. J., Hugenholtz, P., and Parks, D. H.: GTDB-Tk: a toolkit to classify genomes with the Genome Taxonomy Database, Bioinformatics, 36, 1925–1927, <ext-link xlink:href="https://doi.org/10.1093/bioinformatics/btz848" ext-link-type="DOI">10.1093/bioinformatics/btz848</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib12"><label>12</label><mixed-citation>Ciccazzo, S., Esposito, A., Borruso, L., and Brusetti, L.: Microbial communities and primary succession in high altitude mountain environments, Ann. Microbiol., 66, 43–60, <ext-link xlink:href="https://doi.org/10.1007/s13213-015-1130-1" ext-link-type="DOI">10.1007/s13213-015-1130-1</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bib13"><label>13</label><mixed-citation>Cook, J., Edwards, A., Takeuchi, N., and Irvine-Fynn, T.: Cryoconite: The dark biological secret of the cryosphere, Prog. Phys. Geogr., 40, 66–111, <ext-link xlink:href="https://doi.org/10.1177/0309133315616574" ext-link-type="DOI">10.1177/0309133315616574</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bib14"><label>14</label><mixed-citation>Delgado-Baquerizo, M., Oliverio, A. M., Brewer, T. E., Benavent-Gonzalez, A., Eldridge, D. J., Bardgett, R. D., Maestre, F. T., Singh, B. K., and Fierer, N.: A global atlas of the dominant bacteria found in soil, Science, 359, 320–325, <ext-link xlink:href="https://doi.org/10.1126/science.aap9516" ext-link-type="DOI">10.1126/science.aap9516</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib15"><label>15</label><mixed-citation>Edgar, R. C.: Search and clustering orders of magnitude faster than BLAST, Bioinformatics, 26, 2460–2461, <ext-link xlink:href="https://doi.org/10.1093/bioinformatics/btq461" ext-link-type="DOI">10.1093/bioinformatics/btq461</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib16"><label>16</label><mixed-citation>Fredriksson, N. J., Hermansson, M., and Wilén, B. M.: The Choice of PCR Primers Has Great Impact on Assessments of Bacterial Community Diversity and Dynamics in a Wastewater Treatment Plant, Plos One, 8, e76431, <ext-link xlink:href="https://doi.org/10.1371/journal.pone.0076431" ext-link-type="DOI">10.1371/journal.pone.0076431</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib17"><label>17</label><mixed-citation>Guo, B. X., Liu, Y. Q., Liu, K. S., Shi, Q., He, C., Cai, R. H., and Jiao, N. Z.: Different dissolved organic matter composition between central and southern glaciers on the Tibetan Plateau, Ecol. Indic., 139, 108888, <ext-link xlink:href="https://doi.org/10.1016/j.ecolind.2022.108888" ext-link-type="DOI">10.1016/j.ecolind.2022.108888</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib18"><label>18</label><mixed-citation>Hood, E., Battin, T. J., Fellman, J., O'Neel, S., and Spencer, R. G. M.: Storage and release of organic carbon from glaciers and ice sheets, Nat. Geosci., 8, 91–96, <ext-link xlink:href="https://doi.org/10.1038/ngeo2331" ext-link-type="DOI">10.1038/ngeo2331</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib19"><label>19</label><mixed-citation>Hotaling, S., Finn, D. S., Giersch, J. J., Weisrock, D. W., and Jacobsen, D.: Climate change and alpine stream biology: progress, challenges, and opportunities for the future, Biol. Rev. Camb. Philos. Soc., 92, 2024–2045, <ext-link xlink:href="https://doi.org/10.1111/brv.12319" ext-link-type="DOI">10.1111/brv.12319</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib20"><label>20</label><mixed-citation>Huerta-Cepas, J., Forslund, K., Coelho, L. P., Szklarczyk, D., Jensen, L. J., von Mering, C., and Bork, P.: Fast genome-wide functional annotation through orthology assignment by eggNOG-Mapper, Mol. Biol. Evol., 34, 2115–2122, <ext-link xlink:href="https://doi.org/10.1093/molbev/msx148" ext-link-type="DOI">10.1093/molbev/msx148</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib21"><label>21</label><mixed-citation>Huerta-Cepas, J., Szklarczyk, D., Heller, D., Hernández-Plaza, A., Forslund, S. K., Cook, H., Mende, D. R., Letunic, I., Rattei, T., Jensen, L. J., von Mering, C., and Bork, P.: eggNOG 5.0: a hierarchical, functionally and phylogenetically annotated orthology resource based on 5090 organisms and 2502 viruses, Nucleic Acids Res., 47, D309–D314, <ext-link xlink:href="https://doi.org/10.1093/nar/gky1085" ext-link-type="DOI">10.1093/nar/gky1085</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib22"><label>22</label><mixed-citation>Hyatt, D., Chen, G. L., Locascio, P. F., Land, M. L., Larimer, F. W., and Hauser, L. J.: Prodigal: prokaryotic gene recognition and translation initiation site identification, BMC Bioinform., 11, 119, <ext-link xlink:href="https://doi.org/10.1186/1471-2105-11-119" ext-link-type="DOI">10.1186/1471-2105-11-119</ext-link>, 2010.</mixed-citation></ref>
      <ref id="bib1.bib23"><label>23</label><mixed-citation>Ji, M.: OTU tables with and without subsampling, figshare [data set], <ext-link xlink:href="https://doi.org/10.6084/m9.figshare.28423781.v2" ext-link-type="DOI">10.6084/m9.figshare.28423781.v2</ext-link>, 2025.</mixed-citation></ref>
      <ref id="bib1.bib24"><label>24</label><mixed-citation>Jia, B., Raphenya, A. R., Alcock, B., Waglechner, N., Guo, P., Tsang, K. K., Lago, B. A., Dave, B. M., Pereira, S., Sharma, A. N., Doshi, S., Courtot, M., Lo, R., Williams, L. E., Frye, J. G., Elsayegh, T., Sardar, D., Westman, E. L., Pawlowski, A. C., Johnson, T. A., Brinkman, F. S., Wright, G. D., and McArthur, A. G.: CARD 2017: expansion and model-centric curation of the comprehensive antibiotic resistance database, Nucleic Acids Res., 45, D566–D573, <ext-link xlink:href="https://doi.org/10.1093/nar/gkw1004" ext-link-type="DOI">10.1093/nar/gkw1004</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib25"><label>25</label><mixed-citation>Kanehisa, M., Furumichi, M., Tanabe, M., Sato, Y., and Morishima, K.: KEGG: new perspectives on genomes, pathways, diseases and drugs, Nucleic Acids Res., 45, D353–D361, <ext-link xlink:href="https://doi.org/10.1093/nar/gkw1092" ext-link-type="DOI">10.1093/nar/gkw1092</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib26"><label>26</label><mixed-citation>Kang, D. D., Li, F., Kirton, E., Thomas, A., Egan, R., An, H., and Wang, Z.: MetaBAT 2: an adaptive binning algorithm for robust and efficient genome reconstruction from metagenome assemblies, PeerJ, 7, e7359, <ext-link xlink:href="https://doi.org/10.7717/peerj.7359" ext-link-type="DOI">10.7717/peerj.7359</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib27"><label>27</label><mixed-citation>Levasseur, A., Drula, E., Lombard, V., Coutinho, P. M., and Henrissat, B.: Expansion of the enzymatic repertoire of the CAZy database to integrate auxiliary redox enzymes, Biotechnol. Biofuels, 6, 41, <ext-link xlink:href="https://doi.org/10.1186/1754-6834-6-41" ext-link-type="DOI">10.1186/1754-6834-6-41</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib28"><label>28</label><mixed-citation>Liu, B., Zheng, D., Jin, Q., Chen, L., and Yang, J.: VFDB 2019: a comparative pathogenomic platform with an interactive web interface, Nucleic Acids Res., 47, D687–D692, <ext-link xlink:href="https://doi.org/10.1093/nar/gky1080" ext-link-type="DOI">10.1093/nar/gky1080</ext-link>, 2019.</mixed-citation></ref>
      <ref id="bib1.bib29"><label>29</label><mixed-citation>Liu, Y., Ji, M., Yu, T., Zaugg, J., Anesio, A. M., Zhang, Z., Hu, S., Hugenholtz, P., Liu, K., and Liu, P.: A genome and gene catalog of glacier microbiomes, Nat. Biotechnol., 40, 1341–1348, <ext-link xlink:href="https://doi.org/10.1038/s41587-022-01367-2" ext-link-type="DOI">10.1038/s41587-022-01367-2</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib30"><label>30</label><mixed-citation>Liu, Y., Hu, S., Yu, T., Luo, Y., Zhang, Z., Chen, Y., Guo, S., S, Q., Fan, G., Wu, L., Ma, J., Liu, K., Liu, P., Liu, J., and Ji, M.: A database of glacier microbiomes for the Three Poles, National Tibetan Plateau Data Center, National Tibetan Plateau Data Center [data set], <ext-link xlink:href="https://doi.org/10.11888/Cryos.tpdc.300830" ext-link-type="DOI">10.11888/Cryos.tpdc.300830</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib31"><label>31</label><mixed-citation>Mao, G., Ji, M., Jiao, N., Su, J., Zhang, Z., Liu, K., Chen, Y., and Liu, Y.: Monsoon affects the distribution of antibiotic resistome in Tibetan glaciers, Environ. Pollut., 317, 120809, <ext-link xlink:href="https://doi.org/10.1016/j.envpol.2022.120809" ext-link-type="DOI">10.1016/j.envpol.2022.120809</ext-link>, 2023.</mixed-citation></ref>
      <ref id="bib1.bib32"><label>32</label><mixed-citation>Mogrovejo-Arias, D. C., Brill, F. H. H., and Wagner, D.: Potentially pathogenic bacteria isolated from diverse habitats in Spitsbergen, Svalbard, Environ. Earth Sci., 79, 109, <ext-link xlink:href="https://doi.org/10.1007/s12665-020-8853-4" ext-link-type="DOI">10.1007/s12665-020-8853-4</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib33"><label>33</label><mixed-citation>Nissen, J. N., Johansen, J., Allesøe, R. L., Sønderby, C. K., Armenteros, J. J. A., Grønbech, C. H., Jensen, L. J., Nielsen, H. B., Petersen, T. N., Winther, O., and Rasmussen, S.: Improved metagenome binning and assembly using deep variational autoencoders, Nat. Biotechnol., 39, 555–560, <ext-link xlink:href="https://doi.org/10.1038/s41587-020-00777-4" ext-link-type="DOI">10.1038/s41587-020-00777-4</ext-link>, 2021.</mixed-citation></ref>
      <ref id="bib1.bib34"><label>34</label><mixed-citation>Ogle, D. H., Doll, J. C., Wheeler, P., and Dinno, A.: FSA: Fisheries Stock Analysis [code], <ext-link xlink:href="https://doi.org/10.32614/CRAN.package.FSA" ext-link-type="DOI">10.32614/CRAN.package.FSA</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib35"><label>35</label><mixed-citation>Parks, D. H., Rinke, C., Chuvochina, M., Chaumeil, P. A., Woodcroft, B. J., Evans, P. N., Hugenholtz, P., and Tyson, G. W.: Recovery of nearly 8,000 metagenome-assembled genomes substantially expands the tree of life, Nat. Microbiol., 2, 1533–1542, <ext-link xlink:href="https://doi.org/10.1038/s41564-017-0012-7" ext-link-type="DOI">10.1038/s41564-017-0012-7</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib36"><label>36</label><mixed-citation>Qiu, J.: China: The thrid pole, Nature, 454, 393–396, <ext-link xlink:href="https://doi.org/10.1038/454393a" ext-link-type="DOI">10.1038/454393a</ext-link>, 2008.</mixed-citation></ref>
      <ref id="bib1.bib37"><label>37</label><mixed-citation>Quast, C., Pruesse, E., Yilmaz, P., Gerken, J., Schweer, T., Yarza, P., Peplies, J., and Glöckner, F. O.: The SILVA ribosomal RNA gene database project: improved data processing and web-based tools, Nucleic Acids Res., 41, D590–D596, <ext-link xlink:href="https://doi.org/10.1093/nar/gks1219" ext-link-type="DOI">10.1093/nar/gks1219</ext-link>, 2012.</mixed-citation></ref>
      <ref id="bib1.bib38"><label>38</label><mixed-citation>Segawa, T. K., Ushida, K., Agata, K., Okada, N., and Kohshima, S.: Seasonal change in bacterial flora and biomass in mountain snow from the Tateyama mountains, Japan, analyzed by 16S rRNA gene sequencing and real-time PCR, Appl. Environ. Microbiol., 71, 123–130, <ext-link xlink:href="https://doi.org/10.1128/AEM.71.1.123-130.2005" ext-link-type="DOI">10.1128/AEM.71.1.123-130.2005</ext-link>, 2005.</mixed-citation></ref>
      <ref id="bib1.bib39"><label>39</label><mixed-citation>Steinegger, M. and Söding, J.: MMseqs2 enables sensitive protein sequence searching for the analysis of massive data sets, Nat. Biotechnol., 35, 1026–1028, <ext-link xlink:href="https://doi.org/10.1038/nbt.3988" ext-link-type="DOI">10.1038/nbt.3988</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib40"><label>40</label><mixed-citation>Stevens, I. T., Irvine-Fynn, T. D. L., Edwards, A., Mitchell, A. C., Cook, J. M., Porter, P. R., Holt, T. O., Huss, M., Fettweis, X., Moorman, B. J., Sattler, B., and Hodson, A. J.: Spatially consistent microbial biomass and future cellular carbon release from melting Northern Hemisphere glacier surfaces, Commun. Earth Environ., 3, 275, <ext-link xlink:href="https://doi.org/10.1038/s43247-022-00609-0" ext-link-type="DOI">10.1038/s43247-022-00609-0</ext-link>, 2022.</mixed-citation></ref>
      <ref id="bib1.bib41"><label>41</label><mixed-citation>Stibal, M., Bradley, J. A., Edwards, A., Hotaling, S., Zawierucha, K., Rosvold, J., Lutz, S., Cameron, K. A., Mikucki, J. A., Kohler, T. J., Sabacka, M., and Anesio, A. M.: Glacial ecosystems are essential to understanding biodiversity responses to glacier retreat, Nat. Ecol. Evol., 4, 686–687, <ext-link xlink:href="https://doi.org/10.1038/s41559-020-1163-0" ext-link-type="DOI">10.1038/s41559-020-1163-0</ext-link>, 2020.</mixed-citation></ref>
      <ref id="bib1.bib42"><label>42</label><mixed-citation>Taheran, M., Naghdi, M., Brar, S. K., Verma, M., and Surampalli, R. Y.: Emerging contaminants: Here today, there tomorrow!, Environ. Nanotechnol. Monit. Manag., 10, 122–126, <ext-link xlink:href="https://doi.org/10.1016/j.enmm.2018.05.010" ext-link-type="DOI">10.1016/j.enmm.2018.05.010</ext-link>, 2018.</mixed-citation></ref>
      <ref id="bib1.bib43"><label>43</label><mixed-citation>Tatusov, R. L., Fedorova, N. D., Jackson, J. D., Jacobs, A. R., Kiryutin, B., Koonin, E. V., Krylov, D. M., Mazumder, R., Mekhedov, S. L., Nikolskaya, A. N., Rao, B. S., Smirnov, S., Sverdlov, A. V., Vasudevan, S., Wolf, Y. I., Yin, J. J., and Natale, D. A.: The COG database: an updated version includes eukaryotes, BMC Bioinform., 4, 41, <ext-link xlink:href="https://doi.org/10.1186/1471-2105-4-41" ext-link-type="DOI">10.1186/1471-2105-4-41</ext-link>, 2003.</mixed-citation></ref>
      <ref id="bib1.bib44"><label>44</label><mixed-citation>Telling, J., Anesio, A. M., Tranter, M., Irvine-Fynn, T., Hodson, A., Butler, C., and Wadham, J.: Nitrogen fixation on Arctic glaciers, Svalbard, J. Geophys. Res.-Biogeo., 116, G03039, <ext-link xlink:href="https://doi.org/10.1029/2010JG001632" ext-link-type="DOI">10.1029/2010JG001632</ext-link>, 2011.</mixed-citation></ref>
      <ref id="bib1.bib45"><label>45</label><mixed-citation>Tremblay, J., Singh, K., Fern, A., Kirton, E. S., He, S., Woyke, T., Lee, J., Chen, F., Dangl, J. L., and Tringe, S. G.: Primer and platform effects on 16S rRNA tag sequencing, Front. Microbiol., 6, 00771, <ext-link xlink:href="https://doi.org/10.3389/fmicb.2015.00771" ext-link-type="DOI">10.3389/fmicb.2015.00771</ext-link>, 2015.</mixed-citation></ref>
      <ref id="bib1.bib46"><label>46</label><mixed-citation>Trotsenko, Y. A. and Murrell, J. C.: Metabolic aspects of aerobic obligate methanotrophy, Adv. Appl. Microbiol., 63, 183–229, <ext-link xlink:href="https://doi.org/10.1016/S0065-2164(07)00005-6" ext-link-type="DOI">10.1016/S0065-2164(07)00005-6</ext-link>, 2008.</mixed-citation></ref>
      <ref id="bib1.bib47"><label>47</label><mixed-citation>Wu, Y. W., Simmons, B. A., and Singer, S. W.: MaxBin 2.0: an automated binning algorithm to recover genomes from multiple metagenomic datasets, Bioinformatics, 32, 605–607, <ext-link xlink:href="https://doi.org/10.1093/bioinformatics/btv638" ext-link-type="DOI">10.1093/bioinformatics/btv638</ext-link>, 2016.</mixed-citation></ref>
      <ref id="bib1.bib48"><label>48</label><mixed-citation>Zerillo, M. M., Adhikari, B. N., Hamilton, J. P., Buell, C. R., Levesque, C. A., and Tisserat, N.: Carbohydrate-Active Enzymes in Pythium and their role in plant cell wall and storage polysaccharide degradation, Plos One, 8, 0072572, <ext-link xlink:href="https://doi.org/10.1371/journal.pone.0072572" ext-link-type="DOI">10.1371/journal.pone.0072572</ext-link>, 2013.</mixed-citation></ref>
      <ref id="bib1.bib49"><label>49</label><mixed-citation>Zhang, S., Karthikeyan, R., and Fernando, S. D.: Low-temperature biological activation of methane: structure, function and molecular interactions of soluble and particulate methane monooxygenases, Rev. Environ. Sci. Biotechnol., 16, 611–623, <ext-link xlink:href="https://doi.org/10.1007/s11157-017-9447-9" ext-link-type="DOI">10.1007/s11157-017-9447-9</ext-link>, 2017.</mixed-citation></ref>
      <ref id="bib1.bib50"><label>50</label><mixed-citation>Zhang, Y. L., Kang, S. C., Wei, D., Luo, X., Wang, Z. Z., and Gao, T. G.: Sink or source? Methane and carbon dioxide emissions from cryoconite holes, subglacial sediments, and proglacial river runoff during intensive glacier melting on the Tibetan Plateau, Fundam. Res., 1, 232–239, <ext-link xlink:href="https://doi.org/10.1016/j.fmre.2021.04.005" ext-link-type="DOI">10.1016/j.fmre.2021.04.005</ext-link>, 2021.</mixed-citation></ref>

  </ref-list></back>
    <!--<article-title-html>A database of glacier prokaryotic genomes  and genes for the Three Poles</article-title-html>
<abstract-html/>
<ref-html id="bib1.bib1"><label>1</label><mixed-citation>
      
Alcock, B. P., Raphenya, A. R., Lau, T. T. Y., Tsang, K. K., Bouchard, M.,
Edalatmand, A., Huynh, W., Nguyen, A. V., Cheng, A. A., Liu, S., Min, S. Y.,
Miroshnichenko, A., Tran, H. K., Werfalli, R. E., Nasir, J. A., Oloni, M.,
Speicher, D. J., Florescu, A., Singh, B., Faltyn, M., Hernandez-Koutoucheva,
A., Sharma, A. N., Bordeleau, E., Pawlowski, A. C., Zubyk, H. L., Dooley,
D., Griffiths, E., Maguire, F., Winsor, G. L., Beiko, R. G., Brinkman, F. S.
L., Hsiao, W. W. L., Domselaar, G. V., and McArthur, A. G.: CARD 2020:
antibiotic resistome surveillance with the comprehensive antibiotic
resistance database, Nucleic Acids Res., 48, D517–D525,
<a href="https://doi.org/10.1093/nar/gkz935" target="_blank">https://doi.org/10.1093/nar/gkz935</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib2"><label>2</label><mixed-citation>
      
Anderson, M. J.: Permutational Multivariate Analysis of Variance
(PERMANOVA), Wiley StatsRef: Statistics Reference Online, <a href="https://doi.org/10.1002/9781118445112.stat07841" target="_blank">https://doi.org/10.1002/9781118445112.stat07841</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib3"><label>3</label><mixed-citation>
      
Anesio, A. M. and Laybourn-Parry, J.: Glaciers and ice sheets as a biome,
Trends Ecol. Evol., 27, 219–225, <a href="https://doi.org/10.1016/j.tree.2011.09.012" target="_blank">https://doi.org/10.1016/j.tree.2011.09.012</a>,
2012.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib4"><label>4</label><mixed-citation>
      
Anesio, A. M., Lutz, S., Chrismas, N. A. M., and Benning, L. G.: The microbiome of glaciers and ice sheets, NPJ Biofilms Microbi., 3, 10, <a href="https://doi.org/10.1038/s41522-017-0019-0" target="_blank">https://doi.org/10.1038/s41522-017-0019-0</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib5"><label>5</label><mixed-citation>
      
Boetius, A., Anesio, A. M., Deming, J. W., Mikucki, J. A., and Rapp, J. Z.:
Microbial ecology of the cryosphere: sea ice and glacial habitats, Nat. Rev.
Microbiol., 13, 677–690, <a href="https://doi.org/10.1038/nrmicro3522" target="_blank">https://doi.org/10.1038/nrmicro3522</a>, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib6"><label>6</label><mixed-citation>
      
Bowers, R. M., Kyrpides, N. C., Stepanauskas, R., Harmon-Smith, M., Doud,
D., Reddy, T. B. K., Schulz, F., Jarett, J., Rivers, A. R., Eloe-Fadrosh, E.
A., Tringe, S. G., Ivanova, N. N., Copeland, A., Clum, A., Becraft, E. D.,
Malmstrom, R. R., Birren, B., Podar, M., Bork, P., Weinstock, G. M.,
Garrity, G. M., Dodsworth, J. A., Yooseph, S., Sutton, G., Glöckner, F.
O., Gilbert, J. A., Nelson, W. C., Hallam, S. J., Jungbluth, S. P., Ettema,
T. J. G., Tighe, S., Konstantinidis, K. T., Liu, W. T., Baker, B. J.,
Rattei, T., Eisen, J. A., Hedlund, B., McMahon, K. D., Fierer, N., Knight,
R., Finn, R., Cochrane, G., Karsch-Mizrachi, I., Tyson, G. W., Rinke, C.,
Lapidus, A., Meyer, F., Yilmaz, P., Parks, D. H., Eren, A. M., Schriml, L.,
Banfield, J. F., Hugenholtz, P., and Woyke, T.: Minimum information about a
single amplified genome (MISAG) and a metagenome-assembled genome (MIMAG) of
bacteria and archaea, Nat. Biotechnol., 35, 725–731,
<a href="https://doi.org/10.1038/nbt.3893" target="_blank">https://doi.org/10.1038/nbt.3893</a>, 2017a.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib7"><label>7</label><mixed-citation>
      
Bowers, R. M., Kyrpides, N. C., Stepanauskas, R., Harmon-Smith, M., Doud,
D., Reddy, T. B. K., Schulz, F., Jarett, J., Rivers, A. R., Eloe-Fadrosh, E.
A., Tringe, S. G., Ivanova, N. N., Copeland, A., Clum, A., Becraft, E. D.,
Malmstrom, R. R., Birren, B., Podar, M., Bork, P., Weinstock, G. M.,
Garrity, G. M., Dodsworth, J. A., Yooseph, S., Sutton, G., Glöckner, F.
O., Gilbert, J. A., Nelson, W. C., Hallam, S. J., Jungbluth, S. P., Ettema,
T. J. G., Tighe, S., Konstantinidis, K. T., Liu, W.-T., Baker, B. J.,
Rattei, T., Eisen, J. A., Hedlund, B., McMahon, K. D., Fierer, N., Knight,
R., Finn, R., Cochrane, G., Karsch-Mizrachi, I., Tyson, G. W., Rinke, C.,
Kyrpides, N. C., Schriml, L., Garrity, G. M., Hugenholtz, P., Sutton, G.,
Yilmaz, P., Meyer, F., Glöckner, F. O., Gilbert, J. A., Knight, R.,
Finn, R., Cochrane, G., Karsch-Mizrachi, I., Lapidus, A., Meyer, F., Yilmaz,
P., Parks, D. H., Murat Eren, A., Schriml, L., Banfield, J. F., Hugenholtz,
P., Woyke, T., and The Genome Standards, C.: Minimum information about a
single amplified genome (MISAG) and a metagenome-assembled genome (MIMAG) of
bacteria and archaea, Nat. Biotechnol., 35, 725–731,
<a href="https://doi.org/10.1038/nbt.3893" target="_blank">https://doi.org/10.1038/nbt.3893</a>, 2017b.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib8"><label>8</label><mixed-citation>
      
Buchfink, B., Reuter, K., and Drost, H. G.: Sensitive protein alignments at
tree-of-life scale using DIAMOND, Nat. Methods, 18, 366–368,
<a href="https://doi.org/10.1038/s41592-021-01101-x" target="_blank">https://doi.org/10.1038/s41592-021-01101-x</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib9"><label>9</label><mixed-citation>
      
Cameron, K. A., Hodson, A. J., and Osborn, A. M.: Carbon and nitrogen
biogeochemical cycling potentials of supraglacial cryoconite communities,
Polar Biol., 35, 1375–1393, <a href="https://doi.org/10.1007/s00300-012-1178-3" target="_blank">https://doi.org/10.1007/s00300-012-1178-3</a>, 2012.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib10"><label>10</label><mixed-citation>
      
Cauvy-Fraunié, S. and Dangles, O.: A global synthesis of biodiversity
responses to glacier retreat, Nat. Ecol. Evol., 3, 1675–1685,
<a href="https://doi.org/10.1038/s41559-019-1042-8" target="_blank">https://doi.org/10.1038/s41559-019-1042-8</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib11"><label>11</label><mixed-citation>
      
Chaumeil, P. A., Mussig, A. J., Hugenholtz, P., and Parks, D. H.: GTDB-Tk: a
toolkit to classify genomes with the Genome Taxonomy Database,
Bioinformatics, 36, 1925–1927,
<a href="https://doi.org/10.1093/bioinformatics/btz848" target="_blank">https://doi.org/10.1093/bioinformatics/btz848</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib12"><label>12</label><mixed-citation>
      
Ciccazzo, S., Esposito, A., Borruso, L., and Brusetti, L.: Microbial
communities and primary succession in high altitude mountain environments,
Ann. Microbiol., 66, 43–60, <a href="https://doi.org/10.1007/s13213-015-1130-1" target="_blank">https://doi.org/10.1007/s13213-015-1130-1</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib13"><label>13</label><mixed-citation>
      
Cook, J., Edwards, A., Takeuchi, N., and Irvine-Fynn, T.: Cryoconite: The
dark biological secret of the cryosphere, Prog. Phys. Geogr., 40, 66–111,
<a href="https://doi.org/10.1177/0309133315616574" target="_blank">https://doi.org/10.1177/0309133315616574</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib14"><label>14</label><mixed-citation>
      
Delgado-Baquerizo, M., Oliverio, A. M., Brewer, T. E., Benavent-Gonzalez,
A., Eldridge, D. J., Bardgett, R. D., Maestre, F. T., Singh, B. K., and
Fierer, N.: A global atlas of the dominant bacteria found in soil, Science,
359, 320–325, <a href="https://doi.org/10.1126/science.aap9516" target="_blank">https://doi.org/10.1126/science.aap9516</a>, 2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib15"><label>15</label><mixed-citation>
      
Edgar, R. C.: Search and clustering orders of magnitude faster than BLAST,
Bioinformatics, 26, 2460–2461,
<a href="https://doi.org/10.1093/bioinformatics/btq461" target="_blank">https://doi.org/10.1093/bioinformatics/btq461</a>, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib16"><label>16</label><mixed-citation>
      
Fredriksson, N. J., Hermansson, M., and Wilén, B. M.: The Choice of PCR Primers
Has Great Impact on Assessments of Bacterial Community Diversity and
Dynamics in a Wastewater Treatment Plant, Plos One, 8, e76431,
<a href="https://doi.org/10.1371/journal.pone.0076431" target="_blank">https://doi.org/10.1371/journal.pone.0076431</a>, 2013.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib17"><label>17</label><mixed-citation>
      
Guo, B. X., Liu, Y. Q., Liu, K. S., Shi, Q., He, C., Cai, R. H., and Jiao,
N. Z.: Different dissolved organic matter composition between central and
southern glaciers on the Tibetan Plateau, Ecol. Indic., 139, 108888,
<a href="https://doi.org/10.1016/j.ecolind.2022.108888" target="_blank">https://doi.org/10.1016/j.ecolind.2022.108888</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib18"><label>18</label><mixed-citation>
      
Hood, E., Battin, T. J., Fellman, J., O'Neel, S., and Spencer, R. G. M.:
Storage and release of organic carbon from glaciers and ice sheets, Nat.
Geosci., 8, 91–96, <a href="https://doi.org/10.1038/ngeo2331" target="_blank">https://doi.org/10.1038/ngeo2331</a>, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib19"><label>19</label><mixed-citation>
      
Hotaling, S., Finn, D. S., Giersch, J. J., Weisrock, D. W., and Jacobsen, D.: Climate change and alpine stream biology: progress, challenges, and opportunities for the future, Biol. Rev. Camb. Philos. Soc., 92, 2024–2045, <a href="https://doi.org/10.1111/brv.12319" target="_blank">https://doi.org/10.1111/brv.12319</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib20"><label>20</label><mixed-citation>
      
Huerta-Cepas, J., Forslund, K., Coelho, L. P., Szklarczyk, D., Jensen, L.
J., von Mering, C., and Bork, P.: Fast genome-wide functional annotation
through orthology assignment by eggNOG-Mapper, Mol. Biol. Evol., 34,
2115–2122, <a href="https://doi.org/10.1093/molbev/msx148" target="_blank">https://doi.org/10.1093/molbev/msx148</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib21"><label>21</label><mixed-citation>
      
Huerta-Cepas, J., Szklarczyk, D., Heller, D., Hernández-Plaza, A.,
Forslund, S. K., Cook, H., Mende, D. R., Letunic, I., Rattei, T., Jensen, L.
J., von Mering, C., and Bork, P.: eggNOG 5.0: a hierarchical, functionally
and phylogenetically annotated orthology resource based on 5090 organisms
and 2502 viruses, Nucleic Acids Res., 47, D309–D314,
<a href="https://doi.org/10.1093/nar/gky1085" target="_blank">https://doi.org/10.1093/nar/gky1085</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib22"><label>22</label><mixed-citation>
      
Hyatt, D., Chen, G. L., Locascio, P. F., Land, M. L., Larimer, F. W., and
Hauser, L. J.: Prodigal: prokaryotic gene recognition and translation
initiation site identification, BMC Bioinform., 11, 119,
<a href="https://doi.org/10.1186/1471-2105-11-119" target="_blank">https://doi.org/10.1186/1471-2105-11-119</a>, 2010.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib23"><label>23</label><mixed-citation>
      
Ji, M.: OTU tables with and without subsampling, figshare [data set], <a href="https://doi.org/10.6084/m9.figshare.28423781.v2" target="_blank">https://doi.org/10.6084/m9.figshare.28423781.v2</a>, 2025.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib24"><label>24</label><mixed-citation>
      
Jia, B., Raphenya, A. R., Alcock, B., Waglechner, N., Guo, P., Tsang, K. K.,
Lago, B. A., Dave, B. M., Pereira, S., Sharma, A. N., Doshi, S., Courtot,
M., Lo, R., Williams, L. E., Frye, J. G., Elsayegh, T., Sardar, D., Westman,
E. L., Pawlowski, A. C., Johnson, T. A., Brinkman, F. S., Wright, G. D., and
McArthur, A. G.: CARD 2017: expansion and model-centric curation of the
comprehensive antibiotic resistance database, Nucleic Acids Res., 45,
D566–D573, <a href="https://doi.org/10.1093/nar/gkw1004" target="_blank">https://doi.org/10.1093/nar/gkw1004</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib25"><label>25</label><mixed-citation>
      
Kanehisa, M.,
Furumichi, M., Tanabe, M., Sato, Y., and Morishima, K.: KEGG: new
perspectives on genomes, pathways, diseases and drugs, Nucleic Acids Res.,
45, D353–D361, <a href="https://doi.org/10.1093/nar/gkw1092" target="_blank">https://doi.org/10.1093/nar/gkw1092</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib26"><label>26</label><mixed-citation>
      
Kang, D. D., Li, F., Kirton, E., Thomas, A., Egan, R., An, H., and Wang, Z.:
MetaBAT 2: an adaptive binning algorithm for robust and efficient genome
reconstruction from metagenome assemblies, PeerJ, 7, e7359,
<a href="https://doi.org/10.7717/peerj.7359" target="_blank">https://doi.org/10.7717/peerj.7359</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib27"><label>27</label><mixed-citation>
      
Levasseur, A., Drula, E., Lombard, V., Coutinho, P. M., and Henrissat, B.:
Expansion of the enzymatic repertoire of the CAZy database to integrate
auxiliary redox enzymes, Biotechnol. Biofuels, 6, 41,
<a href="https://doi.org/10.1186/1754-6834-6-41" target="_blank">https://doi.org/10.1186/1754-6834-6-41</a>, 2013.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib28"><label>28</label><mixed-citation>
      
Liu, B., Zheng, D., Jin, Q., Chen, L., and Yang, J.: VFDB 2019: a
comparative pathogenomic platform with an interactive web interface, Nucleic
Acids Res., 47, D687–D692, <a href="https://doi.org/10.1093/nar/gky1080" target="_blank">https://doi.org/10.1093/nar/gky1080</a>, 2019.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib29"><label>29</label><mixed-citation>
      
Liu, Y., Ji, M., Yu, T., Zaugg, J., Anesio, A. M., Zhang, Z., Hu, S.,
Hugenholtz, P., Liu, K., and Liu, P.: A genome and gene catalog of glacier
microbiomes, Nat. Biotechnol., 40, 1341–1348,
<a href="https://doi.org/10.1038/s41587-022-01367-2" target="_blank">https://doi.org/10.1038/s41587-022-01367-2</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib30"><label>30</label><mixed-citation>
      
Liu, Y., Hu, S., Yu, T., Luo, Y., Zhang, Z., Chen, Y., Guo, S., S, Q., Fan,
G., Wu, L., Ma, J., Liu, K., Liu, P., Liu, J., and Ji, M.: A database of glacier
microbiomes for the Three Poles, National Tibetan Plateau Data Center, National Tibetan Plateau Data Center [data set],
<a href="https://doi.org/10.11888/Cryos.tpdc.300830" target="_blank">https://doi.org/10.11888/Cryos.tpdc.300830</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib31"><label>31</label><mixed-citation>
      
Mao, G., Ji, M., Jiao, N., Su, J., Zhang, Z., Liu, K., Chen, Y., and Liu, Y.:
Monsoon affects the distribution of antibiotic resistome in Tibetan
glaciers, Environ. Pollut., 317, 120809,
<a href="https://doi.org/10.1016/j.envpol.2022.120809" target="_blank">https://doi.org/10.1016/j.envpol.2022.120809</a>, 2023.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib32"><label>32</label><mixed-citation>
      
Mogrovejo-Arias, D. C., Brill, F. H. H., and Wagner, D.: Potentially
pathogenic bacteria isolated from diverse habitats in Spitsbergen, Svalbard,
Environ. Earth Sci., 79, 109, <a href="https://doi.org/10.1007/s12665-020-8853-4" target="_blank">https://doi.org/10.1007/s12665-020-8853-4</a>,
2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib33"><label>33</label><mixed-citation>
      
Nissen, J. N., Johansen, J., Allesøe, R. L., Sønderby, C. K.,
Armenteros, J. J. A., Grønbech, C. H., Jensen, L. J., Nielsen, H. B.,
Petersen, T. N., Winther, O., and Rasmussen, S.: Improved metagenome binning
and assembly using deep variational autoencoders, Nat. Biotechnol., 39,
555–560, <a href="https://doi.org/10.1038/s41587-020-00777-4" target="_blank">https://doi.org/10.1038/s41587-020-00777-4</a>, 2021.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib34"><label>34</label><mixed-citation>
      
Ogle, D. H., Doll, J. C., Wheeler, P., and Dinno, A.: FSA: Fisheries Stock
Analysis [code], <a href="https://doi.org/10.32614/CRAN.package.FSA" target="_blank">https://doi.org/10.32614/CRAN.package.FSA</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib35"><label>35</label><mixed-citation>
      
Parks, D. H., Rinke, C., Chuvochina, M., Chaumeil, P. A., Woodcroft, B. J.,
Evans, P. N., Hugenholtz, P., and Tyson, G. W.: Recovery of nearly 8,000
metagenome-assembled genomes substantially expands the tree of life, Nat.
Microbiol., 2, 1533–1542, <a href="https://doi.org/10.1038/s41564-017-0012-7" target="_blank">https://doi.org/10.1038/s41564-017-0012-7</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib36"><label>36</label><mixed-citation>
      
Qiu, J.: China: The thrid pole, Nature, 454, 393–396,
<a href="https://doi.org/10.1038/454393a" target="_blank">https://doi.org/10.1038/454393a</a>, 2008.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib37"><label>37</label><mixed-citation>
      
Quast, C., Pruesse, E., Yilmaz, P., Gerken, J., Schweer, T., Yarza, P.,
Peplies, J., and Glöckner, F. O.: The SILVA ribosomal RNA gene database
project: improved data processing and web-based tools, Nucleic Acids Res.,
41, D590–D596, <a href="https://doi.org/10.1093/nar/gks1219" target="_blank">https://doi.org/10.1093/nar/gks1219</a>, 2012.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib38"><label>38</label><mixed-citation>
      
Segawa, T. K., Ushida, K., Agata, K., Okada, N., and Kohshima, S.: Seasonal change in bacterial flora and biomass in mountain snow from the Tateyama mountains, Japan, analyzed by 16S rRNA gene sequencing and real-time PCR, Appl. Environ. Microbiol., 71, 123–130, <a href="https://doi.org/10.1128/AEM.71.1.123-130.2005" target="_blank">https://doi.org/10.1128/AEM.71.1.123-130.2005</a>, 2005.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib39"><label>39</label><mixed-citation>
      
Steinegger, M. and Söding, J.: MMseqs2 enables sensitive protein
sequence searching for the analysis of massive data sets, Nat. Biotechnol.,
35, 1026–1028, <a href="https://doi.org/10.1038/nbt.3988" target="_blank">https://doi.org/10.1038/nbt.3988</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib40"><label>40</label><mixed-citation>
      
Stevens, I. T., Irvine-Fynn, T. D. L., Edwards, A., Mitchell, A. C., Cook,
J. M., Porter, P. R., Holt, T. O., Huss, M., Fettweis, X., Moorman, B. J.,
Sattler, B., and Hodson, A. J.: Spatially consistent microbial biomass and
future cellular carbon release from melting Northern Hemisphere glacier
surfaces, Commun. Earth Environ., 3, 275,
<a href="https://doi.org/10.1038/s43247-022-00609-0" target="_blank">https://doi.org/10.1038/s43247-022-00609-0</a>, 2022.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib41"><label>41</label><mixed-citation>
      
Stibal, M., Bradley, J. A., Edwards, A., Hotaling, S., Zawierucha, K.,
Rosvold, J., Lutz, S., Cameron, K. A., Mikucki, J. A., Kohler, T. J.,
Sabacka, M., and Anesio, A. M.: Glacial ecosystems are essential to
understanding biodiversity responses to glacier retreat, Nat. Ecol. Evol.,
4, 686–687, <a href="https://doi.org/10.1038/s41559-020-1163-0" target="_blank">https://doi.org/10.1038/s41559-020-1163-0</a>, 2020.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib42"><label>42</label><mixed-citation>
      
Taheran, M., Naghdi, M., Brar, S. K., Verma, M., and Surampalli, R. Y.:
Emerging contaminants: Here today, there tomorrow!, Environ. Nanotechnol.
Monit. Manag., 10, 122–126, <a href="https://doi.org/10.1016/j.enmm.2018.05.010" target="_blank">https://doi.org/10.1016/j.enmm.2018.05.010</a>,
2018.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib43"><label>43</label><mixed-citation>
      
Tatusov, R. L., Fedorova, N. D., Jackson, J. D., Jacobs, A. R., Kiryutin,
B., Koonin, E. V., Krylov, D. M., Mazumder, R., Mekhedov, S. L., Nikolskaya,
A. N., Rao, B. S., Smirnov, S., Sverdlov, A. V., Vasudevan, S., Wolf, Y. I.,
Yin, J. J., and Natale, D. A.: The COG database: an updated version includes
eukaryotes, BMC Bioinform., 4, 41, <a href="https://doi.org/10.1186/1471-2105-4-41" target="_blank">https://doi.org/10.1186/1471-2105-4-41</a>,
2003.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib44"><label>44</label><mixed-citation>
      
Telling, J., Anesio, A. M., Tranter, M., Irvine-Fynn, T., Hodson, A.,
Butler, C., and Wadham, J.: Nitrogen fixation on Arctic glaciers, Svalbard,
J. Geophys. Res.-Biogeo., 116, G03039,
<a href="https://doi.org/10.1029/2010JG001632" target="_blank">https://doi.org/10.1029/2010JG001632</a>, 2011.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib45"><label>45</label><mixed-citation>
      
Tremblay, J., Singh, K., Fern, A., Kirton, E. S., He, S., Woyke, T., Lee, J., Chen,
F., Dangl, J. L., and Tringe, S. G.: Primer and platform effects on 16S rRNA tag
sequencing, Front. Microbiol., 6, 00771,
<a href="https://doi.org/10.3389/fmicb.2015.00771" target="_blank">https://doi.org/10.3389/fmicb.2015.00771</a>, 2015.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib46"><label>46</label><mixed-citation>
      
Trotsenko, Y. A. and Murrell, J. C.: Metabolic aspects of aerobic obligate
methanotrophy, Adv. Appl. Microbiol., 63, 183–229, <a href="https://doi.org/10.1016/S0065-2164(07)00005-6" target="_blank">https://doi.org/10.1016/S0065-2164(07)00005-6</a>, 2008.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib47"><label>47</label><mixed-citation>
      
Wu, Y. W., Simmons, B. A., and Singer,
S. W.: MaxBin 2.0: an automated binning algorithm to recover genomes from
multiple metagenomic datasets, Bioinformatics, 32, 605–607,
<a href="https://doi.org/10.1093/bioinformatics/btv638" target="_blank">https://doi.org/10.1093/bioinformatics/btv638</a>, 2016.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib48"><label>48</label><mixed-citation>
      
Zerillo, M. M., Adhikari, B. N., Hamilton, J. P., Buell, C. R., Levesque, C.
A., and Tisserat, N.: Carbohydrate-Active Enzymes in Pythium and their role
in plant cell wall and storage polysaccharide degradation, Plos One, 8,
0072572, <a href="https://doi.org/10.1371/journal.pone.0072572" target="_blank">https://doi.org/10.1371/journal.pone.0072572</a>, 2013.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib49"><label>49</label><mixed-citation>
      
Zhang, S., Karthikeyan, R., and Fernando, S. D.: Low-temperature biological
activation of methane: structure, function and molecular interactions of
soluble and particulate methane monooxygenases, Rev. Environ. Sci.
Biotechnol., 16, 611–623, <a href="https://doi.org/10.1007/s11157-017-9447-9" target="_blank">https://doi.org/10.1007/s11157-017-9447-9</a>, 2017.

    </mixed-citation></ref-html>
<ref-html id="bib1.bib50"><label>50</label><mixed-citation>
      
Zhang, Y. L., Kang, S. C., Wei, D., Luo, X., Wang, Z. Z., and Gao, T. G.:
Sink or source? Methane and carbon dioxide emissions from cryoconite holes,
subglacial sediments, and proglacial river runoff during intensive glacier
melting on the Tibetan Plateau, Fundam. Res., 1, 232–239,
<a href="https://doi.org/10.1016/j.fmre.2021.04.005" target="_blank">https://doi.org/10.1016/j.fmre.2021.04.005</a>, 2021.

    </mixed-citation></ref-html>--></article>
