<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2022.1095497</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Recovery of metagenome-assembled microbial genomes from a full-scale biogas plant of food waste by pacific biosciences high-fidelity sequencing</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author"><name><surname>Jiang</surname><given-names>Fan</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<xref rid="fn0001" ref-type="author-notes"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1016589/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Li</surname><given-names>Qiang</given-names></name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<xref rid="aff3" ref-type="aff"><sup>3</sup></xref>
<xref rid="fn0001" ref-type="author-notes"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1338367/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Wang</surname><given-names>Sen</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/548029/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Shen</surname><given-names>Ting</given-names></name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<xref rid="aff3" ref-type="aff"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author"><name><surname>Wang</surname><given-names>Hengchao</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/931615/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Wang</surname><given-names>Anqi</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1340681/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Xu</surname><given-names>Dong</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2149996/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Yuan</surname><given-names>Lihua</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2150611/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Lei</surname><given-names>Lihong</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2150021/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Chen</surname><given-names>Rong</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2150025/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Yang</surname><given-names>Boyuan</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2150755/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Deng</surname><given-names>Yu</given-names></name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<xref rid="aff3" ref-type="aff"><sup>3</sup></xref>
<xref rid="c001" ref-type="corresp"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1338380/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Fan</surname><given-names>Wei</given-names></name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<xref rid="c001" ref-type="corresp"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/816487/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Guangdong Laboratory for Lingnan Modern Agriculture (Shenzhen Branch), Genome Analysis Laboratory of the Ministry of Agriculture and Rural Affairs, Agricultural Genomics Institute at Shenzhen, Chinese Academy of Agricultural Sciences</institution>, <addr-line>Shenzhen, Guangdong</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Biogas Institute of Ministry of Agriculture and Rural Affairs</institution>, <addr-line>Chengdu, Sichuan</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>Key Laboratory of Development and Application of Rural Renewable Energy, Ministry of Agriculture and Rural Affairs</institution>, <addr-line>Chengdu, Sichuan</addr-line>, <country>China</country></aff>
<author-notes>
<fn id="fn0002" fn-type="edited-by">
<p>Edited by: Alejandro Gonzalez-Martinez, University of Granada, Spain</p>
</fn>
<fn id="fn0003" fn-type="edited-by">
<p>Reviewed by: Alejandro Rodriguez-Sanchez, University of Granada, Spain; David Correa Galeote, National Autonomous University of Mexico, Mexico</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Yu Deng, <email>dengyu@caas.cn</email>; Wei Fan, <email>fanwei@caas.cn</email></corresp>
<fn id="fn0001" fn-type="equal">
<p><sup>&#x2020;</sup>These authors have contributed equally to this work and share first authorship</p>
</fn>
<fn id="fn0004" fn-type="other">
<p>This article was submitted to Extreme Microbiology, a section of the journal Frontiers in Microbiology</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>09</day>
<month>01</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>13</volume>
<elocation-id>1095497</elocation-id>
<history>
<date date-type="received">
<day>11</day>
<month>11</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>12</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2023 Jiang, Li, Wang, Shen, Wang, Wang, Xu, Yuan, Lei, Chen, Yang, Deng and Fan.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Jiang, Li, Wang, Shen, Wang, Wang, Xu, Yuan, Lei, Chen, Yang, Deng and Fan</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Anaerobic digestion (AD) is important in treating of food waste, and thousands of metagenome-assembled genomes (MAGs) have been constructed for the microbiome in AD. However, due to the limitations of the short-read sequencing and assembly technologies, most of these MAGs are grouped from hundreds of short contigs by binning algorithms, and the errors are easily introduced.</p>
</sec>
<sec>
<title>Results</title>
<p>In this study, we constructed a total of 60 non-redundant microbial genomes from 64.5&#x2009;Gb of PacBio high-fidelity (HiFi) long reads, generated from the digestate samples of a full-scale biogas plant fed with food waste. Of the 60 microbial genomes, all genomes have at least one copy of rRNA operons (16S, 23S, and 5S rRNA), 54 have &#x2265;18 types of standard tRNA genes, and 39 are circular complete genomes. In comparison with the published short-read derived MAGs for AD, we found 23 genomes with average nucleotide identity less than 95% to any known MAGs. Besides, our HiFi-derived genomes have much higher average contig N50 size, slightly higher average genome size and lower contamination. GTDB-Tk classification of these genomes revealed two genomes belonging to novel genus and four genomes belonging to novel species, since their 16S rRNA genes have identities lower than 95 and 97% to any known 16S rRNA genes, respectively. Microbial community analysis based on the these assembled genomes reveals the most predominant phylum was <italic>Thermotogae</italic> (70.5%), followed by <italic>Euryarchaeota</italic> (6.1%), and <italic>Bacteroidetes</italic> (4.7%), and the most predominant bacterial and archaeal genera were <italic>Defluviitoga</italic> (69.1%) and <italic>Methanothrix</italic> (5.4%), respectively. Analysis of the full-length 16S rRNA genes identified from the HiFi reads gave similar microbial compositions to that derived from the 60 assembled genomes.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>High-fidelity sequencing not only generated microbial genomes with obviously improved quality but also recovered a substantial portion of novel genomes missed in previous short-read based studies, and the novel genomes will deepen our understanding of the microbial composition in AD of food waste.</p>
</sec>
</abstract>
<kwd-group>
<kwd>food waste</kwd>
<kwd>metagenome</kwd>
<kwd>PacBio HiFi reads</kwd>
<kwd>full-scale biogas plants</kwd>
<kwd>full-length 16S rRNA genes</kwd>
</kwd-group>
<contract-num rid="cn1">JCYJ20190814163805604</contract-num>
<contract-sponsor id="cn1">Shenzhen Science and Technology Program</contract-sponsor>
<counts>
<fig-count count="6"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="58"/>
<page-count count="13"/>
<word-count count="8741"/>
</counts>
</article-meta>
</front>
<body>
<sec id="sec4" sec-type="intro">
<title>Introduction</title>
<p>In recent years, rapid growth of population and economic activities are producing more and more municipal solid wastes (<xref ref-type="bibr" rid="ref26">Li et al., 2017</xref>). Food waste has caused increasing public concerns, with the global production estimated to be around 1.4 billion tons per year, accounting for 30&#x2013;50% of total municipal solid wastes (<xref ref-type="bibr" rid="ref21">Kiran et al., 2014</xref>; <xref ref-type="bibr" rid="ref53">Wong et al., 2018</xref>; <xref ref-type="bibr" rid="ref54">Wu et al., 2021</xref>). When improperly disposed, food waste releases a lot of foul-smelling odor and leachate due to its high content of volatile solids (85&#x2013;95%) and moisture (66&#x2013;80%; <xref ref-type="bibr" rid="ref20">Kim et al., 2016</xref>; <xref ref-type="bibr" rid="ref15">Fisgativa et al., 2017</xref>; <xref ref-type="bibr" rid="ref56">Zan et al., 2018</xref>). On the other hand, food waste is usually rich in carbohydrates, proteins, lipids, and minerals, which makes it a potential valuable source for production of renewable energy (<xref ref-type="bibr" rid="ref37">Paritosh et al., 2017</xref>; <xref ref-type="bibr" rid="ref2">Antonopoulou et al., 2019</xref>). At the same time, anaerobic digestion (AD) is considered as one of the most cost-effective and eco-friendly technologies for both renewable energy production and waste disposal, and to date has been widely used for treating of food waste (<xref ref-type="bibr" rid="ref55">Xu et al., 2018</xref>; <xref ref-type="bibr" rid="ref16">Garcia-Depraect et al., 2022</xref>; <xref ref-type="bibr" rid="ref58">Zhang S. et al., 2022</xref>).</p>
<p>Anaerobic digestion is performed by a highly complex consortium of bacteria and archaea, and the process includes four sequential metabolic steps of hydrolysis, acidogenesis, acetogenesis, and methanogenesis (<xref ref-type="bibr" rid="ref1">Angenent et al., 2004</xref>; <xref ref-type="bibr" rid="ref18">Hassa et al., 2018</xref>). The first three steps are predominantly fulfilled synergistically by fermentative bacteria, while the last step is carried out by methanogenic archaea (<xref ref-type="bibr" rid="ref44">Schn&#x00FC;rer, 2016</xref>). To investigate the microbial communities in AD, 16S rRNA gene amplicon analysis has been widely used with the development of high-throughput short-read sequencing technologies (<xref ref-type="bibr" rid="ref24">Li et al., 2022</xref>; <xref ref-type="bibr" rid="ref58">Zhang S. et al., 2022</xref>). In recent years, the genome-centric metagenome analysis has been used for investigating the complex microbial communities in AD, and recovered a large number of metagenome-assembled genomes (MAGs; <xref ref-type="bibr" rid="ref49">Treu et al., 2016</xref>; <xref ref-type="bibr" rid="ref7">Campanaro et al., 2018</xref>, <xref ref-type="bibr" rid="ref8">2020</xref>). In 2020, Campanaro et al. constructed 1,401 MAGs from 134 publicly available metagenomes derived from different biogas plants, and then in 2021, Ma et al. constructed 2,426 MAGs from 56 full-scale biogas plants with different feedstocks (<xref ref-type="bibr" rid="ref8">Campanaro et al., 2020</xref>; <xref ref-type="bibr" rid="ref30">Ma et al., 2021</xref>), and these efforts greatly deepen the understanding of microbial communities of AD and provide a huge number of microbial genomes for uncultured microbes in AD.</p>
<p>Genome-centric metagenome analysis have facilitated the recovery of microbial genomes for novel organisms residing in AD microbiomes, such as the members of the archaeal phylum <italic>Bathyarchaeota</italic>, which were proposed to contribute to hydrolysis and subsequent fermentation of organic materials within the process of biogas production (<xref ref-type="bibr" rid="ref13">Evans et al., 2015</xref>; <xref ref-type="bibr" rid="ref34">Maus et al., 2018</xref>). However, due to the technical limitation of short-read sequencing, these assembled genomes often fragmented and with some wrong contigs introduced by binning algorithms, and it will partly limit their applications. Recently, the use of highly accurate HiFi long reads and the related assemblers have greatly improved the assembly quality of MAGs, which even generated hundreds of circular genomes (<xref ref-type="bibr" rid="ref4">Bickhart et al., 2022</xref>; <xref ref-type="bibr" rid="ref14">Feng et al., 2022</xref>). Besides, high proportion of novel genomes were generated, which recovered 89 novel genomes (26% of the total assembled genomes) from the chicken gut microbiomes by using 332&#x2009;Gb of HiFi reads (<xref ref-type="bibr" rid="ref57">Zhang Y. et al., 2022</xref>). In addition, HiFi long reads also enabled the analysis of full-length 16S rRNA genes covering all hypervariable regions, which could provide more accurate taxonomic classification for microorganisms (<xref ref-type="bibr" rid="ref28">Liang et al., 2022</xref>). In this study, we used the HiFi long reads to construct the microbial genomes for microorganisms in AD of food waste, and analyzed the full-length 16S rRNA genes identified from the sequenced long reads to investigate the microbial communities.</p>
</sec>
<sec id="sec5" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="sec6">
<title>Full-scale anaerobic digester of food waste</title>
<p>A full-scale up-flow solid anaerobic digester was selected from a food waste treatment plant in Chengdu, China, which can treat 100 tons of food waste every day. Before entering the digesters, the food waste will undergo a complex process of pretreatment: firstly, after sorting out the impurities such as glass bottles and bowls, the food waste was broken in the pulping machine, and the plastic and woven bags were screened out by the residue liquid separator; secondly, the treated food waste was transported to the sterilization tank for heating, heat preservation (80&#x2013;95&#x00B0;C) and sterilization; finally, three-phase separation was performed, and the residue phase was used to make organic fertilizer, the oil phase was used to extract industrial diesel oil, and only the liquid phase was pumped into the anaerobic digesters to produce biogas. Because the temperature of the liquid phase is high (60&#x2013;70&#x00B0;C) after the three-phase separation, it should be cooled to 40&#x2013;45&#x00B0;C in the buffer tank before entering the digester. At last, the digestate will be discharged after it meets the discharge standard through further water treatment process, and the produced biogas will be used as fuel for pretreating the food waste.</p>
<p>The effective volume of the sampling digester is 3,500&#x2009;m<sup>3</sup>, and the hydraulic retention time of the liquid phase is 37&#x2013;41&#x2009;days, the organic loading rate is 2.48&#x2009;kg chemical oxygen demand (COD) m<sup>&#x2212;3</sup> d<sup>&#x2212;1</sup>. The fermentation temperature is 37&#x00B0;C, the pH of the digestate is 7.3, and the daily gas production is on average 6,000 m<sup>3</sup>. At the day of sampling, the methane, carbon dioxide, and nitrogen contents were 61.1, 36.6, and 2.3% (v/v), respectively. The average concentration of acetate, propionate, and butyrate were 38.7, 18.8, and 20.0&#x2009;mg&#x2009;L<sup>&#x2212;1</sup>, respectively. The average concentration of total ammonium nitrogen was 1,224.7&#x2009;mg&#x2009;L<sup>&#x2212;1</sup>. The other physicochemical characteristics of the fermented digestate and the fed liquid phase from the food waste are shown in <xref ref-type="supplementary-material" rid="SM1">Supplementary Table S1</xref>.</p>
</sec>
<sec id="sec7">
<title>Sample collection</title>
<p>Digestate samples were collected from the sampling valve of the anaerobic digester. Before sampling, the reactor content was stirred and the sampling valve was opened for 5&#x2009;min to flush the sampling valve and tubes. Approximately, 3,000&#x2009;ml of digestate was collected into six sterile, gastight tubes (500&#x2009;ml) and transported to the laboratory immediately. Upon arrival in the laboratory, 1,000&#x2009;ml subsamples were homogenized and centrifuged at 9,000&#x2009;rpm for 30&#x2009;min (at 4&#x00B0;C), and after washing with phosphate buffered saline (pH 7.2) and centrifuging again under the same conditions, the pellet was collected in 50&#x2009;ml sterile tubes and stored at &#x2212;80&#x00B0;C before DNA extraction. Remaining 2,000&#x2009;ml subsamples were stored at &#x2212;20&#x00B0;C before physicochemical analysis. Biogas samples were collected with gas sample bags and stored at room temperature.</p>
</sec>
<sec id="sec8">
<title>Physicochemical analysis</title>
<p>The total solid (TS), total ammonia nitrogen (TAN), chemical oxygen demand (COD), C content, and N content were measured according to APHA Standard Protocols (<xref ref-type="bibr" rid="ref45">Simmons et al., 1998</xref>). Volatile fatty acids (VFAs) were analyzed by a gas chromatography (GC7890, Agilent, United States) with a flame-ionization detector and a capillary column (DB-FFAP 0.25&#x2009;&#x00D7;&#x2009;0.5&#x2009;&#x00D7;&#x2009;30), the initial temperature of column was 80&#x00B0;C, raise it to 180&#x00B0;C at a speed of 28&#x00B0;C s<sup>&#x2212;1</sup>, and keeping 1&#x2009;min, and then, raise it to 220&#x00B0;C at a speed of 40&#x00B0;C s<sup>&#x2212;1</sup> and keeping 1&#x2009;min, the temperature of injection port and detector were 210 and 230&#x00B0;C, respectively. Injection volume was 1&#x2009;&#x03BC;l and split ratio was 1:10. Nitrogen was the carrier gas and the flow rate was 35&#x2009;cm&#x2009;s<sup>&#x2212;1</sup>, the flow rate of hydrogen, air and tail blowing were 30,&#x2009;300, and 38&#x2009;ml&#x2009;min<sup>&#x2212;1</sup>, respectively. VFAs were carried out with external standard method. The biogas composition was analyzed by a gas chromatography (GC7820A, Agilent, United States) with a thermal-conductivity detector and stainless steel column (1/8&#x2009;&#x00D7;&#x2009;3&#x2009;m) packed with supporter (Porapak Q), hydrogen as the carrier gas and the flow rate was 27&#x2009;ml&#x2009;min<sup>&#x2212;1</sup>, and temperatures for the column, injection port, and detector were 65, 120, and 130&#x00B0;C, respectively. Gas content was quantified with the area normalization method. pH values were measured with pH meters (AS ONE AS600, Japan).</p>
</sec>
<sec id="sec9">
<title>DNA extraction, library preparation, and sequencing</title>
<p>Genomic DNA from the sample was extracted using DNeasy PowerSoil Pro kit (ref. 47014; QIAGEN, Germany) according to the manufacturer&#x2019;s instructions. The integrity of extracted DNA was checked on 0.8% (w/v) agarose gel with GelRed nucleic acid gel stain (cat. no. 41003; Biotium, United States). The purity and quantity of the extracted DNA was assessed using Nanodrop 2000 (Thermo Fisher Scientific, United States) and Qubit 4.0 (Thermo Fisher Scientific, United States). Then, the high integrity (with obvious concentrated electrophoresis band &#x003E;15&#x2009;Kb in size) and quality (A260/280 1.8&#x2013;2.0, dsDNA concentration&#x2009;&#x003E;&#x2009;100&#x2009;ng&#x2009;&#x03BC;l<sup>&#x2212;1</sup>) DNA samples were used for library construction. For Pacific Biosciences (PacBio) Hifi sequencing, the DNA samples were fragmented into 15&#x2013;20&#x2009;Kb insets using g-TUBEs (Covaris, United States), and the sequencing library was constructed using SMRTbell Express Template Prep Kit 2.0 (PacBio, United States). Then, three SMRT cells of high-fidelity long reads were generated on PacBio Sequel II system with Circular Consensus Sequence (CCS) mode (PacBio, United States).</p>
</sec>
<sec id="sec10">
<title>Metagenome assembly and binning</title>
<p>The raw HiFi sequencing reads were filtered by requiring a read length over 1&#x2009;Kb and an average read accuracy over 99%, which resulted in a total of 64.6&#x2009;Gb of high-quality reads from all three SMRT cells. To improve the assembly for less abundant species, all reads were pooled together for co-assembly. Then, Hifiasm-meta r058 (<xref ref-type="bibr" rid="ref14">Feng et al., 2022</xref>) was used to assemble all HiFi reads into contigs with parameter &#x201C;--force-preovec.&#x201D; By viewing the contig linkages from the resulted GFA files with Bandage v0.8.1 (<xref ref-type="bibr" rid="ref52">Wick et al., 2015</xref>), we observed that most of the assembled contigs can be divided into three types (<xref rid="fig1" ref-type="fig">Figure 1A</xref>): (1) circular contig, one single contig with head and tail concatenated; (2) tangled &#x201C;circular&#x201D; contigs, many linear contigs linked into a big circular or other complex structure; and (3) linear contig, one single contig with no link to other contigs. Then, the circular contigs were left alone, and each tangled &#x201C;circle&#x201D; was re-assembled by Hifiasm-meta r058 (<xref ref-type="bibr" rid="ref14">Feng et al., 2022</xref>) with default parameters, using the fragmental contigs that constructed the &#x201C;circle&#x201D; as input reads, and resulted seven extra circular contigs. Finally, we obtained a total of 292 circular contigs, including 47 circular contigs with contig length longer than 1&#x2009;Mb. In addition, plasmid and viral genomes were identified using viralVerify v1.1<xref rid="fn0005" ref-type="fn"><sup>1</sup></xref> with parameter &#x201C;--hmm nbc_hmms.hmm&#x201D; from these circular contigs.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Overview of metagenome assembly. <bold>(A)</bold> Graphic display of the assembled contigs. The graph is drawn by Bandage, and the colors for different contigs are randomly assigned by the software. The line length is in proportion to contig length, and the line width is in proportion to contig coverage depth. Based on the structure of different contigs or contig groups, the contigs were divided into three types, circular contigs, tangled circular contigs, and linear contigs, and some examples were labeled in the figure. Circular contig, one single contig with head and tail concatenated; tangled circular contigs, many linear contigs link to each other and form a big circular or other complex structure; linear contig, one single contig with no link to other contigs. <bold>(B)</bold> Length distribution of circular contigs. <bold>(C)</bold> Relationship plot of completeness with contig length for all circular contigs. Completeness value of circular contigs was estimated using CheckM.</p>
</caption>
<graphic xlink:href="fmicb-13-1095497-g001.tif"/>
</fig>
<p>To group the separate linear contigs into metagenome-assembled genomes (MAGs), a binning algorithm MetaBAT2 v2.12.1 (<xref ref-type="bibr" rid="ref19">Kang et al., 2019</xref>) was used, with removing all circular and tangled &#x201C;circular&#x201D; contigs from the assembled results. MetaBAT2 was used with parameter &#x201C;-minContig 2000,&#x201D; which resulted in a total of 28 non-circular MAGs.</p>
<p>The completeness (Cp) and contamination (Ct) of all circular contigs and non-circular MAGs were estimated using the &#x201C;Lineage_wf&#x201D; workflow of CheckM v1.07 (<xref ref-type="bibr" rid="ref39">Parks et al., 2015</xref>) with options &#x201C;lineage_wf-t 20-x fa.&#x201D; According to these results, the microbial genome assemblies with three quality ranks were adopted: near complete (Cp&#x2009;&#x2265;&#x2009;90% and Ct&#x2009;&#x003C;&#x2009;5%), high quality (Cp&#x2009;&#x2265;&#x2009;70% and Ct&#x2009;&#x003C;&#x2009;10%), and medium quality (Cp&#x2009;&#x2265;&#x2009;50% and Ct&#x2009;&#x003C;&#x2009;10%), including a total of 47 circular contigs and 28 non-circular MAGs.</p>
</sec>
<sec id="sec11">
<title>Construction of non-redundant microbial genome assemblies</title>
<p>De-replication of all filtered microbial genome assemblies (near-complete, high-quality, and medium-quality) were performed using Mash v2.2 (<xref ref-type="bibr" rid="ref36">Ondov et al., 2016</xref>) on the entire genome sequences with very permissive parameters &#x201C;dist-d 0.05&#x201D; (<xref ref-type="bibr" rid="ref8">Campanaro et al., 2020</xref>), which could cluster these genomes into different groups. To determine the representative genome for each group, a more precise analysis was performed applying the genome-wide average nucleotide identity (ANI; <xref ref-type="bibr" rid="ref50">Varghese et al., 2015</xref>). When two genomes showed ANI value &#x2265;95% and genome coverage &#x2265;50% for both of them, they were considered to belong to the same species, and the genome with higher CheckM score (Cp&#x2014;5&#x2009;&#x00D7;&#x2009;Ct) was selected and retained. After many runs of comparison and selection, the representative genomes for each group were obtained, and other genomes were taken as redundant and removed. Finally, a total of 60 non-redundant microbial genomes were generated, comprising 39 circular and 21 non-circular genomes.</p>
<p>We used INFERNAL v1.1.2 (<xref ref-type="bibr" rid="ref35">Nawrocki and Eddy, 2013</xref>) with parameters &#x201C;cmscan --rfam --cut_ga --nohmmonly --cpu 10&#x201D; to identify rRNA genes, tRNAscan-SE v2.0.3 (<xref ref-type="bibr" rid="ref9">Chan et al., 2021</xref>) with parameters &#x201C;-G-H&#x201D; to identify tRNA genes. Taxonomic annotation of these genomes was performed using the GTDB-Tk v2.1.0 (<xref ref-type="bibr" rid="ref10">Chaumeil et al., 2019</xref>, <xref ref-type="bibr" rid="ref11">2022</xref>) based on the GTDB database version r207 (<xref ref-type="bibr" rid="ref38">Parks et al., 2022</xref>), with the parameter of &#x201C;classify_wf-x fa.&#x201D; In addition, 16S rRNA genes from each genome were also used for taxonomic annotation, with Ribosomal Database Project (RDP) Classifier v2.11 (<xref ref-type="bibr" rid="ref51">Wang et al., 2007</xref>) to classify the genomes at lower taxonomic ranks, and BLAST alignments to the Silva database version r138 (<xref ref-type="bibr" rid="ref42">Quast et al., 2013</xref>) were further used to validate the novelty of these taxonomic units. The phylogenetic tree of these genomes was constructed using FastTree v2.1.11 (<xref ref-type="bibr" rid="ref40">Price et al., 2010</xref>) based on the 16S rRNA genes that retrieved from these genomes. To calculate the sequencing depth for the non-redundant genomes, high-quality HiFi reads were aligned back to these genomes using Minimap2 v2.20 (<xref ref-type="bibr" rid="ref23">Li, 2018</xref>) with parameters &#x201C;-x map-hifi-a -t 60,&#x201D; and the resulted SAM format files were converted to sorted BAM format files by Samtools v1.3 (<xref ref-type="bibr" rid="ref27">Li et al., 2009</xref>). Then, the depth was calculated using the script jgi_summarize_bam_contig_depths in MetaBAT2 according a previous study (<xref ref-type="bibr" rid="ref14">Feng et al., 2022</xref>).</p>
</sec>
<sec id="sec12">
<title>Diversity analysis</title>
<p>To determine whether the real microbial composition of AD can be recovered from the assembled genomes, a 16S rRNA gene based microbial community analysis was performed. We identified the full-length 16S rRNA genes from high-quality HiFi reads using INFERNAL v1.1.2 (<xref ref-type="bibr" rid="ref35">Nawrocki and Eddy, 2013</xref>) with parameters &#x201C;cmscan --rfam --cut_ga --nohmmonly --cpu 48,&#x201D; and the identified 16S rRNA genes with length&#x2009;&#x003C;&#x2009;1,200 or&#x2009;&#x003E;&#x2009;1,700&#x2009;bp were filtered out. The average base error rate of each 16S rRNA gene was calculated, and the sequences with average accuracy less than 99% (Q20) were removed. As a result, a total of 54,135 16S rRNA genes were identified. Then, the RDP Classifier v2.11 (<xref ref-type="bibr" rid="ref51">Wang et al., 2007</xref>) was used to classify the 16S rRNA genes, and the relative abundance of each taxonomic units was calculated by adjusting the gene copy number for 16S rRNA gene sequences according the database rrnDB v5.8 (<xref ref-type="bibr" rid="ref47">Stoddard et al., 2015</xref>).</p>
</sec>
</sec>
<sec id="sec13">
<title>Results and discussion</title>
<sec id="sec14">
<title>Assembly of 47 complete circular microbial genomes and 118 viral genomes from high-fidelity long reads</title>
<p>To obtain a high-quality metagenome assembly for AD of food waste, a total of 64.6&#x2009;Gb of PacBio HiFi reads were generated from three SMRT cells, with the read N50 size of 14.3&#x2009;Kb and N90 size of 7.3&#x2009;Kb (<xref rid="tab1" ref-type="table">Table 1</xref>), and the average base accuracy of 99.94%. Then, we assembled the HiFi reads into contigs with Hifiasm-meta (<xref ref-type="bibr" rid="ref14">Feng et al., 2022</xref>) and generated a total contig length of 924.9&#x2009;Mb, with the N50 size of 87.7&#x2009;Kb and N90 size of 22.2&#x2009;Kb (<xref rid="tab1" ref-type="table">Table 1</xref>), which were much longer than those assembled from Illumina short reads (<xref ref-type="bibr" rid="ref30">Ma et al., 2021</xref>). By viewing the contig linkages from the resulted GFA file with Bandage (<xref ref-type="bibr" rid="ref52">Wick et al., 2015</xref>), the contigs can be classified into three types of circular contig, tangled &#x201C;circular&#x201D; contigs and linear contig (<xref rid="fig1" ref-type="fig">Figure 1A</xref>), and a tangled structure contains many different strains of one species, while a circular or linear structure represents only one single microbial strain of one species.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Statistics of sequencing reads and assembled contigs.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="middle">Statistics</th>
<th align="center" valign="middle">Sequencing reads</th>
<th align="center" valign="middle">Assembled contigs</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Total number</td>
<td align="center" valign="top">5,833,109</td>
<td align="center" valign="top">17,715</td>
</tr>
<tr>
<td align="left" valign="top">Total length (bp)</td>
<td align="center" valign="top">64,564,585,452</td>
<td align="center" valign="top">924,882,211</td>
</tr>
<tr>
<td align="left" valign="top">Maximum (bp)</td>
<td align="center" valign="top">67,387</td>
<td align="center" valign="top">6,716,598</td>
</tr>
<tr>
<td align="left" valign="top">Minimum (bp)</td>
<td align="center" valign="top">1,000</td>
<td align="center" valign="top">1,390</td>
</tr>
<tr>
<td align="left" valign="top">N50 (bp)</td>
<td align="center" valign="top">14,254</td>
<td align="center" valign="top">87,732</td>
</tr>
<tr>
<td align="left" valign="top">N60 (bp)</td>
<td align="center" valign="top">13,140</td>
<td align="center" valign="top">59,332</td>
</tr>
<tr>
<td align="left" valign="top">N70 (bp)</td>
<td align="center" valign="top">12,074</td>
<td align="center" valign="top">43,546</td>
</tr>
<tr>
<td align="left" valign="top">N80 (bp)</td>
<td align="center" valign="top">10,854</td>
<td align="center" valign="top">32,503</td>
</tr>
<tr>
<td align="left" valign="top">N90 (bp)</td>
<td align="center" valign="top">7,310</td>
<td align="center" valign="top">22,219</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The assembled metagenome contains 292 circular contigs with a total length of 146.0&#x2009;Mb, which accounts for 15.8% of the total assembly length. The length distribution analysis of these circular contigs revealed that 245 contigs (83.9% of total circular contigs) were shorter than 1.0&#x2009;Mb (<xref rid="fig1" ref-type="fig">Figure 1B</xref>), and 228 contigs were even shorter than 100&#x2009;Kb. The other 47 circular contigs ranged from 1.0 to 6.7&#x2009;Mb, and 37 contigs with lengths of 2.0 to 4.0&#x2009;Mb accounted for 69.9% of the total length of circular contigs (<xref rid="fig1" ref-type="fig">Figure 1B</xref>). To determine whether the circular contigs are complete genomes, CheckM analysis was performed using the collocated sets of ubiquitous and single-copy genes within a phylogenetic lineage (<xref ref-type="bibr" rid="ref39">Parks et al., 2015</xref>). The results revealed that the circular contigs longer than 1.0&#x2009;Mb showed an average completeness of 97%, and 38, 6, and 3 of them have completeness &#x003E;95%, 90&#x2013;95%, and&#x2009;&#x003C;&#x2009;90%, respectively (<xref rid="fig1" ref-type="fig">Figure 1C</xref>). However, the completeness of the circular contigs shorter than 1.0&#x2009;Mb was &#x003C;15%, and 243 of them have completeness of 0% (<xref rid="fig1" ref-type="fig">Figure 1C</xref>). Then, viralVerify was used to classify these short circular contigs, and 31, 118, and 92 of them were classified as plasmid, virus, and uncertain, respectively, indicating that most of the short circular contigs were not genomic fragments derived from microbial genomes.</p>
</sec>
<sec id="sec15">
<title>Capacity of the assemblage of HiFi genomes</title>
<p>To construct the reference genomes of microorganisms in AD of food waste, we combined the assembled circular contigs and non-circular MAGs derived from binning algorithm. After removing the redundant and low-quality genomes, a total of 60 non-redundant microbial genomes were generated, including 39 circular microbial genomes and 21 non-circular MAGs (<xref rid="fig2" ref-type="fig">Figure 2A</xref> and <xref ref-type="supplementary-material" rid="SM2">Supplementary Table S2</xref>). Of these 60 genomes, 46 genomes contain only one contigs, six genomes contain 2&#x2013;5 contigs, and only five genomes contain &#x003E;10 contigs (<xref rid="fig2" ref-type="fig">Figure 2B</xref>), which are much superior to the MAGs derived from Illumina short reads (<xref ref-type="bibr" rid="ref8">Campanaro et al., 2020</xref>; <xref ref-type="bibr" rid="ref30">Ma et al., 2021</xref>). Based on the quality assessment by CheckM (<xref ref-type="bibr" rid="ref39">Parks et al., 2015</xref>), 95% of the circular genomes are near-complete, except one genome with Cp&#x2009;&#x003C;&#x2009;90% and one genome with Ct&#x2009;&#x003E;&#x2009;5% (<xref rid="fig2" ref-type="fig">Figure 2C</xref>). However, only 19% of the non-circular MAGs are near-complete (<xref rid="fig2" ref-type="fig">Figure 2C</xref>), mostly due to the relatively low completeness of these genomes (<xref rid="fig2" ref-type="fig">Figure 2A</xref>), and the average genome size of non-circular MAGs (2.65&#x2009;Mb) is smaller than that of circular genomes (2.97&#x2009;Mb; <xref rid="fig2" ref-type="fig">Figure 2D</xref>).</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Statistics and evaluation of assembled microbial genomes. <bold>(A)</bold> CheckM evaluation of assembled microbial genomes. Circular genomes refer to circular contigs, and non-circular MAGs refer to genome assemblies derived from binning algorithms. Genomes are defined as &#x201C;near-complete,&#x201D; if their CheckM completeness values are &#x2265;90% and contamination values are &#x003C;5%, &#x201C;high-quality&#x201D; if completeness &#x2265;70% and contamination &#x003C;10%, or &#x201C;medium-quality&#x201D; if completeness &#x2265;50% and contamination &#x003C;10%. <bold>(B&#x2013;D)</bold> Distribution of contig numbers, CheckM quality values, and genome sizes of assembled microbial genomes. <bold>(E,F)</bold> Distribution of the number of rRNA operons and standard tRNA genes for assembled genomes.</p>
</caption>
<graphic xlink:href="fmicb-13-1095497-g002.tif"/>
</fig>
<p>In bacteria and archaea, the ribosomal RNA (rRNA) operon typically encodes the 16S, 23S, and 5S rRNA genes, and the rRNA operon usually exists in multiple copies, ranging from 1 to 15 in bacteria and 1 to 4 in archaea (<xref ref-type="bibr" rid="ref22">Klappenbach et al., 2001</xref>; <xref ref-type="bibr" rid="ref47">Stoddard et al., 2015</xref>). Transfer RNA (tRNA) genes are randomly distributed in the genome, often with redundant copies. With the advances in sequencing technologies, the presence and completeness of rRNA and tRNA genes are suggested to be an additional metric for assembly quality (<xref ref-type="bibr" rid="ref5">Bowers et al., 2017</xref>). We predicted the rRNA and tRNA genes in the 60 non-redundant genomes, and found that all genomes have at least one copy of rRNA operon and 54 genomes have &#x2265;18 types of standard tRNA genes (<xref rid="fig2" ref-type="fig">Figures 2E</xref>,<xref rid="fig2" ref-type="fig">F</xref>; <xref ref-type="supplementary-material" rid="SM2">Supplementary Table S2</xref>), suggesting that most of our assembled genomes are of high quality. Most genomes (95%) have 1&#x2013;3 rRNA operons (<xref rid="fig2" ref-type="fig">Figure 2E</xref>), and the average rRNA operon copy number of circular genomes (2.1) is comparable to that of non-circular MAGs (2.0). In addition, more types of standard tRNA genes were identified from circular genomes (average number is 20.0) than that from non-circular MAGs (average number is 18.0), and of the 39 circular genomes, 38 have all 20 types of tRNA genes and only one genome has 19 types of tRNA genes (<xref rid="fig2" ref-type="fig">Figure 2F</xref>; <xref ref-type="supplementary-material" rid="SM2">Supplementary Table S2</xref>).</p>
<p>Until now, many studies have constructed MAGs of AD from short-read assembled contigs (<xref ref-type="bibr" rid="ref49">Treu et al., 2016</xref>; <xref ref-type="bibr" rid="ref8">Campanaro et al., 2020</xref>). To assess the novelty and superiority of our metagenome assembled genomes, two large-scale metagenomic studies on AD were chosen for comparison. <xref ref-type="bibr" rid="ref8">Campanaro et al. (2020)</xref> incorporated nearly 0.9&#x2009;Tb of Illumina sequence data from 134 samples that published between 2014 and 2019, which representing a wide range of different biogas reactor systems, and constructed 1,401 MAGs (BinSet1). <xref ref-type="bibr" rid="ref30">Ma et al. (2021)</xref> used 1.8&#x2009;Tb of Illumina sequence data that generated from 56 full-scale biogas plants fed with diverse feedstocks, and constructed 2,426 MAGs (BinSet2). The results showed that 37 of our genomes have matched (ANI&#x2009;&#x2265;&#x2009;95%) MAGs from the BinSet1 or BinSet2, and the remaining 23 genomes were not found in these two researches (ANI&#x2009;&#x003C;&#x2009;95%), including 11 circular genomes and 12 non-circular MAGs (<xref rid="fig3" ref-type="fig">Figure 3A</xref>). Further analysis of the published MAGs with matching relationships to our 37 genomes showed that, the average contig number of our genomes (5) is much less than that of BinSet1 (289) and BinSet2 (166), while the average contig N50 size of our genomes (2,545&#x2009;Kb) is much higher than that of BinSet1 (49&#x2009;Kb) and BinSet2 (123&#x2009;Kb; <xref rid="fig3" ref-type="fig">Figures 3B</xref>,<xref rid="fig3" ref-type="fig">C</xref>). Besides, our 37 genomes have slightly larger average genome sizes and lower average CheckM contamination values than the matching MAGs (<xref rid="fig3" ref-type="fig">Figures 3C</xref>,<xref rid="fig3" ref-type="fig">D</xref>). However, the average CheckM completeness of our 37 genomes (92.8%) was slightly lower than that of the matching MAGs in BinSet1 (94.5%) and BinSet2 (95.6%; <xref rid="fig3" ref-type="fig">Figure 3D</xref>), which may be resulted from the different completeness cutoffs of 50, 70, and 80% used for our genomes, BinSet1, and BinSet2, respectively. The above results indicate obvious superiority of our HiFi assembled microbial genomes over the short-read assembled MAGs.</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Comparison of HiFi assembled microbial genomes to the short-read assembled genomes. <bold>(A)</bold> Statistics of our assembled microbial genomes with matching relationship to the published short-read derived MAGs from anaerobic digestion. If one of our HiFi assembled microbial genome shows ANI value &#x2265;95% to any of the published MAGs, it is supposed to match to the published MAG. Comparison of average contig number <bold>(B)</bold>, assembled genome size and contig N50 size <bold>(C)</bold>, and CheckM quality <bold>(D)</bold> between our HiFi assembled microbial genomes and the corresponded matching MAGs from two published datasets. BinSet1 published by <xref ref-type="bibr" rid="ref8">Campanaro et al. (2020)</xref> contains 1,401 MAGs, and BinSet2 published by <xref ref-type="bibr" rid="ref30">Ma et al. (2021)</xref> contains 2,426 MAGs.</p>
</caption>
<graphic xlink:href="fmicb-13-1095497-g003.tif"/>
</fig>
</sec>
<sec id="sec16">
<title>The phylogeny of the genomes revealing 23 novel genome representations</title>
<p>We performed the taxonomic annotation of the 60 HiFi assembled genomes by using GTDB-Tk based on the GTDB database, which contains 317,542 genomes belonging to 65,703 species (<xref ref-type="bibr" rid="ref11">Chaumeil et al., 2022</xref>; <xref ref-type="bibr" rid="ref38">Parks et al., 2022</xref>). The results showed that only two genomes were classified as archaea (belonging to the phylum <italic>Euryarchaeota</italic>), while the other 58 genomes were all classified as bacteria. At phylum level, half of the 60 genomes were assigned to <italic>Bacteroidetes</italic> (16) and <italic>Firmicutes</italic> (14), followed by <italic>Planctomycetes</italic> (6), <italic>Chloroflexi</italic> (4), and <italic>Synergistota</italic> (3; <xref rid="fig4" ref-type="fig">Figure 4A</xref>). The remaining 17 genomes were classified into 12 phyla, including <italic>Actinobacteria</italic> (2), <italic>Desulfobacterota</italic> (2), <italic>Euryarchaeota</italic> (2), <italic>Thermotogae</italic> (2), <italic>Verrucomicrobia</italic> (2), <italic>Armatimonadota</italic> (1), <italic>Atribacterota</italic> (1), <italic>Cloacimonadota</italic> (1), <italic>Fusobacteriota</italic> (1), <italic>Marinisomatota</italic> (1), <italic>Myxococcota</italic> (1), and <italic>Spirochaetota</italic> (1; <xref rid="fig4" ref-type="fig">Figure 4A</xref>). In summary, the 60 HiFi assembled genomes come from a total of 17 phyla, revealing a high diversity of microbial genomes constructed by HiFi sequencing data.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Phylogeny of the assembled microbial genomes. <bold>(A)</bold> Number of genomes belonged to different phyla<bold>. (B)</bold> Phylogenetic relationship of the assembled genomes. The phylogenetic tree was constructed using the 16S rRNA genes retrieved from all genomes, and the taxonomic annotation of the leaf nodes was performed using GTDB-Tk. The shapes of the leaf nodes correspond to the CheckM quality of the genomes, triangle represents &#x201C;near-complete,&#x201D; rectangle represents &#x201C;high-quality,&#x201D; and diamond represents &#x201C;medium-quality.&#x201D; The colors of the leaf nodes correspond to the taxonomic classification results of GTDB-Tk, &#x201C;green&#x201D; means the leaf node classified to be an existing species in the GTDB database, &#x201C;red&#x201D; and &#x201C;blue&#x201D; means the leaf node unclassified at species and genus level, respectively. Genome ids with prefix &#x201C;Cir&#x201D; represent circular genomes, and prefix &#x201C;Bin&#x201D; represents non-circular MAGs. <bold>(C)</bold> Pair-wise alignment of genome sequences between our genome Cir48 and the published <italic>Defluviitoga tunisiensis</italic> DTL3. The dot plot shows alignments longer than 1,000&#x2009;bp.</p>
</caption>
<graphic xlink:href="fmicb-13-1095497-g004.tif"/>
</fig>
<p>According to the taxonomic annotation by GTDB-Tk, all genomes have been successfully classified at high taxonomic level (domain, phylum, class, order, and family), while 6 and 17 genomes cannot be classified at genus and species level, respectively (<xref rid="fig4" ref-type="fig">Figure 4B</xref>; <xref ref-type="supplementary-material" rid="SM3">Supplementary Tables S3</xref>, <xref ref-type="supplementary-material" rid="SM1">S4</xref>), suggesting that the 6 and 17 genomes are novel assembled genomes of these genera and species. To further classify these genomes at lower taxonomic levels, the 16S rRNA genes that identified from them were taxonomic annotated using the RDP Classifier and BLAST against the 16S rRNA database. Among the six unclassified genera, three were successfully classified at genus level by RDP Classifier, and two (Cir26 and Cir 34) of the three remaining unclassified genera showed 16S rRNA gene identities &#x003C;95% (<xref ref-type="supplementary-material" rid="SM3">Supplementary Table S3</xref>), which is the threshold for demarcating procaryotic genus (<xref ref-type="bibr" rid="ref29">Ludwig et al., 1998</xref>). Among 17 unclassified species, four (Cir02, Cir30, Bin02, and Bin17) showed 16S rRNA gene identities &#x003C;97% (<xref ref-type="supplementary-material" rid="SM4">Supplementary Table S4</xref>), which is the threshold for demarcating procaryotic species (<xref ref-type="bibr" rid="ref46">Stackebrandt and Goebel, 1994</xref>). Therefore, two and four of the HiFi assembled genomes can be treated as novel genera and species, respectively.</p>
<p>The genome Cir26 showed the highest 16S rRNA gene identity (88.6%) to the genus <italic>Sebaldella</italic>, an obligately anaerobic bacteria that could hydrolyze the glucose to produce acetate and lactic acids, and one uncultured clone of this genus was identified in a mesophilic anaerobic digester (<xref ref-type="bibr" rid="ref43">Riviere et al., 2009</xref>; <xref ref-type="bibr" rid="ref17">Harmon-Smith et al., 2010</xref>). The genome Cir02 and Bin17 have the highest 16S rRNA gene identity to <italic>Paludibacter jiangxiensis</italic> (87.5%) and <italic>Desulfonispora thiosulfatigenes</italic> (93.1%), and both of them were anaerobic bacteria and could produce acetate from glucose and organosulfonate taurine, respectively (<xref ref-type="bibr" rid="ref12">Denger et al., 1999</xref>; <xref ref-type="bibr" rid="ref41">Qiu et al., 2014</xref>). In addition, the genome Cir34, Cir30, and Bin02 have the highest 16S rRNA gene identities to the phylum WS1 (90.3%), class <italic>Anaerolineeae</italic> (95.8%), and class <italic>Phycisphaerae</italic> (92.4%), respectively, but the taxonomic annotation at lower levels of these species are unknown. The above results indicated that Cir26, Cir02, and Bin17 may provide substrates to methanogens for methane production in AD, while the functions of Cir34, Cir30, and Bin02 need further investigation.</p>
</sec>
<sec id="sec17">
<title>The most abundant microbial genome belongs to <italic>Defluviitoga tunisiensis</italic></title>
<p>Considering the coverage depth of each genome generated by mapping the HiFi reads to these genomes using Minimap2 (<xref ref-type="bibr" rid="ref23">Li, 2018</xref>), the most abundant genome was a circular genome Cir48 (taxonomically annotated as <italic>Defluviitoga tunisiensis</italic>) with the highest coverage depth of 16,076 (X), much higher than that of other genomes (&#x003C; 1,270 X; <xref rid="fig4" ref-type="fig">Figure 4B</xref>). In 2015, the complete genome sequence of <italic>D</italic>. <italic>tunisiensis</italic> L3 was reported, consisting of a circular contig with length of 2,053,097&#x2009;bp and GC content of 31.4% (<xref ref-type="bibr" rid="ref33">Maus et al., 2015</xref>). The pair-wise sequence alignment between the genomes of Cir48 and <italic>D</italic>. <italic>tunisiensis</italic> L3 showed a clear 1-to-1 syntenic relationship between these two genomes (<xref rid="fig4" ref-type="fig">Figure 4C</xref>). In addition, the two genomes have similar genome size (2.18 vs. 2.05&#x2009;Mb) and GC content (31.2 vs. 31.4%), and high ANI value (97.8%) and 16S rRNA gene identity (100%), suggesting that these two genomes belong to the same species of <italic>D</italic>. <italic>tunisiensis</italic>. <italic>Defluviitoga tunisiensis</italic> was firstly isolated from an anaerobic digester, and it can utilize a variety of complex polysaccharides, such as cellulose, chitin and xylan, and acetate, carbon dioxide and hydrogen were found as possible end-products of the fermentation process (<xref ref-type="bibr" rid="ref3">Ben Hania et al., 2012</xref>; <xref ref-type="bibr" rid="ref32">Maus et al., 2016</xref>). Since these compounds are essential substrates for producing of methane, it is reasonable to explain the highly abundant of Cir48 in current anaerobic digester for food waste.</p>
<p>The other abundant genomes include one archaeal genome Cir17 (<italic>Methanothrix</italic> sp., 1,268 X) and four bacterial genomes Cir16 (UBA1062 sp., 792 X), Cir40 (<italic>Fermentinonas massiliensis</italic>, 712 X), MAG Bin19 (UBA1976 sp., 666 X), and Cir20 (<italic>Gleimia</italic> sp., 451 X; <xref rid="fig4" ref-type="fig">Figure 4B</xref>). The genome Cir17 belongs to the archaeal phylum <italic>Euryarchaeota</italic>, and the coverage depth of this genome is obviously higher than that of the other archaeal genomes (<xref rid="fig4" ref-type="fig">Figure 4B</xref>), suggesting that <italic>Methanothrix</italic> sp. may play the most important role in the last step of methane production in the AD microbial community here analyzed. Noticeably, several complete circular genomes with relatively low coverage depth (&#x003C;20 X) were also successfully assembled by Hifiasm-meta, including Cir02 (11 X), Cir08 (12 X), Cir07 (12 X), Cir15 (14 X), Cir21 (14 X), and Cir30 (16 X; <xref rid="fig4" ref-type="fig">Figure 4B</xref>).</p>
<p>Then, the relative abundance of different taxonomic ranks was calculated based on the taxonomic annotation and coverage depth of each genome, which showed that the microbial community consisted 93.9% of <italic>Bacteria</italic> and 6.1% of <italic>Archaea</italic> at domain level. The most predominant phylum was <italic>Thermotogae</italic> (70.5%), followed by <italic>Euryarchaeota</italic> (6.1%), <italic>Bacteroidetes</italic> (4.7%), <italic>Synergistetes</italic> (4.1%), <italic>Desulfobacterota</italic> (3.5%), <italic>Actinobacteria</italic> (3.1%), and <italic>Firmicutes</italic> (2.4%; <xref rid="fig5" ref-type="fig">Figure 5</xref>). Considering the diverse lifestyle of the members of the phylum <italic>Thermotogae</italic> in both thermophilic (54&#x00B0;C) and mesophilic (37&#x00B0;C) anaerobic digesters (<xref ref-type="bibr" rid="ref25">Li et al., 2013</xref>; <xref ref-type="bibr" rid="ref6">Campanaro et al., 2016</xref>; <xref ref-type="bibr" rid="ref48">Stolze et al., 2016</xref>; <xref ref-type="bibr" rid="ref31">Maus et al., 2017</xref>), the dominance of <italic>Thermotogae</italic> in the microbial community of AD for food waste at mesophilic condition is possibly due to environmental selection.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Microbial community of the anaerobic digester for food waste. The microbial community derived from the assembled genomes was generated based on the taxonomic annotation of the whole genomes by using GTDB-Tk, while that derived from the 16S rRNA genes was obtained from the taxonomic annotation of the full-length 16S rRNA genes identified from the HiFi reads, using the tool RDP Classifier.</p>
</caption>
<graphic xlink:href="fmicb-13-1095497-g005.tif"/>
</fig>
</sec>
<sec id="sec18">
<title>Full-length 16S rRNA gene diversity analysis</title>
<p>To determine whether the real microbial composition of AD can be recovered from the 60 HiFi assembled genomes, we also used the full-length 16S rRNA genes identified from the HiFi reads to investigate the microbial compositions. We identified the 16S rRNA genes from the accurate HiFi long reads by INFERNAL (<xref ref-type="bibr" rid="ref35">Nawrocki and Eddy, 2013</xref>), and found a total number of 54,135 16S rRNA genes. Unlike the previous study using the PCR amplification and PacBio HiFi sequencing to acquire the full-length 16S rRNA gene sequences (<xref ref-type="bibr" rid="ref28">Liang et al., 2022</xref>), the present study directly identified the full-length 16S rRNA gene sequences from the PacBio HiFi long reads, without any PCR amplification. Of the identified 16S rRNA genes, most of them (67%) ranged from 1,500 to 1,520&#x2009;bp, with the length peaked at 1,512&#x2009;bp (<xref rid="fig6" ref-type="fig">Figure 6A</xref>), consistent with the reported length of microbial full-length 16S rRNA genes. In addition, the average base quality of most of the identified 16S rRNA genes (80%) ranged from Q20 (99% average base accuracy) to Q40 (99.99% average base accuracy; <xref rid="fig6" ref-type="fig">Figure 6B</xref>), indicating the high quality of the identified 16S rRNA genes.</p>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption>
<p>Analysis of microbial communities based on the full-length 16S rRNA genes identified from HiFi reads. <bold>(A)</bold> Distribution of the length of 16S rRNA genes. <bold>(B)</bold> Distribution of sequencing quality of 16S rRNA genes. Q20 means an average base accuracy of 99%, Q30 means 99.9%, and so on. <bold>(C)</bold> Comparison of the number of taxonomic units identified by genome taxonomy and full-length 16S rRNA genes at different taxonomic ranks.</p>
</caption>
<graphic xlink:href="fmicb-13-1095497-g006.tif"/>
</fig>
<p>Taxonomic annotation of the full-length 16S rRNA genes showed that the relative abundances of <italic>Bacteria</italic> and <italic>Archaea</italic> were 94.8 and 5.2%, respectively. The most predominant bacterial and archaeal phyla were <italic>Thermotogae</italic> (67.0%) and <italic>Euryarchaeota</italic> (5.2%), respectively, which were comparable to that derived from the assembled genomes (<xref rid="fig5" ref-type="fig">Figure 5</xref>). The other abundant phyla were <italic>Bacteroidetes</italic> (5.5%), <italic>Synergistetes</italic> (5.1%), <italic>Actinobacteria</italic> (4.6%), <italic>Firmicutes</italic> (3.1%), <italic>Chloroflexi</italic> (2.9%), <italic>Proteobacteria</italic> (1.8%), and <italic>Planctomycetes</italic> (1.7%), and they were nearly consistent with that derived from the assembled genomes, except slight differences in the relative abundance of a few phyla, such as <italic>Actinobacteria</italic>, <italic>Chloroflexi</italic>, and <italic>Verrucomicrobia</italic> (<xref rid="fig5" ref-type="fig">Figure 5</xref>). In addition, we found that the phylum <italic>Desulfobacterota</italic> was just identified from assembled genomes, and the phylum <italic>Proteobacteria</italic> was only detected from 16S rRNA genes (<xref rid="fig5" ref-type="fig">Figure 5</xref>), which may result from the different taxonomic annotation tools (GTDB-Tk vs. RDP Classifier) were used. We used GTDB-Tk to annotate the assembled genomes, and it classified the genomes of Bin01 and Cir16 as <italic>Desulfobacterota</italic>. However, when used RDP Classifier to annotate the 16S rRNA genes that identified from the two genomes, it classified the two genomes as <italic>Proteobacteria</italic>. So, it is hard to classify the two genomes on the basis of the current classification tools and databases. Noticeably, obviously more taxonomic units were identified by the full-length 16S rRNA genes, with the number of phyla, classes, orders, families, and genera 1.3, 1.6, 1.7, 2.5, and 3.4 times that identified by the assembled genomes, respectively (<xref rid="fig6" ref-type="fig">Figure 6C</xref>), revealing the advantage of using the full-length 16S rRNA gene for investigating microbial community.</p>
</sec>
</sec>
<sec id="sec19" sec-type="conclusions">
<title>Conclusion</title>
<p>Given the importance of AD in treatment of food waste, we used the highly accurate HiFi long reads to investigate the microbiome in a full-scale anaerobic digester for food waste. In this study, we constructed a total of 60 non-redundant microbial genomes, including 39 circular genomes. All genomes have at least one copy of rRNA operons and 54 genomes have &#x2265;18 types of standard tRNA genes. Noticeably, our HiFi-derived genomes exhibit substantial advantages over the previous short-read derived MAGs in continuity, completeness, and contamination metrics. Taxonomic annotation reveals that half of the 60 genomes belong to the phylum <italic>Bacteroidetes</italic> (16) and <italic>Firmicutes</italic> (14), and two and four genomes may belong to novel genus and species, respectively, which may provide substrates to methanogens for producing of methane in AD. The HiFi assembled genomes not only improves the description of the full genomes of the microbiome in AD, but also enables the discovery of novel microbial members living in this extreme environment.</p>
<p>Microbial community analysis based on the assembled genomes reveals the most predominant bacterial and archaeal phyla are <italic>Thermotogae</italic> and <italic>Euryarchaeota</italic>, and the genera are <italic>Defluviitoga</italic> and <italic>Methanothrix</italic>, respectively. Since 16S rRNA-based analysis is an established standard method for elucidating the composition of microbial communities, we identified 54,135 full-length 16S rRNA genes from the HiFi long reads, and revealed a consistent microbial composition with that derived from the assembled genomes, though more taxonomic units were identified. This study provides hundreds of thousands of full-length 16S rRNA genes for microbiome in AD, and deepens the understanding of the microbial community in anaerobic digester for food waste.</p>
</sec>
<sec id="sec20" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found at: NCBI - PRJNA879921.</p>
</sec>
<sec id="sec21">
<title>Author contributions</title>
<p>FJ, QL, and TS collected the samples and performed experiments. FJ analyzed the data. HW, AW, DX, LY, LL, RC, and BY provide helpful suggestions. FJ and QL wrote the raw manuscript. YD and WF conceived the study and designed the experiments. SW, YD, and WF revised the manuscript. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="sec22" sec-type="funding-information">
<title>Funding</title>
<p>This project was supported by grants from Shenzhen Science and Technology Program (JCYJ20190814163805604).</p>
</sec>
<sec id="conf1" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="sec100" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ack>
<p>We thank Lei Cheng for providing helpful suggestions. We also express our thanks to Yayue Deng for assistance with physicochemical parameters measuring.</p>
</ack>
<sec id="sec24" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fmicb.2022.1095497/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fmicb.2022.1095497/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.XLSX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_2.XLSX" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_3.XLSX" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_4.XLSX" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Angenent</surname> <given-names>L. T.</given-names></name> <name><surname>Karim</surname> <given-names>K.</given-names></name> <name><surname>Al-Dahhan</surname> <given-names>M. H.</given-names></name> <name><surname>Wrenn</surname> <given-names>B. A.</given-names></name> <name><surname>Domiguez-Espinosa</surname> <given-names>R.</given-names></name></person-group> (<year>2004</year>). <article-title>Production of bioenergy and biochemicals from industrial and agricultural wastewater</article-title>. <source>Trends Biotechnol.</source> <volume>22</volume>, <fpage>477</fpage>&#x2013;<lpage>485</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tibtech.2004.07.001</pub-id>, PMID: <pub-id pub-id-type="pmid">15331229</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Antonopoulou</surname> <given-names>G.</given-names></name> <name><surname>Ntaikou</surname> <given-names>I.</given-names></name> <name><surname>Pastore</surname> <given-names>C.</given-names></name> <name><surname>di Bitonto</surname> <given-names>L.</given-names></name> <name><surname>Bebelis</surname> <given-names>S.</given-names></name> <name><surname>Lyberatos</surname> <given-names>G.</given-names></name></person-group> (<year>2019</year>). <article-title>An overall perspective for the energetic valorization of household food waste using microbial fuel cell technology of its extract, coupled with anaerobic digestion of the solid residue</article-title>. <source>Appl. Energy</source> <volume>242</volume>, <fpage>1064</fpage>&#x2013;<lpage>1073</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.apenergy.2019.03.082</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ben Hania</surname> <given-names>W.</given-names></name> <name><surname>Godbane</surname> <given-names>R.</given-names></name> <name><surname>Postec</surname> <given-names>A.</given-names></name> <name><surname>Hamdi</surname> <given-names>M.</given-names></name> <name><surname>Ollivier</surname> <given-names>B.</given-names></name> <name><surname>Fardeau</surname> <given-names>M. L.</given-names></name></person-group> (<year>2012</year>). <article-title>Defluviitoga tunisiensis gen. Nov., sp. nov., a thermophilic bacterium isolated from a mesothermic and anaerobic whey digester</article-title>. <source>Int. J. Syst. Evol. Microbiol.</source> <volume>62</volume>, <fpage>1377</fpage>&#x2013;<lpage>1382</lpage>. doi: <pub-id pub-id-type="doi">10.1099/ijs.0.033720-0</pub-id>, PMID: <pub-id pub-id-type="pmid">21828011</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bickhart</surname> <given-names>D. M.</given-names></name> <name><surname>Kolmogorov</surname> <given-names>M.</given-names></name> <name><surname>Tseng</surname> <given-names>E.</given-names></name> <name><surname>Portik</surname> <given-names>D. M.</given-names></name> <name><surname>Korobeynikov</surname> <given-names>A.</given-names></name> <name><surname>Tolstoganov</surname> <given-names>I.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Generating lineage-resolved, complete metagenome-assembled genomes from complex microbial communities</article-title>. <source>Nat. Biotechnol.</source> <volume>40</volume>, <fpage>711</fpage>&#x2013;<lpage>719</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41587-021-01130-z</pub-id>, PMID: <pub-id pub-id-type="pmid">34980911</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bowers</surname> <given-names>R. M.</given-names></name> <name><surname>Kyrpides</surname> <given-names>N. C.</given-names></name> <name><surname>Stepanauskas</surname> <given-names>R.</given-names></name> <name><surname>Harmon-Smith</surname> <given-names>M.</given-names></name> <name><surname>Doud</surname> <given-names>D.</given-names></name> <name><surname>TBK</surname> <given-names>R.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>Minimum information about a single amplified genome (MISAG) and a metagenome-assembled genome (MIMAG) of bacteria and archaea</article-title>. <source>Nat. Biotechnol.</source> <volume>35</volume>, <fpage>725</fpage>&#x2013;<lpage>731</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nbt.3893</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Campanaro</surname> <given-names>S.</given-names></name> <name><surname>Treu</surname> <given-names>L.</given-names></name> <name><surname>Kougias</surname> <given-names>P. G.</given-names></name> <name><surname>De Francisci</surname> <given-names>D.</given-names></name> <name><surname>Valle</surname> <given-names>G.</given-names></name> <name><surname>Angelidaki</surname> <given-names>I.</given-names></name></person-group> (<year>2016</year>). <article-title>Metagenomic analysis and functional characterization of the biogas microbiome using high throughput shotgun sequencing and a novel binning strategy</article-title>. <source>Biotechnol. Biofuels</source> <volume>9</volume>:<fpage>26</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13068-016-0441-1</pub-id>, PMID: <pub-id pub-id-type="pmid">26839589</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Campanaro</surname> <given-names>S.</given-names></name> <name><surname>Treu</surname> <given-names>L.</given-names></name> <name><surname>Kougias</surname> <given-names>P. G.</given-names></name> <name><surname>Luo</surname> <given-names>G.</given-names></name> <name><surname>Angelidaki</surname> <given-names>I.</given-names></name></person-group> (<year>2018</year>). <article-title>Metagenomic binning reveals the functional roles of core abundant microorganisms in twelve full-scale biogas plants</article-title>. <source>Water Res.</source> <volume>140</volume>, <fpage>123</fpage>&#x2013;<lpage>134</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.watres.2018.04.043</pub-id>, PMID: <pub-id pub-id-type="pmid">29704757</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Campanaro</surname> <given-names>S.</given-names></name> <name><surname>Treu</surname> <given-names>L.</given-names></name> <name><surname>Rodriguez</surname> <given-names>R. L.</given-names></name> <name><surname>Kovalovszki</surname> <given-names>A.</given-names></name> <name><surname>Ziels</surname> <given-names>R. M.</given-names></name> <name><surname>Maus</surname> <given-names>I.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>New insights from the biogas microbiome by comprehensive genome-resolved metagenomics of nearly 1600 species originating from multiple anaerobic digesters</article-title>. <source>Biotechnol. Biofuels</source> <volume>13</volume>:<fpage>25</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13068-020-01679-y</pub-id>, PMID: <pub-id pub-id-type="pmid">32123542</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chan</surname> <given-names>P. P.</given-names></name> <name><surname>Lin</surname> <given-names>B. Y.</given-names></name> <name><surname>Mak</surname> <given-names>A. J.</given-names></name> <name><surname>Lowe</surname> <given-names>T. M.</given-names></name></person-group> (<year>2021</year>). <article-title>tRNAscan-SE 2.0: improved detection and functional classification of transfer RNA genes</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>9077</fpage>&#x2013;<lpage>9096</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkab688</pub-id>, PMID: <pub-id pub-id-type="pmid">34417604</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chaumeil</surname> <given-names>P. A.</given-names></name> <name><surname>Mussig</surname> <given-names>A. J.</given-names></name> <name><surname>Hugenholtz</surname> <given-names>P.</given-names></name> <name><surname>Parks</surname> <given-names>D. H.</given-names></name></person-group> (<year>2019</year>). <article-title>GTDB-Tk: a toolkit to classify genomes with the genome taxonomy database</article-title>. <source>Bioinformatics</source> <volume>36</volume>, <fpage>1925</fpage>&#x2013;<lpage>1927</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btz848</pub-id>, PMID: <pub-id pub-id-type="pmid">31730192</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chaumeil</surname> <given-names>P.-A.</given-names></name> <name><surname>Mussig</surname> <given-names>A. J.</given-names></name> <name><surname>Hugenholtz</surname> <given-names>P.</given-names></name> <name><surname>Parks</surname> <given-names>D. H.</given-names></name></person-group> (<year>2022</year>). <article-title>GTDB-Tk v2: memory friendly classification with the genome taxonomy database</article-title>. <source>Bioinformatics</source> <volume>2022</volume>:<fpage>499641</fpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btac672</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Denger</surname> <given-names>K.</given-names></name> <name><surname>Stackebrandt</surname> <given-names>E.</given-names></name> <name><surname>Cook</surname> <given-names>A. M.</given-names></name></person-group> (<year>1999</year>). <article-title>Desulfonispora thiosulfatigenes gen. Nov., sp. nov., a taurine-fermenting, thiosulfate-producing anaerobic bacterium</article-title>. <source>Int. J. Syst. Bacteriol.</source> <volume>49 Pt 4</volume>, <fpage>1599</fpage>&#x2013;<lpage>1603</lpage>. doi: <pub-id pub-id-type="doi">10.1099/00207713-49-4-1599</pub-id>, PMID: <pub-id pub-id-type="pmid">10555341</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Evans</surname> <given-names>P. N.</given-names></name> <name><surname>Parks</surname> <given-names>D. H.</given-names></name> <name><surname>Chadwick</surname> <given-names>G. L.</given-names></name> <name><surname>Robbins</surname> <given-names>S. J.</given-names></name> <name><surname>Orphan</surname> <given-names>V. J.</given-names></name> <name><surname>Golding</surname> <given-names>S. D.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Methane metabolism in the archaeal phylum Bathyarchaeota revealed by genome-centric metagenomics</article-title>. <source>Science</source> <volume>350</volume>, <fpage>434</fpage>&#x2013;<lpage>438</lpage>. doi: <pub-id pub-id-type="doi">10.1126/science.aac7745</pub-id>, PMID: <pub-id pub-id-type="pmid">26494757</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Feng</surname> <given-names>X.</given-names></name> <name><surname>Cheng</surname> <given-names>H.</given-names></name> <name><surname>Portik</surname> <given-names>D.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name></person-group> (<year>2022</year>). <article-title>Metagenome assembly of high-fidelity long reads with hifiasm-meta</article-title>. <source>Nat. Methods</source> <volume>19</volume>, <fpage>671</fpage>&#x2013;<lpage>674</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41592-022-01478-3</pub-id>, PMID: <pub-id pub-id-type="pmid">35534630</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fisgativa</surname> <given-names>H.</given-names></name> <name><surname>Tremier</surname> <given-names>A.</given-names></name> <name><surname>Le Roux</surname> <given-names>S.</given-names></name> <name><surname>Bureau</surname> <given-names>C.</given-names></name> <name><surname>Dabert</surname> <given-names>P.</given-names></name></person-group> (<year>2017</year>). <article-title>Understanding the anaerobic biodegradability of food waste: relationship between the typological, biochemical and microbial characteristics</article-title>. <source>J. Environ. Manag.</source> <volume>188</volume>, <fpage>95</fpage>&#x2013;<lpage>107</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jenvman.2016.11.058</pub-id>, PMID: <pub-id pub-id-type="pmid">27939694</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garcia-Depraect</surname> <given-names>O.</given-names></name> <name><surname>Martinez-Mendoza</surname> <given-names>L. J.</given-names></name> <name><surname>Diaz</surname> <given-names>I.</given-names></name> <name><surname>Munoz</surname> <given-names>R.</given-names></name></person-group> (<year>2022</year>). <article-title>Two-stage anaerobic digestion of food waste: enhanced bioenergy production rate by steering lactate-type fermentation during hydrolysis-acidogenesis</article-title>. <source>Bioresour. Technol.</source> <volume>358</volume>:<fpage>127358</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biortech.2022.127358</pub-id>, PMID: <pub-id pub-id-type="pmid">35605777</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Harmon-Smith</surname> <given-names>M.</given-names></name> <name><surname>Celia</surname> <given-names>L.</given-names></name> <name><surname>Chertkov</surname> <given-names>O.</given-names></name> <name><surname>Lapidus</surname> <given-names>A.</given-names></name> <name><surname>Copeland</surname> <given-names>A.</given-names></name> <name><surname>Glavina Del Rio</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Complete genome sequence of Sebaldella termitidis type strain (NCTC 11300)</article-title>. <source>Stand. Genomic Sci.</source> <volume>2</volume>, <fpage>220</fpage>&#x2013;<lpage>227</lpage>. doi: <pub-id pub-id-type="doi">10.4056/sigs.811799</pub-id>, PMID: <pub-id pub-id-type="pmid">21304705</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hassa</surname> <given-names>J.</given-names></name> <name><surname>Maus</surname> <given-names>I.</given-names></name> <name><surname>Off</surname> <given-names>S.</given-names></name> <name><surname>Puhler</surname> <given-names>A.</given-names></name> <name><surname>Scherer</surname> <given-names>P.</given-names></name> <name><surname>Klocke</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Metagenome, metatranscriptome, and metaproteome approaches unraveled compositions and functional relationships of microbial communities residing in biogas plants</article-title>. <source>Appl. Microbiol. Biotechnol.</source> <volume>102</volume>, <fpage>5045</fpage>&#x2013;<lpage>5063</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00253-018-8976-7</pub-id>, PMID: <pub-id pub-id-type="pmid">29713790</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kang</surname> <given-names>D. D.</given-names></name> <name><surname>Li</surname> <given-names>F.</given-names></name> <name><surname>Kirton</surname> <given-names>E.</given-names></name> <name><surname>Thomas</surname> <given-names>A.</given-names></name> <name><surname>Egan</surname> <given-names>R.</given-names></name> <name><surname>An</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>MetaBAT 2: an adaptive binning algorithm for robust and efficient genome reconstruction from metagenome assemblies</article-title>. <source>PeerJ.</source> <volume>7</volume>:<fpage>e7359</fpage>. doi: <pub-id pub-id-type="doi">10.7717/peerj.7359</pub-id>, PMID: <pub-id pub-id-type="pmid">31388474</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>H.</given-names></name> <name><surname>Kim</surname> <given-names>J.</given-names></name> <name><surname>Shin</surname> <given-names>S. G.</given-names></name> <name><surname>Hwang</surname> <given-names>S.</given-names></name> <name><surname>Lee</surname> <given-names>C.</given-names></name></person-group> (<year>2016</year>). <article-title>Continuous fermentation of food waste leachate for the production of volatile fatty acids and potential as a denitrification carbon source</article-title>. <source>Bioresour. Technol.</source> <volume>207</volume>, <fpage>440</fpage>&#x2013;<lpage>445</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biortech.2016.02.063</pub-id>, PMID: <pub-id pub-id-type="pmid">26922002</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kiran</surname> <given-names>E. U.</given-names></name> <name><surname>Trzcinski</surname> <given-names>A. P.</given-names></name> <name><surname>Ng</surname> <given-names>W. J.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name></person-group> (<year>2014</year>). <article-title>Bioconversion of food waste to energy: a review</article-title>. <source>Fuel</source> <volume>134</volume>, <fpage>389</fpage>&#x2013;<lpage>399</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.fuel.2014.05.074</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Klappenbach</surname> <given-names>J. A.</given-names></name> <name><surname>Saxman</surname> <given-names>P. R.</given-names></name> <name><surname>Cole</surname> <given-names>J. R.</given-names></name> <name><surname>Schmidt</surname> <given-names>T. M.</given-names></name></person-group> (<year>2001</year>). <article-title>Rrndb: the ribosomal RNA operon copy number database</article-title>. <source>Nucleic Acids Res.</source> <volume>29</volume>, <fpage>181</fpage>&#x2013;<lpage>184</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/29.1.181</pub-id>, PMID: <pub-id pub-id-type="pmid">11125085</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name></person-group> (<year>2018</year>). <article-title>Minimap2: pairwise alignment for nucleotide sequences</article-title>. <source>Bioinformatics</source> <volume>34</volume>, <fpage>3094</fpage>&#x2013;<lpage>3100</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/bty191</pub-id>, PMID: <pub-id pub-id-type="pmid">29750242</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>Y. Z.</given-names></name> <name><surname>Chen</surname> <given-names>Z.</given-names></name> <name><surname>Peng</surname> <given-names>Y. Y.</given-names></name> <name><surname>Huang</surname> <given-names>W. Z.</given-names></name> <name><surname>Liu</surname> <given-names>J. X.</given-names></name> <name><surname>Mironov</surname> <given-names>V.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Deeper insights into the effects of substrate to inoculum ratio selection on the relationship of kinetic parameters, microbial communities, and key metabolic pathways during the anaerobic digestion of food waste</article-title>. <source>Water Res.</source> <volume>217</volume>:<fpage>118440</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.watres.2022.118440</pub-id>, PMID: <pub-id pub-id-type="pmid">35429887</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>A.</given-names></name> <name><surname>Chu</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Ren</surname> <given-names>L.</given-names></name> <name><surname>Yu</surname> <given-names>J.</given-names></name> <name><surname>Liu</surname> <given-names>X.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>A pyrosequencing-based metagenomic study of methane-producing microbial community in solid-state biogas reactor</article-title>. <source>Biotechnol. Biofuels</source> <volume>6</volume>:<fpage>3</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1754-6834-6-3</pub-id>, PMID: <pub-id pub-id-type="pmid">23320936</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Guo</surname> <given-names>J. B.</given-names></name> <name><surname>Cheng</surname> <given-names>H. C.</given-names></name> <name><surname>Wang</surname> <given-names>W.</given-names></name> <name><surname>Dong</surname> <given-names>R. J.</given-names></name></person-group> (<year>2017</year>). <article-title>Two-phase anaerobic digestion of municipal solid wastes enhanced by hydrothermal pretreatment: viability, performance and microbial community evaluation</article-title>. <source>Appl. Energy</source> <volume>189</volume>, <fpage>613</fpage>&#x2013;<lpage>622</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.apenergy.2016.12.101</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Handsaker</surname> <given-names>B.</given-names></name> <name><surname>Wysoker</surname> <given-names>A.</given-names></name> <name><surname>Fennell</surname> <given-names>T.</given-names></name> <name><surname>Ruan</surname> <given-names>J.</given-names></name> <name><surname>Homer</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>The sequence alignment/map format and SAMtools</article-title>. <source>Bioinformatics</source> <volume>25</volume>, <fpage>2078</fpage>&#x2013;<lpage>2079</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liang</surname> <given-names>Z.</given-names></name> <name><surname>Lin</surname> <given-names>X.</given-names></name> <name><surname>Liao</surname> <given-names>Y.</given-names></name> <name><surname>Tang</surname> <given-names>T.</given-names></name></person-group> (<year>2022</year>). <article-title>Characteristics and diversity of endophytic bacteria in Panax notoginseng under high temperature analysed using full-length 16S rRNA sequencing</article-title>. <source>Arch. Microbiol.</source> <volume>204</volume>:<fpage>435</fpage>. doi: <pub-id pub-id-type="doi">10.1007/s00203-022-03043-0</pub-id>, PMID: <pub-id pub-id-type="pmid">35763100</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ludwig</surname> <given-names>W.</given-names></name> <name><surname>Strunk</surname> <given-names>O.</given-names></name> <name><surname>Klugbauer</surname> <given-names>S.</given-names></name> <name><surname>Klugbauer</surname> <given-names>N.</given-names></name> <name><surname>Weizenegger</surname> <given-names>M.</given-names></name> <name><surname>Neumaier</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>1998</year>). <article-title>Bacterial phylogeny based on comparative sequence analysis</article-title>. <source>Electrophoresis</source> <volume>19</volume>, <fpage>554</fpage>&#x2013;<lpage>568</lpage>. doi: <pub-id pub-id-type="doi">10.1002/elps.1150190416</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ma</surname> <given-names>S.</given-names></name> <name><surname>Jiang</surname> <given-names>F.</given-names></name> <name><surname>Huang</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>S.</given-names></name> <name><surname>Fan</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>A microbial gene catalog of anaerobic digestion from full-scale biogas plants</article-title>. <source>Gigascience</source> <volume>10</volume>:<fpage>giaa164</fpage>. doi: <pub-id pub-id-type="doi">10.1093/gigascience/giaa164</pub-id>, PMID: <pub-id pub-id-type="pmid">33506264</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maus</surname> <given-names>I.</given-names></name> <name><surname>Bremges</surname> <given-names>A.</given-names></name> <name><surname>Stolze</surname> <given-names>Y.</given-names></name> <name><surname>Hahnke</surname> <given-names>S.</given-names></name> <name><surname>Cibis</surname> <given-names>K. G.</given-names></name> <name><surname>Koeck</surname> <given-names>D. E.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>Genomics and prevalence of bacterial and archaeal isolates from biogas-producing microbiomes</article-title>. <source>Biotechnol. Biofuels</source> <volume>10</volume>:<fpage>264</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13068-017-0947-1</pub-id>, PMID: <pub-id pub-id-type="pmid">29158776</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maus</surname> <given-names>I.</given-names></name> <name><surname>Cibis</surname> <given-names>K. G.</given-names></name> <name><surname>Bremges</surname> <given-names>A.</given-names></name> <name><surname>Stolze</surname> <given-names>Y.</given-names></name> <name><surname>Wibberg</surname> <given-names>D.</given-names></name> <name><surname>Tomazetto</surname> <given-names>G.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Genomic characterization of Defluviitoga tunisiensis L3, a key hydrolytic bacterium in a thermophilic biogas plant and its abundance as determined by metagenome fragment recruitment</article-title>. <source>J. Biotechnol.</source> <volume>232</volume>, <fpage>50</fpage>&#x2013;<lpage>60</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jbiotec.2016.05.001</pub-id>, PMID: <pub-id pub-id-type="pmid">27165504</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maus</surname> <given-names>I.</given-names></name> <name><surname>Cibis</surname> <given-names>K. G.</given-names></name> <name><surname>Wibberg</surname> <given-names>D.</given-names></name> <name><surname>Winkler</surname> <given-names>A.</given-names></name> <name><surname>Stolze</surname> <given-names>Y.</given-names></name> <name><surname>Konig</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Complete genome sequence of the strain Defluviitoga tunisiensis L3, isolated from a thermophilic, production-scale biogas plant</article-title>. <source>J. Biotechnol.</source> <volume>203</volume>, <fpage>17</fpage>&#x2013;<lpage>18</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jbiotec.2015.03.006</pub-id>, PMID: <pub-id pub-id-type="pmid">25801333</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maus</surname> <given-names>I.</given-names></name> <name><surname>Rumming</surname> <given-names>M.</given-names></name> <name><surname>Bergmann</surname> <given-names>I.</given-names></name> <name><surname>Heeg</surname> <given-names>K.</given-names></name> <name><surname>Pohl</surname> <given-names>M.</given-names></name> <name><surname>Nettmann</surname> <given-names>E.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Characterization of Bathyarchaeota genomes assembled from metagenomes of biofilms residing in mesophilic and thermophilic biogas reactors</article-title>. <source>Biotechnol. Biofuels</source> <volume>11</volume>:<fpage>167</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13068-018-1162-4</pub-id>, PMID: <pub-id pub-id-type="pmid">29951113</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nawrocki</surname> <given-names>E. P.</given-names></name> <name><surname>Eddy</surname> <given-names>S. R.</given-names></name></person-group> (<year>2013</year>). <article-title>Infernal 1.1: 100-fold faster RNA homology searches</article-title>. <source>Bioinformatics</source> <volume>29</volume>, <fpage>2933</fpage>&#x2013;<lpage>2935</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btt509</pub-id>, PMID: <pub-id pub-id-type="pmid">24008419</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ondov</surname> <given-names>B. D.</given-names></name> <name><surname>Treangen</surname> <given-names>T. J.</given-names></name> <name><surname>Melsted</surname> <given-names>P.</given-names></name> <name><surname>Mallonee</surname> <given-names>A. B.</given-names></name> <name><surname>Bergman</surname> <given-names>N. H.</given-names></name> <name><surname>Koren</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Mash: fast genome and metagenome distance estimation using MinHash</article-title>. <source>Genome Biol.</source> <volume>17</volume>:<fpage>132</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13059-016-0997-x</pub-id>, PMID: <pub-id pub-id-type="pmid">27323842</pub-id></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Paritosh</surname> <given-names>K.</given-names></name> <name><surname>Kushwaha</surname> <given-names>S. K.</given-names></name> <name><surname>Yadav</surname> <given-names>M.</given-names></name> <name><surname>Pareek</surname> <given-names>N.</given-names></name> <name><surname>Chawade</surname> <given-names>A.</given-names></name> <name><surname>Vivekanand</surname> <given-names>V.</given-names></name></person-group> (<year>2017</year>). <article-title>Food waste to energy: an overview of sustainable approaches for food waste management and nutrient recycling</article-title>. <source>Biomed. Res. Int.</source> <volume>2017</volume>, <fpage>1</fpage>&#x2013;<lpage>19</lpage>. doi: <pub-id pub-id-type="doi">10.1155/2017/2370927</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parks</surname> <given-names>D. H.</given-names></name> <name><surname>Chuvochina</surname> <given-names>M.</given-names></name> <name><surname>Rinke</surname> <given-names>C.</given-names></name> <name><surname>Mussig</surname> <given-names>A. J.</given-names></name> <name><surname>Chaumeil</surname> <given-names>P. A.</given-names></name> <name><surname>Hugenholtz</surname> <given-names>P.</given-names></name></person-group> (<year>2022</year>). <article-title>GTDB: an ongoing census of bacterial and archaeal diversity through a phylogenetically consistent, rank normalized and complete genome-based taxonomy</article-title>. <source>Nucleic Acids Res.</source> <volume>50</volume>, <fpage>D785</fpage>&#x2013;<lpage>D794</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkab776</pub-id>, PMID: <pub-id pub-id-type="pmid">34520557</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parks</surname> <given-names>D. H.</given-names></name> <name><surname>Imelfort</surname> <given-names>M.</given-names></name> <name><surname>Skennerton</surname> <given-names>C. T.</given-names></name> <name><surname>Hugenholtz</surname> <given-names>P.</given-names></name> <name><surname>Tyson</surname> <given-names>G. W.</given-names></name></person-group> (<year>2015</year>). <article-title>CheckM: assessing the quality of microbial genomes recovered from isolates, single cells, and metagenomes</article-title>. <source>Genome Res.</source> <volume>25</volume>, <fpage>1043</fpage>&#x2013;<lpage>1055</lpage>. doi: <pub-id pub-id-type="doi">10.1101/gr.186072.114</pub-id>, PMID: <pub-id pub-id-type="pmid">25977477</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Price</surname> <given-names>M. N.</given-names></name> <name><surname>Dehal</surname> <given-names>P. S.</given-names></name> <name><surname>Arkin</surname> <given-names>A. P.</given-names></name></person-group> (<year>2010</year>). <article-title>FastTree 2--approximately maximum-likelihood trees for large alignments</article-title>. <source>PLoS One</source> <volume>5</volume>:<fpage>e9490</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0009490</pub-id>, PMID: <pub-id pub-id-type="pmid">20224823</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Qiu</surname> <given-names>Y. L.</given-names></name> <name><surname>Kuang</surname> <given-names>X. Z.</given-names></name> <name><surname>Shi</surname> <given-names>X. S.</given-names></name> <name><surname>Yuan</surname> <given-names>X. Z.</given-names></name> <name><surname>Guo</surname> <given-names>R. B.</given-names></name></person-group> (<year>2014</year>). <article-title>Paludibacter jiangxiensis sp. nov., a strictly anaerobic, propionate-producing bacterium isolated from rice paddy field</article-title>. <source>Arch. Microbiol.</source> <volume>196</volume>, <fpage>149</fpage>&#x2013;<lpage>155</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00203-013-0951-1</pub-id>, PMID: <pub-id pub-id-type="pmid">24419224</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Quast</surname> <given-names>C.</given-names></name> <name><surname>Pruesse</surname> <given-names>E.</given-names></name> <name><surname>Yilmaz</surname> <given-names>P.</given-names></name> <name><surname>Gerken</surname> <given-names>J.</given-names></name> <name><surname>Schweer</surname> <given-names>T.</given-names></name> <name><surname>Yarza</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>The SILVA ribosomal RNA gene database project: improved data processing and web-based tools</article-title>. <source>Nucleic Acids Res.</source> <volume>41</volume>, <fpage>D590</fpage>&#x2013;<lpage>D596</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gks1219</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Riviere</surname> <given-names>D.</given-names></name> <name><surname>Desvignes</surname> <given-names>V.</given-names></name> <name><surname>Pelletier</surname> <given-names>E.</given-names></name> <name><surname>Chaussonnerie</surname> <given-names>S.</given-names></name> <name><surname>Guermazi</surname> <given-names>S.</given-names></name> <name><surname>Weissenbach</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>Towards the definition of a core of microorganisms involved in anaerobic digestion of sludge</article-title>. <source>ISME J.</source> <volume>3</volume>, <fpage>700</fpage>&#x2013;<lpage>714</lpage>. doi: <pub-id pub-id-type="doi">10.1038/ismej.2009.2</pub-id>, PMID: <pub-id pub-id-type="pmid">19242531</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schn&#x00FC;rer</surname> <given-names>A.</given-names></name></person-group> (<year>2016</year>). <article-title>Biogas production: microbiology and technology</article-title>. <source>Adv. Biochem. Eng. Biotechnol.</source> <volume>156</volume>, <fpage>195</fpage>&#x2013;<lpage>234</lpage>. doi: <pub-id pub-id-type="doi">10.1007/10_2016_5</pub-id></citation></ref>
<ref id="ref45"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Simmons</surname> <given-names>GM</given-names></name> <name><surname>Greenberg</surname> <given-names>AE</given-names></name> <name><surname>Clesceri</surname> <given-names>LS</given-names></name> <name><surname>Eaton</surname> <given-names>AD</given-names></name></person-group>. (<year>1998</year>). <source>Standard Methods for the Examination of Water and Waste Water</source>. <publisher-loc>Washington DC</publisher-loc>: <publisher-name>American Public Health Association</publisher-name></citation></ref>
<ref id="ref46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stackebrandt</surname> <given-names>E.</given-names></name> <name><surname>Goebel</surname> <given-names>B. M.</given-names></name></person-group> (<year>1994</year>). <article-title>Taxonomic note: a place for DNA-DNA reassociation and 16S rRNA sequence analysis in the present species definition in bacteriology</article-title>. <source>Int. J. Syst. Evol. Microbiol.</source> <volume>44</volume>, <fpage>846</fpage>&#x2013;<lpage>849</lpage>. doi: <pub-id pub-id-type="doi">10.1099/00207713-44-4-846</pub-id></citation></ref>
<ref id="ref47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stoddard</surname> <given-names>S. F.</given-names></name> <name><surname>Smith</surname> <given-names>B. J.</given-names></name> <name><surname>Hein</surname> <given-names>R.</given-names></name> <name><surname>Roller</surname> <given-names>B. R.</given-names></name> <name><surname>Schmidt</surname> <given-names>T. M.</given-names></name></person-group> (<year>2015</year>). <article-title>rrnDB: improved tools for interpreting rRNA gene abundance in bacteria and archaea and a new foundation for future development</article-title>. <source>Nucleic Acids Res.</source> <volume>43</volume>, <fpage>D593</fpage>&#x2013;<lpage>D598</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gku1201</pub-id>, PMID: <pub-id pub-id-type="pmid">25414355</pub-id></citation></ref>
<ref id="ref48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stolze</surname> <given-names>Y.</given-names></name> <name><surname>Bremges</surname> <given-names>A.</given-names></name> <name><surname>Rumming</surname> <given-names>M.</given-names></name> <name><surname>Henke</surname> <given-names>C.</given-names></name> <name><surname>Maus</surname> <given-names>I.</given-names></name> <name><surname>Puhler</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Identification and genome reconstruction of abundant distinct taxa in microbiomes from one thermophilic and three mesophilic production-scale biogas plants</article-title>. <source>Biotechnol. Biofuels</source> <volume>9</volume>:<fpage>156</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13068-016-0565-3</pub-id>, PMID: <pub-id pub-id-type="pmid">27462367</pub-id></citation></ref>
<ref id="ref49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Treu</surname> <given-names>L.</given-names></name> <name><surname>Kougias</surname> <given-names>P. G.</given-names></name> <name><surname>Campanaro</surname> <given-names>S.</given-names></name> <name><surname>Bassani</surname> <given-names>I.</given-names></name> <name><surname>Angelidaki</surname> <given-names>I.</given-names></name></person-group> (<year>2016</year>). <article-title>Deeper insight into the structure of the anaerobic digestion microbial community; the biogas microbiome database is expanded with 157 new genomes</article-title>. <source>Bioresour. Technol.</source> <volume>216</volume>, <fpage>260</fpage>&#x2013;<lpage>266</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biortech.2016.05.081</pub-id>, PMID: <pub-id pub-id-type="pmid">27243603</pub-id></citation></ref>
<ref id="ref50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Varghese</surname> <given-names>N. J.</given-names></name> <name><surname>Mukherjee</surname> <given-names>S.</given-names></name> <name><surname>Ivanova</surname> <given-names>N.</given-names></name> <name><surname>Konstantinidis</surname> <given-names>K. T.</given-names></name> <name><surname>Mavrommatis</surname> <given-names>K.</given-names></name> <name><surname>Kyrpides</surname> <given-names>N. C.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Microbial species delineation using whole genome sequences</article-title>. <source>Nucleic Acids Res.</source> <volume>43</volume>, <fpage>6761</fpage>&#x2013;<lpage>6771</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkv657</pub-id>, PMID: <pub-id pub-id-type="pmid">26150420</pub-id></citation></ref>
<ref id="ref51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Q.</given-names></name> <name><surname>Garrity</surname> <given-names>G. M.</given-names></name> <name><surname>Tiedje</surname> <given-names>J. M.</given-names></name> <name><surname>Cole</surname> <given-names>J. R.</given-names></name></person-group> (<year>2007</year>). <article-title>Naive Bayesian classifier for rapid assignment of rRNA sequences into the new bacterial taxonomy</article-title>. <source>Appl. Environ. Microbiol.</source> <volume>73</volume>, <fpage>5261</fpage>&#x2013;<lpage>5267</lpage>. doi: <pub-id pub-id-type="doi">10.1128/AEM.00062-07</pub-id>, PMID: <pub-id pub-id-type="pmid">17586664</pub-id></citation></ref>
<ref id="ref52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wick</surname> <given-names>R. R.</given-names></name> <name><surname>Schultz</surname> <given-names>M. B.</given-names></name> <name><surname>Zobel</surname> <given-names>J.</given-names></name> <name><surname>Holt</surname> <given-names>K. E.</given-names></name></person-group> (<year>2015</year>). <article-title>Bandage: interactive visualization of de novo genome assemblies</article-title>. <source>Bioinformatics</source> <volume>31</volume>, <fpage>3350</fpage>&#x2013;<lpage>3352</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btv383</pub-id>, PMID: <pub-id pub-id-type="pmid">26099265</pub-id></citation></ref>
<ref id="ref53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wong</surname> <given-names>J. W. C.</given-names></name> <name><surname>Kaur</surname> <given-names>G.</given-names></name> <name><surname>Mehariya</surname> <given-names>S.</given-names></name> <name><surname>Karthikeyan</surname> <given-names>O. P.</given-names></name> <name><surname>Chen</surname> <given-names>G. H.</given-names></name></person-group> (<year>2018</year>). <article-title>Food waste treatment by anaerobic co-digestion with saline sludge and its implications for energy recovery in Hong Kong</article-title>. <source>Bioresour. Technol.</source> <volume>268</volume>, <fpage>824</fpage>&#x2013;<lpage>828</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biortech.2018.07.113</pub-id>, PMID: <pub-id pub-id-type="pmid">30064901</pub-id></citation></ref>
<ref id="ref54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>K. C.</given-names></name> <name><surname>Ho</surname> <given-names>K. C.</given-names></name> <name><surname>Tang</surname> <given-names>C. C.</given-names></name> <name><surname>Yau</surname> <given-names>Y. H.</given-names></name></person-group> (<year>2021</year>). <article-title>The potential of foodwaste leachate as a phycoremediation substrate for microalgal CO (2) fixation and biodiesel production</article-title>. <source>Environ. Sci. Pollut. Res.</source> <volume>28</volume>, <fpage>40724</fpage>&#x2013;<lpage>40734</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11356-018-1242-9</pub-id>, PMID: <pub-id pub-id-type="pmid">29504078</pub-id></citation></ref>
<ref id="ref55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>F.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Ge</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>L.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name></person-group> (<year>2018</year>). <article-title>Anaerobic digestion of food waste&#x2014;challenges and opportunities</article-title>. <source>Bioresour. Technol.</source> <volume>247</volume>, <fpage>1047</fpage>&#x2013;<lpage>1058</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biortech.2017.09.020</pub-id>, PMID: <pub-id pub-id-type="pmid">28965912</pub-id></citation></ref>
<ref id="ref56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zan</surname> <given-names>F. X.</given-names></name> <name><surname>Dai</surname> <given-names>J.</given-names></name> <name><surname>Hong</surname> <given-names>Y. Z.</given-names></name> <name><surname>Wong</surname> <given-names>M. Y.</given-names></name> <name><surname>Jiang</surname> <given-names>F.</given-names></name> <name><surname>Chen</surname> <given-names>G. H.</given-names></name></person-group> (<year>2018</year>). <article-title>The characteristics of household food waste in Hong Kong and their implications for sewage quality and energy recovery</article-title>. <source>Waste Manag.</source> <volume>74</volume>, <fpage>63</fpage>&#x2013;<lpage>73</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.wasman.2017.11.051</pub-id>, PMID: <pub-id pub-id-type="pmid">29208531</pub-id></citation></ref>
<ref id="ref57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Jiang</surname> <given-names>F.</given-names></name> <name><surname>Yang</surname> <given-names>B.</given-names></name> <name><surname>Wang</surname> <given-names>S.</given-names></name> <name><surname>Wang</surname> <given-names>H.</given-names></name> <name><surname>Wang</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Improved microbial genomes and gene catalog of the chicken gut from metagenomic sequencing of high-fidelity long reads</article-title>. <source>Gigascience</source> <volume>11</volume>:<fpage>giac116</fpage>. doi: <pub-id pub-id-type="doi">10.1093/gigascience/giac116</pub-id>, PMID: <pub-id pub-id-type="pmid">36399059</pub-id></citation></ref>
<ref id="ref58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>S.</given-names></name> <name><surname>Ma</surname> <given-names>X.</given-names></name> <name><surname>Sun</surname> <given-names>H.</given-names></name> <name><surname>Xie</surname> <given-names>D.</given-names></name> <name><surname>Zhao</surname> <given-names>P.</given-names></name> <name><surname>Wang</surname> <given-names>Q.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Semi-continuous mesophilic-thermophilic two-phase anaerobic co-digestion of food waste and spent mushroom substance: methanogenic performance, microbial, and metagenomic analysis</article-title>. <source>Bioresour. Technol.</source> <volume>360</volume>:<fpage>127518</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biortech.2022.127518</pub-id>, PMID: <pub-id pub-id-type="pmid">35760249</pub-id></citation></ref>
</ref-list>
<glossary>
<def-list>
<title>Abbreviations</title>
<def-item>
<term>AD</term>
<def>
<p>Anaerobic digestion</p>
</def>
</def-item>
<def-item>
<term>ANI</term>
<def>
<p>Average nucleotide identity</p>
</def>
</def-item>
<def-item>
<term>CCS</term>
<def>
<p>Circular consensus sequence</p>
</def>
</def-item>
<def-item>
<term>COD</term>
<def>
<p>Chemical oxygen demand</p>
</def>
</def-item>
<def-item>
<term>Cp</term>
<def>
<p>Completeness</p>
</def>
</def-item>
<def-item>
<term>Ct</term>
<def>
<p>Contamination</p>
</def>
</def-item>
<def-item>
<term>Gb</term>
<def>
<p>Gigabyte</p>
</def>
</def-item>
<def-item>
<term>HiFi</term>
<def>
<p>High-fidelity</p>
</def>
</def-item>
<def-item>
<term>Kb</term>
<def>
<p>Kilobase</p>
</def>
</def-item>
<def-item>
<term>kg</term>
<def>
<p>Kilogram</p>
</def>
</def-item>
<def-item>
<term>L</term>
<def>
<p>Liter</p>
</def>
</def-item>
<def-item>
<term>mg</term>
<def>
<p>Microgram</p>
</def>
</def-item>
<def-item>
<term>mL</term>
<def>
<p>Microliter</p>
</def>
</def-item>
<def-item>
<term>MAG</term>
<def>
<p>Metagenome-assembled genome</p>
</def>
</def-item>
<def-item>
<term>Mb</term>
<def>
<p>Megabase</p>
</def>
</def-item>
<def-item>
<term>rRNA</term>
<def>
<p>Ribosomal RNA</p>
</def>
</def-item>
<def-item>
<term>RDP</term>
<def>
<p>Ribosomal database project</p>
</def>
</def-item>
<def-item>
<term>tRNA</term>
<def>
<p>Transfer RNA</p>
</def>
</def-item>
<def-item>
<term>TAN</term>
<def>
<p>Total ammonia nitrogen</p>
</def>
</def-item>
<def-item>
<term>TS</term>
<def>
<p>Total solid</p>
</def>
</def-item>
<def-item>
<term>VFA</term>
<def>
<p>Volatile fatty acid</p>
</def>
</def-item>
<def-item>
<term>v</term>
<def>
<p>Volume</p>
</def>
</def-item>
<def-item>
<term>w</term>
<def>
<p>Weight</p>
</def>
</def-item>
<def-item>
<term>PacBio</term>
<def>
<p>Pacific biosciences</p>
</def>
</def-item>
</def-list>
</glossary>
<fn-group>
<fn id="fn0005">
<p><sup>1</sup><ext-link xlink:href="https://github.com/ablab/viralVerify" ext-link-type="uri">https://github.com/ablab/viralVerify</ext-link></p>
</fn>
</fn-group>
</back>
</article>