<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Bioeng. Biotechnol.</journal-id>
<journal-title>Frontiers in Bioengineering and Biotechnology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Bioeng. Biotechnol.</abbrev-journal-title>
<issn pub-type="epub">2296-4185</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1197175</article-id>
<article-id pub-id-type="doi">10.3389/fbioe.2023.1197175</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Bioengineering and Biotechnology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Comparison of metagenomes from fermentation of various agroindustrial residues suggests a common model of community organization</article-title>
<alt-title alt-title-type="left-running-head">Myers et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fbioe.2023.1197175">10.3389/fbioe.2023.1197175</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Myers</surname>
<given-names>Kevin S.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2089102/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ingle</surname>
<given-names>Abel T.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1357143/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Walters</surname>
<given-names>Kevin A.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1953929/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Fortney</surname>
<given-names>Nathaniel W.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/571498/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Scarborough</surname>
<given-names>Matthew J.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Donohue</surname>
<given-names>Timothy J.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/304825/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Noguera</surname>
<given-names>Daniel R.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2276131/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Great Lakes Bioenergy Research Center</institution>, <institution>University of Wisconsin-Madison</institution>, <addr-line>Madison</addr-line>, <addr-line>WI</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Wisconsin Energy Institute</institution>, <institution>University of Wisconsin-Madison</institution>, <addr-line>Madison</addr-line>, <addr-line>WI</addr-line>, <country>United States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Civil and Environmental Engineering</institution>, <institution>University of Wisconsin-Madison</institution>, <addr-line>Madison</addr-line>, <addr-line>WI</addr-line>, <country>United States</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Civil and Environmental Engineering</institution>, <institution>University of Vermont</institution>, <addr-line>Burlington</addr-line>, <addr-line>VT</addr-line>, <country>United States</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Department of Bacteriology</institution>, <institution>University of Wisconsin-Madison</institution>, <addr-line>Madison</addr-line>, <addr-line>WI</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/266107/overview">David Strik</ext-link>, Wageningen University and Research, Netherlands</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/945468/overview">Anna Christine Trego</ext-link>, University of Galway, Ireland</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/629926/overview">Alessandra Fontana</ext-link>, Catholic University of the Sacred Heart, Piacenza, Italy</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Daniel R. Noguera, <email>dnoguera@wisc.edu</email>
</corresp>
<fn fn-type="equal" id="fn1">
<label>
<sup>&#x2020;</sup>
</label>
<p>
<bold>Present address:</bold> Nathaniel W. Fortney, Thermo Fisher Scientific, Middleton, WI, United States</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>10</day>
<month>05</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>11</volume>
<elocation-id>1197175</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>03</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>27</day>
<month>04</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Myers, Ingle, Walters, Fortney, Scarborough, Donohue and Noguera.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Myers, Ingle, Walters, Fortney, Scarborough, Donohue and Noguera</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The liquid residue resulting from various agroindustrial processes is both rich in organic material and an attractive source to produce a variety of chemicals. Using microbial communities to produce chemicals from these liquid residues is an active area of research, but it is unclear how to deploy microbial communities to produce specific products from the different agroindustrial residues. To address this, we fed anaerobic bioreactors one of several agroindustrial residues (carbohydrate-rich lignocellulosic fermentation conversion residue, xylose, dairy manure hydrolysate, ultra-filtered milk permeate, and thin stillage from a starch bioethanol plant) and inoculated them with a microbial community from an acid-phase digester operated at the wastewater treatment plant in Madison, WI, United States. The bioreactors were monitored over a period of months and sampled to assess microbial community composition and extracellular fermentation products. We obtained metagenome assembled genomes (MAGs) from the microbial communities in each bioreactor and performed comparative genomic analyses to identify common microorganisms, as well as any community members that were unique to each reactor. Collectively, we obtained a dataset of 217 non-redundant MAGs from these bioreactors. This metagenome assembled genome dataset was used to evaluate whether a specific microbial ecology model in which medium chain fatty acids (MCFAs) are simultaneously produced from intermediate products (e.g., lactic acid) and carbohydrates could be applicable to all fermentation systems, regardless of the feedstock. MAGs were classified using a multiclass classification machine learning algorithm into three groups, organisms fermenting the carbohydrates to intermediate products, organisms utilizing the intermediate products to produce MCFAs, and organisms producing MCFAs directly from carbohydrates. This analysis revealed common biological functions among the microbial communities in different bioreactors, and although different microorganisms were enriched depending on the agroindustrial residue tested, the results supported the conclusion that the microbial ecology model tested was appropriate to explain the MCFA production potential from all agricultural residues.</p>
</abstract>
<kwd-group>
<kwd>microbiome</kwd>
<kwd>fermentation</kwd>
<kwd>chain elongation</kwd>
<kwd>agroindustrial residue</kwd>
<kwd>metagenomics</kwd>
</kwd-group>
<contract-num rid="cn001">DE-SC0018409</contract-num>
<contract-sponsor id="cn001">Biological and Environmental Research<named-content content-type="fundref-id">10.13039/100006206</named-content>
</contract-sponsor>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Bioprocess Engineering</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>1 Introduction</title>
<p>Finding ways to generate chemicals and chemical precursors from renewable sources is an important step towards creating a sustainable circular economy that decreases society&#x2019;s dependance on fossil fuels. Medium chain fatty acids (MCFAs) are one such class of product that can be microbially produced, have applications in lubricant synthesis, production of herbicides and antimicrobials, and can be further processing into additional chemicals (<xref ref-type="bibr" rid="B57">Sarria et al., 2017</xref>; <xref ref-type="bibr" rid="B59">Scarborough et al., 2018b</xref>). Microbes and microbial communities can produce MCFAs using a wide variety of carbohydrate-rich substrates, making biological MCFA production an attractive target due to the widespread availability of carbohydrate-rich organic wastes that can be used as substrates, such as undistilled corn beer (<xref ref-type="bibr" rid="B25">Ge et al., 2015</xref>), thin stillage (<xref ref-type="bibr" rid="B19">Fortney et al., 2021</xref>), lignocellulosic fermentation conversion residues (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>; <xref ref-type="bibr" rid="B59">Scarborough et al., 2018b</xref>), a soluble fraction of municipal solid waste (<xref ref-type="bibr" rid="B26">Grootscholten et al., 2013</xref>; <xref ref-type="bibr" rid="B27">Grootscholten et al., 2014</xref>) and winery residue (<xref ref-type="bibr" rid="B44">Kucek et al., 2016b</xref>). In addition to MCFAs, other fermentation products have been identified as coproduced by microbial communities that generate MCFAs from various substrates, including the accumulation of acetic, lactic, succinic, and butyric acids, as well as ethanol (<xref ref-type="bibr" rid="B29">Han et al., 2018</xref>; <xref ref-type="bibr" rid="B19">Fortney et al., 2021</xref>). Lactic, succinic, and butyric acids can be used as building blocks for materials such as bioplastics (<xref ref-type="bibr" rid="B30">Harmsen et al., 2014</xref>). Further, both lactic acid and ethanol have been shown to be intermediate metabolites during MCFA production by members of microbial communities that perform reverse &#xdf;-oxidation, also known as chain elongation (<xref ref-type="bibr" rid="B1">Agler et al., 2012</xref>; <xref ref-type="bibr" rid="B78">Zhu et al., 2015</xref>; <xref ref-type="bibr" rid="B43">Kucek et al., 2016a</xref>; <xref ref-type="bibr" rid="B29">Han et al., 2018</xref>). Although most MCFA production research has been conducted with microbial communities, it is not clear how to steer a community towards maximizing MCFA production without accumulation of other fermentation products, or how to harness the microbial community to produce primarily one fermentation product. Therefore, additional knowledge is needed to enable the engineering of microbial communities to produce the desired fermentation products. We are interested in generating models that can explain and possibly predict the relationship of microbial community structure with the type of carbohydrate-rich substrates and the type of fermentation products that accumulate.</p>
<p>An emerging microbial ecology model describes three main functions in a chain elongation microbiome; one group of microbes that can ferment carbohydrates to lactic acid but cannot perform chain elongation, other microbes that can perform chain elongation using lactic acid as an electron donor, and others that can perform chain elongation directly from carbohydrates (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>). This model, initially proposed based on experiments using xylose-rich organic residues from lignocellulosic ethanol production (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>), has been suggested for other substrates (<xref ref-type="bibr" rid="B13">Crognale et al., 2021</xref>; <xref ref-type="bibr" rid="B19">Fortney et al., 2021</xref>; <xref ref-type="bibr" rid="B33">Ingle et al., 2021</xref>), and there is emerging evidence of MCFA-producing microbes with the genomic capacity for producing MCFA from both lactic acid and carbohydrates (<xref ref-type="bibr" rid="B36">Kang et al., 2022</xref>; <xref ref-type="bibr" rid="B72">Wang et al., 2022</xref>). In other cases, it is proposed that ethanol can be used as an electron donor and act as an intermediate during MCFA production (<xref ref-type="bibr" rid="B1">Agler et al., 2012</xref>; <xref ref-type="bibr" rid="B43">Kucek et al., 2016a</xref>). To evaluate whether this microbial ecology model can be generalized to conceptually explain MCFA production from a variety of carbohydrate-rich organic residues, we evaluated the microbial communities that were enriched when the same inoculum was used in bioreactor experiments that fermented several agroindustrial residues, including thin stillage from starch ethanol production (<xref ref-type="bibr" rid="B19">Fortney et al., 2021</xref>; <xref ref-type="bibr" rid="B20">Fortney et al., 2022</xref>), thin stillage from cellulosic ethanol production (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>; <xref ref-type="bibr" rid="B60">Scarborough et al., 2020</xref>), xylose (<xref ref-type="bibr" rid="B61">Scarborough et al., 2022</xref>), dairy manure hydrolysate (<xref ref-type="bibr" rid="B33">Ingle et al., 2021</xref>; <xref ref-type="bibr" rid="B32">Ingle et al., 2022</xref>), and ultrafiltered milk permeate (<xref ref-type="bibr" rid="B71">Walters et al., 2022</xref>; <xref ref-type="bibr" rid="B70">Walters et al., 2023</xref>). In all cases, the inoculum was from an acid-phase anaerobic digester at the local wastewater treatment plant (Madison, WI, United States).</p>
<p>Here we present the comparison of metagenome assembled genomes (MAGs) from these bioreactors and examine the role of different microbial groups in the fermentation and chain elongation processes. For this analysis, we developed a script to identify genes encoding key metabolic enzymes in the MAGs and a machine learning algorithm to bin each MAG into relevant categories. This analysis revealed patterns showing that in fermentations in which MCFA is the primary product that accumulates, and the feedstock is a carbohydrate-rich substrate, the microbial ecology model that describes chain elongation occurring via utilization of intermediates or direct utilization of carbohydrates is applicable, even though different microorganisms were enriched depending on the agroindustrial residue tested.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>2 Materials and methods</title>
<sec id="s2-1">
<title>2.1 Metagenome assembled genome (MAG) sources</title>
<p>MAG data was obtained from previously published lab-scale bioreactor studies of microbial communities grown with various agroindustrial residues (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>; <xref ref-type="bibr" rid="B60">Scarborough et al., 2020</xref>; <xref ref-type="bibr" rid="B19">Fortney et al., 2021</xref>; <xref ref-type="bibr" rid="B33">Ingle et al., 2021</xref>; <xref ref-type="bibr" rid="B20">Fortney et al., 2022</xref>; <xref ref-type="bibr" rid="B32">Ingle et al., 2022</xref>; <xref ref-type="bibr" rid="B61">Scarborough et al., 2022</xref>; <xref ref-type="bibr" rid="B71">Walters et al., 2022</xref>). The operational conditions of the bioreactors are summarized in <xref ref-type="table" rid="T1">Table 1</xref> and additional information on sample collection can be found in the respective publications. MAGs were obtained from the inoculum source (two samples, 10 MAGs) (<xref ref-type="bibr" rid="B32">Ingle et al., 2022</xref>) and bioreactors fed cellulosic ethanol thin stillage (six samples, 10 MAGs) (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>; <xref ref-type="bibr" rid="B60">Scarborough et al., 2020</xref>), synthetic medium containing xylose as the primary carbon source (three samples, 8 MAGs) (<xref ref-type="bibr" rid="B61">Scarborough et al., 2022</xref>), hydrolysate from dairy manure (four samples, 38 MAGs) (<xref ref-type="bibr" rid="B33">Ingle et al., 2021</xref>; <xref ref-type="bibr" rid="B32">Ingle et al., 2022</xref>), ultra-filtered milk permeate (34 samples, 123 MAGs) (<xref ref-type="bibr" rid="B71">Walters et al., 2022</xref>; <xref ref-type="bibr" rid="B70">Walters et al., 2023</xref>), and starch ethanol thin stillage (31 samples, 51 MAGs) (<xref ref-type="bibr" rid="B19">Fortney et al., 2021</xref>; <xref ref-type="bibr" rid="B20">Fortney et al., 2022</xref>). In all cases, only the best-quality representative MAGs determined in each study were used. In total, we used an initial dataset of 240 MAGs from 80 total samples (Table S1).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Bioreactor operational conditions.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Feedstock</th>
<th align="center">Experiment<xref ref-type="table-fn" rid="Tfn1">
<sup>a</sup>
</xref>
</th>
<th align="center">Main organic substrates in the feedstock</th>
<th align="center">SRT<xref ref-type="table-fn" rid="Tfn2">
<sup>b</sup>
</xref> (days)</th>
<th align="center">HRT<xref ref-type="table-fn" rid="Tfn2">
<sup>b</sup>
</xref> (days)</th>
<th align="center">Temperature</th>
<th align="center">pH</th>
<th align="center">References</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Manure Hydrolysate</td>
<td align="center">Manure Hydrolysate</td>
<td align="center">glucose, xylose</td>
<td align="center">6</td>
<td align="center">6</td>
<td align="center">35&#xb0;C</td>
<td align="center">5.5</td>
<td align="center">
<xref ref-type="bibr" rid="B33">Ingle et al. (2021)</xref>
</td>
</tr>
<tr>
<td rowspan="2" align="center">Ultra-Filtered Milk Permeate</td>
<td align="center">Milk Permeate 1 (CSTR)</td>
<td align="center">lactose</td>
<td align="center">6</td>
<td align="center">6</td>
<td align="center">35&#xb0;C</td>
<td align="center">5.5</td>
<td align="center">
<xref ref-type="bibr" rid="B70">Walters et al. (2023)</xref>
</td>
</tr>
<tr>
<td align="center">Milk Permeate 2 (USB)</td>
<td align="center">lactose</td>
<td align="center">&#x3e;40</td>
<td align="center">0.5</td>
<td align="center">room temp</td>
<td align="center">5.5</td>
<td align="center">This Study</td>
</tr>
<tr>
<td align="center">Cellulosic EtOH Thin Stillage</td>
<td align="center">Cellulosic-EtOH Thin Stillage</td>
<td align="center">xylose</td>
<td align="center">6</td>
<td align="center">6</td>
<td align="center">35&#xb0;C</td>
<td align="center">5.5</td>
<td align="center">
<xref ref-type="bibr" rid="B58">Scarborough et al. (2018a),</xref> <xref ref-type="bibr" rid="B60">Scarborough et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="center">Xylose Synthetic Medium</td>
<td align="center">Xylose</td>
<td align="center">xylose</td>
<td align="center">6</td>
<td align="center">6</td>
<td align="center">35&#xb0;C</td>
<td align="center">5.5</td>
<td align="center">This Study</td>
</tr>
<tr>
<td rowspan="5" align="center">Starch EtOH Thin Stillage</td>
<td align="center">Starch-EtOH 1</td>
<td align="center">glycerol, carbohydrates, lactic acid</td>
<td align="center">6</td>
<td align="center">6</td>
<td align="center">35&#xb0;C</td>
<td align="center">5.5</td>
<td align="center">
<xref ref-type="bibr" rid="B19">Fortney et al. (2021)</xref>
</td>
</tr>
<tr>
<td align="center">SR-Starch-EtOH 2</td>
<td align="center">glycerol, carbohydrates, lactic acid</td>
<td align="center">6</td>
<td align="center">6</td>
<td align="center">35&#xb0;C</td>
<td align="center">5.5</td>
<td align="center">
<xref ref-type="bibr" rid="B19">Fortney et al. (2021)</xref>
</td>
</tr>
<tr>
<td align="center">SR-Starch-EtOH 3</td>
<td align="center">glycerol, carbohydrates, lactic acid</td>
<td align="center">1</td>
<td align="center">1</td>
<td align="center">35&#xb0;C</td>
<td align="center">5.5</td>
<td align="center">
<xref ref-type="bibr" rid="B19">Fortney et al. (2021)</xref>
</td>
</tr>
<tr>
<td align="center">SR-Starch-EtOH 4</td>
<td align="center">glycerol, carbohydrates, lactic acid</td>
<td align="center">6</td>
<td align="center">6</td>
<td align="center">55&#xb0;C</td>
<td align="center">5.0</td>
<td align="center">
<xref ref-type="bibr" rid="B19">Fortney et al. (2021)</xref>
</td>
</tr>
<tr>
<td align="center">SR-Starch-EtOH 5</td>
<td align="center">glycerol, carbohydrates, lactic acid</td>
<td align="center">1</td>
<td align="center">1</td>
<td align="center">55&#xb0;C</td>
<td align="center">5.0</td>
<td align="center">
<xref ref-type="bibr" rid="B19">Fortney et al. (2021)</xref>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn1">
<label>
<sup>a</sup>
</label>
<p>CSTR, continuously stirred tank reactor; USB, upflow sludge blanket reactor; SR, solids removed from the thin stillage by decanting.</p>
</fn>
<fn id="Tfn2">
<label>
<sup>b</sup>
</label>
<p>SRT, solid retention time; HRT, hydraulic retention time.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s2-2">
<title>2.2 MAG dereplication and taxonomic classification</title>
<p>The program dRep (v3.2.2; <italic>dereplicate</italic> command) (<xref ref-type="bibr" rid="B51">Olm et al., 2017</xref>) was used to identify redundant MAGs using default settings, except <italic>-conW</italic> was set to 0.5 and <italic>-N50W</italic> was set to 5. This reduced the total MAG number from 240 to 217 non-redundant MAGs (<xref ref-type="sec" rid="s10">Supplementary Table S2</xref>). CheckM (v1.0.11; <italic>lineage_wf</italic> and <italic>qa</italic> commands with default parameters) (<xref ref-type="bibr" rid="B52">Parks et al., 2015</xref>) was used to determine relevant quality parameters for each of the 217 MAGs (<xref ref-type="sec" rid="s10">Supplementary Table S2</xref>). All 217 MAGs were taxonomically classified using GTDB-Tk (v1.5.1; database release 202; <italic>classify_wf</italic> command with default parameters) (<xref ref-type="sec" rid="s10">Supplementary Table S3</xref>).</p>
</sec>
<sec id="s2-3">
<title>2.3 Alignment and relative abundance calculations</title>
<p>To predict the relative abundance of microorganisms represented by the 217-MAG dataset in samples from the different bioreactors, the genome FASTA files of all the MAGs were concatenated, and then Bowtie2 (v2.2.2 with default parameters) (<xref ref-type="bibr" rid="B45">Langmead and Salzberg, 2012</xref>) was used to align the FASTQ sequencing files. Resulting SAM files were converted into BAM files and sorted using samtools (v1.15.1; <italic>view</italic> and <italic>sort</italic> commands with default parameters) (<xref ref-type="bibr" rid="B47">Li et al., 2009</xref>). CoverM (v0.4.0; <italic>coverm genome</italic> command with default parameters) (<ext-link ext-link-type="uri" xlink:href="https://github.com/wwood/CoverM">https://github.com/wwood/CoverM</ext-link>) was used to generate relative abundance statistics of mapped reads in the sorted BAM files (<xref ref-type="sec" rid="s10">Supplementary Table S2</xref>). We identified 131 MAGs with at least 1% relative abundance in at least one sample across all experiments, which we define as the high-abundance MAG dataset (<xref ref-type="sec" rid="s10">Supplementary Table S4</xref>). A relative abundance of 1% has been used previously as an abundance threshold (<xref ref-type="bibr" rid="B17">Fitzgerald et al., 2015</xref>; <xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>; <xref ref-type="bibr" rid="B59">Scarborough et al., 2018b</xref>; <xref ref-type="bibr" rid="B60">Scarborough et al., 2020</xref>).</p>
</sec>
<sec id="s2-4">
<title>2.4 Phylogenetic analyses</title>
<p>Maximum likelihood phylogenetic trees were generated using RAxML-NG (v0.9.0; model LG &#x2b; G8&#x2b;F) (<xref ref-type="bibr" rid="B41">Kozlov et al., 2019</xref>) using 1,000 bootstraps. GTDB-Tk (v1.5.1; database release 202; <italic>ani_rep</italic> command with default parameters) (<xref ref-type="bibr" rid="B11">Chaumeil et al., 2019</xref>) was used to identify closest related genomes, which were downloaded from NCBI. The MAGs and closest genomes were compared using GTDB-Tk (<italic>identify</italic> and <italic>align</italic> commands with default parameters) using a set of 120 bacterial single-copy marker genes (Bac120) for all trees. <italic>Prevotella intermedia</italic> (GCF_001953955.1) was used as an outgroup to root the trees.</p>
<p>An additional analysis was performed to compare homologs of subunit B of the electron transfer flavoprotein (EtfB). For this, EtfB homologs were identified using known protein sequences (<xref ref-type="bibr" rid="B70">Walters et al., 2023</xref>) and tBLASTn (v2.8.1, default parameters) (<xref ref-type="bibr" rid="B7">Camacho et al., 2009</xref>) with &#x201c;pident&#x201d; (percent identity to the query sequence) &#x3e; 25% and &#x201c;qcovhsp&#x201d; (coverage of the query sequence) &#x3e; 70%. EtfB homologs were aligned using MUSCLE (v3.8.31, default parameters) and a phylogenetic tree was constructed using RAxML-NG using 500 boostraps. All files used in this analysis are available on GitHub (<ext-link ext-link-type="uri" xlink:href="https://github.com/GLBRC/agroindustrial_residue_metagenomics">https://github.com/GLBRC/agroindustrial_residue_metagenomics</ext-link>).</p>
</sec>
<sec id="s2-5">
<title>2.5 Non-metric multidimensional scaling plots</title>
<p>Non-metric multidimensional scaling (NMDS) plots were generated from the relative abundance calculations for the 217 non-redundant MAGs using R (v4.1.0) (Core Team, 2018). Specifically, the <italic>vegdist</italic> command with the &#x201c;<italic>bray</italic>&#x201d; index (from the vegan package, v2.6-4) was used to determine the distance metrics and the <italic>metaMDS</italic> command (from the vegan package, v2.6-4) was used to generate the NMDS values. Plots were constructed using ggplot2 (<xref ref-type="bibr" rid="B74">Wickham, 2016</xref>) from the NMDS values and edited for clarity using Adobe Illustrator (v27.2). Statistical comparisons were performed using permutation-based multivariate analysis of variance (PerMANOVA) via the <italic>adonis</italic> command (from the vegan package, v2.6-4) with &#x201c;<italic>euclidean&#x201d;</italic> distance and the Benjamini-Hochberg adjustment (adjusted <italic>p</italic>-value &#x3c;0.05 accepted as significant) (<xref ref-type="bibr" rid="B4">Benjamini and Hochberg, 1995</xref>; <xref ref-type="bibr" rid="B2">Anderson, 2017</xref>). The R script used to generate the NMDS plot is available on GitHub (GitHub page: <ext-link ext-link-type="uri" xlink:href="https://github.com/GLBRC/agroindustrial_residue_metagenomics">https://github.com/GLBRC/agroindustrial_residue_metagenomics</ext-link>).</p>
</sec>
<sec id="s2-6">
<title>2.6 Homology-based gene identification</title>
<p>A homology-based analysis was performed to identify genes encoding enzymes of fermentation and central carbon metabolism in each MAG. The query protein sequences used were manually vetted through either EcoCyc (<xref ref-type="bibr" rid="B38">Keseler et al., 2011</xref>), MetaCyc (<xref ref-type="bibr" rid="B9">Caspi et al., 2020</xref>), SWISS-PROT via UniProtKB (<xref ref-type="bibr" rid="B6">Boutet et al., 2016</xref>), or other published datasets. Query protein amino acid sequences and metadata were downloaded from the UniProtKB database. tBLASTn (v2.8.1) (<xref ref-type="bibr" rid="B7">Camacho et al., 2009</xref>) was used to identify homologs using default parameters. Subject sequences that had an e-value less than 1 &#xd7; 10<sup>&#x2212;10</sup>, a &#x201c;pident&#x201d; (percent identity to the query sequence) value greater than 25%, and a &#x201c;qcovhsp&#x201d; (coverage of the query sequence) value greater than 70% were used to determine gene homologs (<xref ref-type="sec" rid="s10">Supplementary Table S5</xref>). All files and scripts are available on GitHub (GitHub page: <ext-link ext-link-type="uri" xlink:href="https://github.com/GLBRC/agroindustrial_residue_metagenomics">https://github.com/GLBRC/agroindustrial_residue_metagenomics</ext-link>).</p>
</sec>
<sec id="s2-7">
<title>2.7 Multiclass classification machine learning algorithm</title>
<p>MAGs were classified into four functional groups. The first group, &#x201c;Ferment to Intermediates&#x201d;, consists of MAGs that ferment carbohydrates into intermediate extracellular products, such as ethanol or lactic acid. The second group, &#x201c;Intermediate Chain Elongators&#x201d;, consists of MAGs that convert intermediate extracellular products (e.g., ethanol or lactic acid) into medium chain fatty acids (MCFAs) using reverse &#xdf;-oxidation. The third group, &#x201c;Carbohydrate Chain Elongators&#x201d;, consists of MAGs that ferment carbohydrates directly into MCFAs. A fourth group, &#x201c;uninvolved&#x201d;, was used to bin MAGs that could not be classified into the three functional groups.</p>
<p>Multiclass classification machine learning was utilized to categorize the MAGs based on gene homologs of key fermentation pathways that were detected. A training set was constructed using organisms known to fit into one of the four groups (<xref ref-type="sec" rid="s10">Supplementary Table S6</xref>). <italic>Bifidobacterium</italic> species and lactic acid bacteria were used for the Ferment to Intermediates training set (<xref ref-type="bibr" rid="B50">Okada et al., 1979</xref>; <xref ref-type="bibr" rid="B54">Pokusaeva et al., 2011</xref>; <xref ref-type="bibr" rid="B56">Pruckler et al., 2015</xref>; <xref ref-type="bibr" rid="B65">Tanner et al., 2016</xref>; <xref ref-type="bibr" rid="B15">Eckel and Vogel, 2020</xref>; <xref ref-type="bibr" rid="B16">Ferrero et al., 2021</xref>; <xref ref-type="bibr" rid="B37">Kasmaei et al., 2022</xref>; <xref ref-type="bibr" rid="B42">Ksiezarek et al., 2022</xref>), <italic>Clostridium</italic> and <italic>Megasphaera</italic> species were used for the Intermediate Chain Elongators training set (<xref ref-type="bibr" rid="B69">Wallace et al., 2003</xref>; <xref ref-type="bibr" rid="B63">Seedorf et al., 2008</xref>; <xref ref-type="bibr" rid="B34">Jeon et al., 2017</xref>; <xref ref-type="bibr" rid="B40">Kobayashi et al., 2017</xref>; <xref ref-type="bibr" rid="B66">Tao et al., 2017</xref>; <xref ref-type="bibr" rid="B75">Yang et al., 2018</xref>; <xref ref-type="bibr" rid="B76">Yoshikawa et al., 2018</xref>; <xref ref-type="bibr" rid="B48">Litty and Muller, 2021</xref>), <italic>Caproicibacter</italic> and <italic>Roseburia</italic> species were used for the Carbohydrate Chain Elongators training set (<xref ref-type="bibr" rid="B39">Kim et al., 2015</xref>; <xref ref-type="bibr" rid="B64">Tamanai-Shacoori et al., 2017</xref>; <xref ref-type="bibr" rid="B18">Flaiz et al., 2020</xref>; <xref ref-type="bibr" rid="B62">Schoelmerich et al., 2020</xref>), and <italic>Acetobacter, Prevotella,</italic> and <italic>Sphaerochaeta</italic> species were used for the uninvolved training set.</p>
<p>Multiple multiclass classification machine learning algorithms were tested using the auto_ml module (v2.9.10) (<ext-link ext-link-type="uri" xlink:href="https://github.com/ClimbsRocks/auto_ml">https://github.com/ClimbsRocks/auto_ml</ext-link>). The algorithms tested against baseline were <italic>Decision Tree</italic> (<xref ref-type="bibr" rid="B53">Pedregosa et al., 2011</xref>), <italic>Random Forest</italic> (<xref ref-type="bibr" rid="B53">Pedregosa et al., 2011</xref>), <italic>Linear Regression</italic> (<xref ref-type="bibr" rid="B53">Pedregosa et al., 2011</xref>), <italic>XGBoost</italic> (<ext-link ext-link-type="uri" xlink:href="https://xgboost.readthedocs.io/en/stable/index.html">https://xgboost.readthedocs.io/en/stable/index.html</ext-link>), <italic>Neural Network</italic> (<xref ref-type="bibr" rid="B53">Pedregosa et al., 2011</xref>), <italic>Nearest Neighbors</italic> (<xref ref-type="bibr" rid="B53">Pedregosa et al., 2011</xref>), <italic>Extra Trees</italic> (<xref ref-type="bibr" rid="B53">Pedregosa et al., 2011</xref>), <italic>CatBoost</italic> (<xref ref-type="bibr" rid="B55">Prokhorenkova et al., 2018</xref>), and <italic>LightGBM</italic> (<xref ref-type="bibr" rid="B77">Zhang et al., 2017</xref>). The machine learning algorithms were evaluated for correct classification of training set genomes into functional groups using multiple analyses: the logloss metric (-log(<italic>p</italic>), where <italic>p</italic> is the probability of correctly categorizing the training set) (<xref ref-type="bibr" rid="B5">Bian and Tao, 2011</xref>) for each algorithm compared to the baseline value of no algorithm, precision-recall (PR) curves for each algorithm and receiver operating characteristic (ROC) curves for each algorithm (<xref ref-type="bibr" rid="B28">Haibo and Garcia, 2009</xref>). These evaluations showed that using the <italic>LightGBM</italic> model provided the largest decrease in logloss metric (a 99.91% improvement compared to baseline alone) while maximizing true positives and minimizing false positives. The script, files used for the machine learning analysis, and the results of the multiclass classification machine learning analysis are available on GitHub (GitHub page: <ext-link ext-link-type="uri" xlink:href="https://github.com/GLBRC/agroindustrial_residue_metagenomics">https://github.com/GLBRC/agroindustrial_residue_metagenomics</ext-link>).</p>
</sec>
<sec id="s2-8">
<title>2.9 Hierarchical clustering</title>
<p>MAGs were classified into predicted functional groups using hierarchical clustering based on the detected genes in metabolic pathways important in MCFA production (<xref ref-type="bibr" rid="B70">Walters et al., 2023</xref>). Hierarchical clustering was performed in R (v4.1.0) (Core Team, 2018) using the gplots R package (v3.1.3, heatmap.2 command with default parameters, <ext-link ext-link-type="uri" xlink:href="https://github.com/talgalili/gplots/">https://github.com/talgalili/gplots/</ext-link>). MAGs were classified using the hierarchical clustering results in the Ferment to Intermediates group if they had high percentage of genes detected in the bifid shunt or phosphoketolase pathways and low percentage of genes detected in the lactic acid utilization and reverse &#xdf;-oxidation pathways, in the Intermediate Chain Elongators group if they had low percentage of genes detected in the bifid shunt or phosphoketolase pathways and high percentage of genes detected in the lactic acid utilization and reverse &#xdf;-oxidation pathways, and in the Carbohydrate Chain Elongators group if they had low percentage of genes detected in the bifid shunt, phosphoketolase, and lactic acid utilization pathways but high percentage of genes detected in the reverse &#xdf;-oxidation pathway (<xref ref-type="sec" rid="s10">Supplementary Table S2</xref>). The script, files used, and results of this analysis are available on GitHub (GitHub page: <ext-link ext-link-type="uri" xlink:href="https://github.com/GLBRC/agroindustrial_residue_metagenomics">https://github.com/GLBRC/agroindustrial_residue_metagenomics</ext-link>).</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Analysis of the non-redundant MAG dataset</title>
<p>For this study we used MAGs assembled from 10 different bioreactors that were fed various agroindustrial residues (<xref ref-type="fig" rid="F1">Figure 1</xref>). The microbial communities that were enriched in these bioreactors originated from the same inoculum source, an acid-phase anaerobic digester used in the solids handling treatment train at the local wastewater treatment plant (Madison, WI, United States). In addition to the type of agroindustrial residue used as the feedstock, parameters such as temperature and pH were also different in some bioreactor experiments (<xref ref-type="table" rid="T1">Table 1</xref>). Bioreactor performance has been described elsewhere for a bioreactor fed xylose-rich thin stillage from cellulosic ethanol production (<xref ref-type="bibr" rid="B59">Scarborough et al., 2018b</xref>), one fed a carbohydrate-rich hydrolysate created from chemical pretreatment of dairy manure (<xref ref-type="bibr" rid="B33">Ingle et al., 2021</xref>), five bioreactors fed thin stillage from starch ethanol biorefining (<xref ref-type="bibr" rid="B19">Fortney et al., 2021</xref>), and one bioreactor fed lactose-rich ultra-filtered milk permeate (<xref ref-type="bibr" rid="B70">Walters et al., 2023</xref>). Two additional bioreactors complete the set of 10 bioreactors used in this study; one fed a xylose-rich synthetic medium and a second one operated with ultra-filtered milk permeate as the feedstock. The MAGs assembled from all of the bioreactors have been reported and are publicly available (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>; <xref ref-type="bibr" rid="B20">Fortney et al., 2022</xref>; <xref ref-type="bibr" rid="B32">Ingle et al., 2022</xref>; <xref ref-type="bibr" rid="B61">Scarborough et al., 2022</xref>; <xref ref-type="bibr" rid="B71">Walters et al., 2022</xref>). The main fermentation products that accumulated in the medium of these bioreactors include lactic and succinic acids, ethanol, as well as the short chain fatty acids (SCFAs) acetic and propionic acids and the MCFAs butyric, hexanoic, and octanoic acids (<xref ref-type="fig" rid="F2">Figure 2</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Overview of bioreactors operated with the different agroindustrial feedstocks and their contribution to the non-redundant MAG dataset. <bold>(A)</bold> Graphical overview of inoculum source and enrichments with different feedstocks, indicating the number of MAGs assembled from each source. All reactors were completely mixed flow-through reactors, except for Milk Permeate 2, which was an upflow sludge blanket reactor. See <xref ref-type="table" rid="T1">Table 1</xref> for operational conditions. <bold>(B)</bold> Flow chart indicating how the MAGs were filtered for this work. From a total of 240 MAGs, dRep (<xref ref-type="bibr" rid="B51">Olm et al., 2017</xref>) was used to identify redundant MAGs and define a set of 217 non-redundant MAGs. Abundance was then used to define a set of 131 high-abundance and non-redundant MAGs.</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g001.tif"/>
</fig>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Summary of extracellular fermentation products that accumulated in the bioreactors. Product concentrations, measured in chemical oxygen demand (COD) per liter, are summarized into four groups, indicating maximum concentrations measured during the course of the experiments: &#x3c;0.1&#xa0;g COD/L (light grey), between 0.1 and 2&#xa0;g COD/L (blue), between 2&#xa0;g COD/L and 10&#xa0;g COD/L (red), &#x3e;10&#xa0;g COD/L (yellow).</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g002.tif"/>
</fig>
<p>Combined, there are a total of 240 MAGs across these bioreactors (<xref ref-type="fig" rid="F1">Figure 1B</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S1</xref>). Given the similarities in the inoculum source and in the accumulated fermentation products, we hypothesized that the MAGs assembled from these microbial communities would have a high degree of similarity. However, when the program dRep (<xref ref-type="bibr" rid="B51">Olm et al., 2017</xref>) was used to identify MAGs with at least 99% average nucleotide identity (ANI), only 23 MAGs were highly similar among the 240 MAGs (<xref ref-type="fig" rid="F1">Figure 1B</xref>; Table S1). This dereplication analysis resulted in a library of 217 non-redundant MAGs that we used to further evaluate the microbial communities in the bioreactors (<xref ref-type="sec" rid="s10">Supplementary Table S2</xref>).</p>
<p>This collection of 217 non-redundant MAGs represented median relative abundances ranging from 63.5% to 90.3% in the bioreactor samples, but a median relative abundance of only 11.6% for the inoculum (<xref ref-type="table" rid="T2">Table 2</xref>). The low percentage for the inoculum indicates that most of the 217 MAGs in the library represented microbial community members that were not abundant in the acid-phase digester inoculum, but were instead enriched during the operation of the bioreactors.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Relative abundance of all 217 non-redundant MAGs across all experiments.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Experiment</th>
<th align="center">Number of MAGs detected as present<xref ref-type="table-fn" rid="Tfn3">
<sup>a</sup>
</xref>
</th>
<th align="center">Min-max relative abundance range<sup>b</sup> (%)</th>
<th align="center">Median relative abundance (%)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Inoculum</td>
<td align="center">21</td>
<td align="center">10.3&#x2013;13.0</td>
<td align="center">11.6</td>
</tr>
<tr>
<td align="center">Manure Hydrolysate</td>
<td align="center">99</td>
<td align="center">68.9&#x2013;77.9</td>
<td align="center">74.7</td>
</tr>
<tr>
<td align="center">Milk Permeate 1</td>
<td align="center">148</td>
<td align="center">9.3&#x2013;91.1</td>
<td align="center">74.6</td>
</tr>
<tr>
<td align="center">Milk Permeate 2</td>
<td align="center">139</td>
<td align="center">7.9&#x2013;80.1</td>
<td align="center">69.2</td>
</tr>
<tr>
<td align="center">Cellulosic EtOH Thin Stillage</td>
<td align="center">75</td>
<td align="center">33.0&#x2013;87.3</td>
<td align="center">86.6</td>
</tr>
<tr>
<td align="center">Xylose</td>
<td align="center">21</td>
<td align="center">88.0&#x2013;88.5</td>
<td align="center">88.5</td>
</tr>
<tr>
<td align="center">Starch-EtOH 1</td>
<td align="center">100</td>
<td align="center">8.5&#x2013;87.0</td>
<td align="center">63.5</td>
</tr>
<tr>
<td align="center">SR-Starch-EtOH 2</td>
<td align="center">55</td>
<td align="center">87.9&#x2013;92.6</td>
<td align="center">90.3</td>
</tr>
<tr>
<td align="center">SR-Starch-EtOH 3</td>
<td align="center">52</td>
<td align="center">80.8&#x2013;88.8</td>
<td align="center">85.2</td>
</tr>
<tr>
<td align="center">SR-Starch-EtOH 4</td>
<td align="center">53</td>
<td align="center">84.6&#x2013;89.7</td>
<td align="center">86.1</td>
</tr>
<tr>
<td align="center">SR-Starch-EtOH 5</td>
<td align="center">24</td>
<td align="center">74.9&#x2014;77.4</td>
<td align="center">76.4</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn3">
<label>
<sup>
<bold>a</bold>
</sup>
</label>
<p>A MAG was defined to be present in a sample if the relative abundance was greater than 0%.</p>
</fn>
<fn id="Tfn4">
<label>
<sup>b</sup>
</label>
<p>Minimum and maximum relative abundances represented by the non-redundant MAG dataset among all the samples from each bioreactor experiment and from the inoculum samples.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>A non-metric multidimensional scaling (NMDS) analysis of the relative abundance of MAGs in the analyzed samples reveals divergence in the microorganisms that were enriched during growth in the different agroindustrial residues (<xref ref-type="fig" rid="F3">Figure 3</xref>). The lack of overlap of the abundant MAGs among agroindustrial residue media used indicates that the media played a large role in shaping the microbial communities in these bioreactors. The dataset includes samples collected from bioreactors operated with the same agroindustrial residue but different operational conditions. In these cases, the NDMS plot suggests that agroindustrial residue used had a larger impact in shaping the microbial community compared to the operational condition. For example, several bioreactors were operated using starch ethanol thin stillage (<xref ref-type="bibr" rid="B19">Fortney et al., 2021</xref>), and in the NDMS plot (<xref ref-type="fig" rid="F3">Figure 3</xref>) the samples from these bioreactors clustered together and separate from the samples from bioreactors that used other agroindustrial residues (adjusted <italic>p</italic>-value &#x3c;0.05). The dataset also includes samples collected from bioreactors operated under identical conditions but receiving different agroindustrial residues. This is the case for the Milk Permeate 1, Xylose, and the Starch-EtOH 1 experiments (<xref ref-type="fig" rid="F3">Figure 3</xref>). Although they were all operated under identical conditions, there is no overlap of the abundant MAGs from these reactors in the NDMS plot (adjusted <italic>p</italic>-value &#x3c;0.05), supporting the argument that the agroindustrial residue used had a larger impact in the microbial communities than the operational conditions used.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Non-metric multidimensional scaling (NMDS) plot of the relative abundances of the microbial communities using the 217 non-redundant MAGs across all experiments over all measured time points (stress value 0.17). Samples from different bioreactor experiments are color coded according to the key. Ovals represent the standard deviation of the average value for all samples from each bioreactor experiment and are color coded according to the key. Samples that were taken at the time of inoculation are marked with &#x2018;0&#x2019;. See <xref ref-type="table" rid="T1">Table 1</xref> for description of bioreactor operational conditions and definition of experiment names.</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g003.tif"/>
</fig>
<p>The set of non-redundant MAGs has a diverse composition (<xref ref-type="table" rid="T3">Table 3</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S3</xref>), with MAGs belonging to eight phyla and 12 families within these phyla. 24 MAGs were classified to the genus level based on the coverage in the metagenomic data sets. In addition, this non-redundant set includes MAGs assembled with short-read Illumina (149 MAGs) and long-read PacBio technologies (68 MAGs). Estimates of completion and contamination in this dataset are greater than 75% and less than 7.5%, respectively. The MAGs resulting from Illumina sequencing had assemblies with 1&#x2013;558 contigs, whereas the MAGs obtained from PacBio sequencing were assembled in 1&#x2013;44 contigs (<xref ref-type="table" rid="T3">Table 3</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S2</xref>).</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>General information on the 217&#xa0;MAGs.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Characteristic</th>
<th align="left">Value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Phyla Identified</td>
<td align="left">8</td>
</tr>
<tr>
<td align="left">Families Identified</td>
<td align="left">12</td>
</tr>
<tr>
<td align="left">Genera Identified</td>
<td align="left">24</td>
</tr>
<tr>
<td align="left">Illumina Total (contig range)</td>
<td align="left">149 (1-558)</td>
</tr>
<tr>
<td align="left">PacBio Total (contig range)</td>
<td align="left">68 (1-44)</td>
</tr>
<tr>
<td align="left">Completion Minimum</td>
<td align="left">75%</td>
</tr>
<tr>
<td align="left">Contamination Maximum</td>
<td align="left">7.5%</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-2">
<title>3.2 Enzymes in metabolic pathways identified in the non-redundant MAG dataset</title>
<p>We sought to make predictions on the role of different members of the microbial communities enriched in the bioreactors and to evaluate the microbial ecology model for MCFA production that hypothesizes the presence of some community members that produce MCFA directly from carbohydrates (Carbohydrate Chain Elongators), other community members that produce MCFA from lactic acid or ethanol as intermediate fermentation products (Intermediate Chain Elongators), and other community members that produce these intermediate products but do not perform chain elongation (Ferment to Intermediates) (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>). To this end, we queried the MAGs for the presence of homologs of individual proteins present in different fermentation pathways (<xref ref-type="fig" rid="F4">Figure 4</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S5</xref>) (<xref ref-type="bibr" rid="B70">Walters et al., 2023</xref>). This allowed categorization of MAGs by association of similar patterns of the presence of homologous proteins from each metabolic pathway examined. Using the hierarchical clustering of the MAGs based on the percentage of homologs present per pathway, we categorized the MAGs into the functional groups. Based on this analysis, 79 MAGs are predicted to ferment carbohydrates to intermediate products (Ferment to Intermediates), 59 MAGs are predicted to produce MCFA from the intermediate products (Intermediate Chain Elongators), and 13 MAGs are predicted to produce MCFA from carbohydrates (Carbohydrate Chain Elongators, <xref ref-type="fig" rid="F4">Figure 4</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S2</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Clustering 217 MAGs using metabolic pathways. Identified homologous proteins in the indicated metabolic pathways (columns) for each of the 217 non-redundant MAGs (rows). Colors represent the percentage of protein homologs for each pathway for each MAG as indicated in the key. The MAGs were hierarchically clustered resulting the dendrogram on the left. Functional group assignments based on hierarchical clustering is indicated on the left, and color coded as Ferment to Intermediates (blue), Intermediate Chain Elongators (green), Carbohydrate Chain Elongators (red), and uninvolved in MCFA production (purple).</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g004.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>3.3 Machine learning-based classification</title>
<p>We also wanted to test if we could use multiclass classification machine learning to generate similar predictions, as a way to evaluate large MAG datasets quickly and to remove any bias in functional assignments based on enzyme assignments. For this evaluation, we constructed a training set of isolated organisms predicted to perform the three specific functions in the model, plus organisms not known or likely to participate in these activities (<xref ref-type="sec" rid="s10">Supplementary Table S6</xref>). As input to the machine learning algorithm, we used the information gathered about detection of protein homologs in the metabolic pathways relevant to the ecological model (<xref ref-type="sec" rid="s10">Supplementary Table S5</xref>). The training set was then used to investigate a number of possible multiclass classification machine learning algorithms, with the <italic>LightGBM</italic> algorithm (<xref ref-type="bibr" rid="B77">Zhang et al., 2017</xref>) producing the best results of binning the genomes into the correct functional groups based on multiple methods of evaluation (logloss comparison to baseline, PR curve, and ROC curve).</p>
<p>To evaluate the machine learning multiclass classifications, a subset of the most abundant MAGs was selected for further analysis. The 217 non-redundant MAGs across the experiments were filtered to include only MAGs with at least 1% relative abundance in at least one experiment sample (<xref ref-type="fig" rid="F1">Figure 1B</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S4</xref>). The resultant 131 high-abundance MAGs include ones assembled from short read Illumina technology (74 MAGs) and long read PacBio technology (57 MAGs) and were categorized into one of four functional groups using the trained multiclass machine learning model. Overall, 63 MAGs were predicted as being able to ferment carbohydrates to intermediate products (Ferment to Intermediates), 17 MAGs were predicted as being able to convert intermediate products to MCFAs (Intermediate Chain Elongators), 12 MAGs were categorized as being able to ferment carbohydrates to MCFAs (Carbohydrate Chain Elongators), and 39 MAGs were predicted not to be involved in MCFA production (<xref ref-type="fig" rid="F5">Figure 5A</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S4</xref>). The MAGs in each category were derived from several different agroindustrial residue experiments (<xref ref-type="fig" rid="F5">Figure 5B</xref>), showing that similar functions occurred with the different agroindustrial residues.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Summary of machine learning categorization. <bold>(A)</bold> Distribution of the 131 MAGs in the different functional groups used for machine learning classification. <bold>(B)</bold> Distribution of the 131 MAGs according to the experiment from which each was identified in according to how they were classified in by machine learning. Venn diagrams show comparison of the hierarchical pathway clustering classification and the machine learning classification for Ferment to Intermediates group <bold>(C)</bold>, the Intermediate Chain Elongators group <bold>(D)</bold>, and the Carbohydrate Chain Elongators group <bold>(E)</bold>. Only MAGs present with at least 1% relative abundance in at least one sample across all experiments are included in the comparison analysis.</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g005.tif"/>
</fig>
<p>Comparison of the MAGs classified into the functional groups by the machine learning algorithm to classification by hierarchical pathway clustering reveals differences based on the approaches (<xref ref-type="fig" rid="F5">Figures 5C&#x2013;E</xref>). The Ferment to Intermediates group shows a large amount of overlap between the two methods (<xref ref-type="fig" rid="F5">Figure 5C</xref>). The hierarchical pathway clustering method identified more MAGs than the machine learning algorithm for the Intermediate Chain Elongators group while there was little overlap among the methods for the Carbohydrate Chain Elongators group (<xref ref-type="fig" rid="F5">Figures 5D, E</xref>).</p>
<p>Focusing on the machine learning classification, and to further investigate the MAGs present in functional groups responsible MCFA production, phylogenetic trees were constructed comparing the genomes used in the training set and the MAGs classified into each functional group (<xref ref-type="fig" rid="F6">Figures 6</xref>&#x2013;<xref ref-type="fig" rid="F8">8</xref>). The MAGs were taxonomically classified using GTDB-Tk (<xref ref-type="bibr" rid="B11">Chaumeil et al., 2019</xref>). For each functional group examined, we found multiple taxonomic groups across taxonomic levels, ranging from phyla to family (<xref ref-type="fig" rid="F6">Figures 6</xref>&#x2013;<xref ref-type="fig" rid="F8">8</xref>). Indeed, a subset of the MAGs in groups share no overlap at the class or family level with genomes in the training set, suggesting the machine learning algorithm is identifying new taxonomic groups that may perform the specific biological function.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Phylogenetic tree of MAGs classified in the Ferment to Intermediates group and the genomes used in the training set. A maximum-likelihood phylogenetic tree constructed using RAxML-NG (<xref ref-type="bibr" rid="B41">Kozlov et al., 2019</xref>) with 1,000 bootstraps (values &#x3e;50 shown) and using the 120 bacterial housekeeping gene concatenations generated by GTDB-Tk (<xref ref-type="bibr" rid="B11">Chaumeil et al., 2019</xref>). Taxonomic classification performed using GTDB-Tk (database version 202) (<xref ref-type="bibr" rid="B11">Chaumeil et al., 2019</xref>). The scale bar indicates the number of nucleotide substitutions per sequence site. Genomes used in the training set are shown (labeled Training Set) and NCBI Accession Numbers are found in <xref ref-type="sec" rid="s10">Supplementary Table S6</xref>. Color dots indicate experiment the MAG was identified in (experiments with no MAGs present in the tree are not shown). <italic>Ba.</italic>, <italic>Bacteroidota</italic>; <italic>Pro., Proteobacteria.</italic>
</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g006.tif"/>
</fig>
</sec>
<sec id="s3-4">
<title>3.4 MAGs predicted to participate in fermentation to intermediate products</title>
<p>The majority of the MAGs predicted in the Ferment to Intermediates group belonged to the <italic>Lactobacillaceae</italic>, <italic>Bifidobacteriaceae</italic>, and <italic>Atopobiaceae</italic> families (<xref ref-type="fig" rid="F6">Figure 6</xref>). In general, the MAGs in <italic>Bifidobacteriaceae</italic> and <italic>Lactobacillaceae</italic> clustered with the genomes from the same taxonomic group used in the training set. Further, the machine learning algorithm classified MAGs of the <italic>Atopobiaceae</italic> family into this group, despite no member of this family being present in the training set. A small subset of the MAGs in this functional group belonged to other taxonomic groups: class <italic>Bacilli</italic> (3 MAGs) and phylum <italic>Proteobacteria</italic> (3 MAGs) (<xref ref-type="fig" rid="F6">Figure 6</xref>).</p>
</sec>
<sec id="s3-5">
<title>3.5 MAGs predicted to participate in chain elongation from intermediate products</title>
<p>The majority of the MAGs in the Intermediate Chain Elongators group, predicted to convert fermentation intermediates into MCFAs, were predicted to belong to five families: <italic>Megasphaeraceae, Acidaminococcaceae</italic>, <italic>Clostridiaceae</italic>, <italic>Anaerovoracaceae</italic>, and <italic>Eubacteriaceae</italic> (<xref ref-type="fig" rid="F7">Figure 7</xref>). This included a MAG (UW_SG_EUB1, <italic>Ca.</italic> Pseudoramibacter fermentans) that was studied at the transcriptomic level and predicted to ferment intermediates into MCFAs (<xref ref-type="bibr" rid="B60">Scarborough et al., 2020</xref>). The MAGs in four of the five families were clustered with genomes in the same families used in the training set. However, there were no genomes in the training set that belonged to the family <italic>Acidaminococcaceae, Lachnospiraceae</italic>, or <italic>Oscillospiraceae</italic>. Two MAGs belonged to phylum <italic>Bacteroidota</italic> (order <italic>Bacteroidales</italic>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Phylogenetic tree of MAGs classified in the Intermediate Chain Elongators group and genomes used in the training set. A maximum-likelihood phylogenetic tree constructed using RAxML-NG (<xref ref-type="bibr" rid="B41">Kozlov et al., 2019</xref>) with 1,000 bootstraps (values &#x3e;50 shown) and using the 120 bacterial housekeeping gene concatenations generated by GTDB-Tk (<xref ref-type="bibr" rid="B11">Chaumeil et al., 2019</xref>). Taxonomic classification performed using GTDB-Tk (database version 202) (<xref ref-type="bibr" rid="B11">Chaumeil et al., 2019</xref>). The scale bar indicates the number of nucleotide substitutions per sequence site. Genomes used in the training set for this group are shown (labeled Training Set) and NCBI Accession Numbers are found in <xref ref-type="sec" rid="s10">Supplementary Table S6</xref>. Color dots indicate experiment the MAG was identified in (experiments with no MAGs present in the tree are not shown). <italic>Ba.</italic>, <italic>Bacteroidota</italic>; <italic>Acida., Acidaminococcales; Acida., Acidaminococcaceae; Peptostr., Peptostreptococcales; Anaerov., Anaerovoracaceae; Eubacteriac., Eubacteriaceae; Ls., Lachnospirales; La., Lachnospiraceae; Oscil., Oscillospirales; Os. Oscillospiraceae</italic>.</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g007.tif"/>
</fig>
</sec>
<sec id="s3-6">
<title>3.6 MAGs predicted to participate in chain elongation from carbohydrates</title>
<p>The MAGs predicted to belong to the Carbohydrate Chain Elongators group, ones which convert carbohydrates directly to MCFAs, belonged primarily to two families: <italic>Lachnospiraceae</italic> and <italic>Acutalibacteraceae</italic> (<xref ref-type="fig" rid="F8">Figure 8</xref>). Included in this group is a MAG (UW_SG_LCO1, <italic>Ca.</italic> Weimeria bifida) previously studied in-depth and suggested to perform chain elongation from carbohydrate substrates (<xref ref-type="bibr" rid="B60">Scarborough et al., 2020</xref>). Seven of the MAGs present in the Carbohydrate Chain Elongators group belonged to other taxonomic groups: class <italic>Bacilli</italic>, class <italic>Clostridia</italic> as well as phyla <italic>Proteobacteria</italic> and <italic>Spirochaetota</italic> (<xref ref-type="fig" rid="F8">Figure 8</xref>).</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Phylogenetic tree of MAGs classified in the Carbohydrate Chain Elongators group and genomes used in the training set. A maximum-likelihood phylogenetic tree constructed using RAxML-NG (<xref ref-type="bibr" rid="B41">Kozlov et al., 2019</xref>) with 1,000 bootstraps (values &#x3e;50 shown) and using the 120 bacterial housekeeping gene concatenations generated by GTDB-Tk (<xref ref-type="bibr" rid="B11">Chaumeil et al., 2019</xref>). Taxonomic classification performed using GTDB-Tk (database version 202) (<xref ref-type="bibr" rid="B11">Chaumeil et al., 2019</xref>). The scale bar indicates the number of nucleotide substitutions per sequence site. Genomes used in the training set for this group are shown (labeled Training Set) and NCBI Accession Numbers are found in <xref ref-type="sec" rid="s10">Supplementary Table S6</xref>. Color dots indicate experiment the MAG was identified in (experiments with no MAGs present in the tree are not shown). <italic>Ba.</italic>, <italic>Bacteroidota</italic>; <italic>Pro., Proteobacteria; Baci., Bacillales; So., Sporolactobacillaceae; Bl., Bacillaceae; Acutalibacter., Acutalibacteraceae; Cl., Clostridiales; Co., Clostridiaceae; Sp., Spirochaetota.</italic>
</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g008.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<p>We have used a dataset of over 200 MAGs from 10 previously published bioreactor experiments to evaluate the prevalence of the emerging microbial ecological model for chain elongation microbiomes. In this model, MCFAs can be produced either from intermediates, such as lactic acid, or directly from carbohydrates. Using machine learning and protein homology predictions, we find that this ecology model is conserved across various microbial communities from bioreactors fed various carbohydrate rich agroindustrial residues. While the MAGs assembled from each microbial community were not found to be identical in terms of sequence similarity, the biological functions of the microbial communities are predicted to be maintained in MAGs from various taxonomic groups with different relative abundances (<xref ref-type="fig" rid="F9">Figure 9</xref>). Below we discuss observations about the organisms classified into each group.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Cumulative relative abundances for taxa within each group reveal common biological functions across agroindustrial residues. Cumulative relative abundances for each taxa across the 10 experiments for MAGs classified in the Ferment to Intermediates group, the Intermediate Chain Elongators group, and the Carbohydrate Chain Elongators group as labeled. For each panel, the heat map represents the cumulative relative abundance, with white indicating a cumulative relative abundance &#x3c;1. Asterisks indicate taxa present in the machine learning training set. MCFA, Medium Chain Fatty Acid.</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g009.tif"/>
</fig>
<sec id="s4-1">
<title>4.1 A taxonomically diverse set of MAGs is predicted to ferment carbohydrates to intermediates</title>
<p>The Ferment to Intermediates functional group was comprised of many MAGs classified in the phylum <italic>Firmicutes</italic>, specifically lactic acid bacteria, which are associated with carbohydrate fermentation to lactic acid and other intermediates (<xref ref-type="bibr" rid="B24">Garde et al., 2002</xref>; <xref ref-type="bibr" rid="B21">Ganzle and Follador, 2012</xref>; <xref ref-type="bibr" rid="B22">G&#xe4;nzle, 2015</xref>; <xref ref-type="bibr" rid="B79">Zhang and Vadlani, 2015</xref>). Indeed, <italic>Firmicutes,</italic> specifically those in the family <italic>Lactobacillaceae</italic>, make up a large portion of the microbial community in most of the bioreactors analyzed when using cumulative relative genomic abundance as a measure (<xref ref-type="fig" rid="F9">Figure 9</xref>), suggesting MAGs in this phylum may play a key role in fermentation to intermediates across the agroindustrial residues examined. There were other taxonomic groups classified in this group. MAGs from both family <italic>Atopobiaceae</italic> and family <italic>Bifidobacteriaceae</italic> (phylum <italic>Actinobacteriota</italic>) were found to be fairly abundant in a subset of the experiments, specifically Milk Permeate 1 and 2, as well as Cellulosic Ethanol Thin Stillage and Xylose (<xref ref-type="fig" rid="F9">Figure 9</xref>), which supports previous observations of the relationship between these two families (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>; <xref ref-type="bibr" rid="B8">Carvajal-Arroyo et al., 2019</xref>; <xref ref-type="bibr" rid="B70">Walters et al., 2023</xref>). Three MAGs in the class <italic>Bacilli</italic> but not part of the <italic>Lactobacillaceae</italic> family as well as three MAGs in the phylum <italic>Proteobacteria</italic> were both categorized as being in this functional group (<xref ref-type="fig" rid="F9">Figure 9</xref>) and were found to be of high abundance in two Starch-EtOH experiments that were conducted at a higher temperature and did not result in accumulation of MCFA chain elongation products (<xref ref-type="fig" rid="F2">Figure 2</xref>; <xref ref-type="table" rid="T1">Table 1</xref>) (<xref ref-type="bibr" rid="B19">Fortney et al., 2021</xref>).</p>
<p>From a metabolic potential perspective, fermentation to intermediates can be accomplished as homolactic fermentation wherein only lactic acid is produced, or heterolactic fermentation, either by the phosphoketolase pathway or the bifid shunt pathway, wherein lactic acid and other products (ethanol or acetate) are produced (<xref ref-type="bibr" rid="B54">Pokusaeva et al., 2011</xref>; <xref ref-type="bibr" rid="B22">G&#xe4;nzle, 2015</xref>). The percentage of detected gene homologs that encode enzymes unique to each fermentative pathway can be used to evaluate which fermentative pathways may be present in each MAG (<xref ref-type="sec" rid="s10">Supplementary Figure S1A</xref>). In the majority of MAGs, greater than 60% of the unique proteins in the homolactic and the heterolactic bifid shunt pathways were detected, suggesting these are the primary sources of lactic acid across the microbial communities. This included the MAGs in the phylum <italic>Proteobacteria</italic> and the non-<italic>Lactobacillaceae</italic> MAGs in the class <italic>Bacilli</italic>, suggesting this is a key reason these MAGs from unexpected taxonomic groups were categorized into this functional group (<xref ref-type="sec" rid="s10">Supplementary Figure S1A</xref>). No MAGs contained more than 60% of the unique proteins in the heterolactic phosphoketolase fermentation pathway, with the majority containing less than 40% of the unique enzymes (<xref ref-type="sec" rid="s10">Supplementary Figure S1A</xref>), suggesting this is a not a key pathway in abundant members of the communities that are found when using these agroindustrial residues. Nearly all the MAGs in the family <italic>Bifidobacteriaceae</italic> have over 80% of the unique enzymes in the heterolactic bifid shunt fermentative pathway, which is to be expected for members of this family (<xref ref-type="sec" rid="s10">Supplementary Figure S1A</xref>) (<xref ref-type="bibr" rid="B54">Pokusaeva et al., 2011</xref>). Future research can explore the proposal that these MAGs that perform lactic acid fermentation and do so using the homolactic fermentation pathway or heterolactic bifid shunt fermentation pathway.</p>
</sec>
<sec id="s4-2">
<title>4.2 MAGs from several taxonomic groups are predicted to use intermediates for chain elongation</title>
<p>The Intermediate Chain Elongators functional group was comprised of MAGs from a variety of taxonomic classifications (<xref ref-type="fig" rid="F7">Figure 7</xref>). While nearly all the MAGs were part of the phyla <italic>Firmicutes_A</italic> or <italic>Firmicutes_C</italic>, the lower taxonomic levels were more differentiated (<xref ref-type="fig" rid="F7">Figures 7</xref>, <xref ref-type="fig" rid="F9">9</xref>), suggesting a variety of microorganisms capable of performing this transformation in these microbial communities. Several of these MAGs belonged to families included in the training set, supporting the functional classification&#x2014;<italic>Anaerovoracaceae, Clostridiaceae, Eubacteriaceae,</italic> and <italic>Megasphaeraceae</italic>&#x2014;and were the MAGs with the highest relative level of genomic abundance in the experimental microbial communities (<xref ref-type="fig" rid="F9">Figure 9</xref>). This suggests that these MAGs may play a key role in converting intermediates to MCFAs. Interestingly, the machine learning approach predicted MAGs from other families may also perform this biological function. These included MAGs from the phylum <italic>Bacteroidia</italic> and the families <italic>Acidaminococcaceae, Lachnospiraceae,</italic> and <italic>Oscillospiraceae</italic> (<xref ref-type="fig" rid="F7">Figure 7</xref>). A member of the family <italic>Oscillospiraceae</italic>, <italic>Caproicibacterium lactatifermentans</italic>, was shown to utilize lactic acid, a function unique from other members of this family (<xref ref-type="bibr" rid="B72">Wang et al., 2022</xref>), and the <italic>Oscillospiraceae</italic> MAG has homologs of the key proteins for conversion of lactic acid to MCFAs (<xref ref-type="sec" rid="s10">Supplementary Figure S1B</xref>). MAGs that belong to family <italic>Lachnospiraceae</italic> have been shown to convert carbohydrates directly to MCFAs (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>; <xref ref-type="bibr" rid="B60">Scarborough et al., 2020</xref>), but our analysis suggests they may also convert fermentation intermediates into these products. Indeed, UW_MP_LCO2_1 contains all three proteins key for conversion of lactic acid to MCFAs, supporting a possible alternative role of the MAG from this family (<xref ref-type="sec" rid="s10">Supplementary Figure S1B</xref>).</p>
<p>However, neither the <italic>Lachnospiraceae</italic> MAG nor the <italic>Oscillospiraceae</italic> MAG were highly abundant in any of the datasets analyzed (<xref ref-type="fig" rid="F9">Figure 9</xref>), suggesting they may not play a large role, even if they do generate MCFAs from intermediates. Interestingly, the <italic>Acidaminococcaceae</italic> and <italic>Bacteroidia</italic> MAGs have relatively high abundance in the Milk Permeate 1 experiment (<xref ref-type="fig" rid="F9">Figure 9</xref>), raising the possibility that the unique conditions of that experiment (<xref ref-type="bibr" rid="B70">Walters et al., 2023</xref>) may lead to the enrichment of these MAGs to convert fermentation intermediates to MCFAs. However, the two MAGs belonging to phylum <italic>Bacteroidota</italic> are the only two MAGs for which a majority of genes encoding for lactic acid utilization and reverse &#xdf;-oxidation were not detected (<xref ref-type="sec" rid="s10">Supplementary Figure S1B</xref>). This raises the possibility that these MAGs were misclassified, but their metabolic potential deserves future exploration since phylogenetically related organisms have recently been associated with SCFA production in microbial communities (<xref ref-type="bibr" rid="B12">Watanabe et al., 2021</xref>; <xref ref-type="bibr" rid="B31">Ho et al., 2021</xref>; <xref ref-type="bibr" rid="B49">Liu et al., 2022</xref>).</p>
</sec>
<sec id="s4-3">
<title>4.3 MAGs from various taxonomic groups are predicted to use carbohydrates for chain elongation</title>
<p>A majority of the MAGs classified in the Carbohydrate Chain Elongators group by the machine learning algorithm we used belong to the phylum <italic>Firmicutes</italic> and specifically five families: <italic>Lachnospiraceae, Acutalibacteraceae, Bacillaceae, Sporolactobacillaceae,</italic> and <italic>Clostridiaceae</italic> (<xref ref-type="fig" rid="F9">Figure 9</xref>)<italic>.</italic> Of these MAGs, <italic>Lachnospiraceae</italic> has been shown to produce MCFAs from carbohydrates in other microbial communities (<xref ref-type="bibr" rid="B58">Scarborough et al., 2018a</xref>; <xref ref-type="bibr" rid="B60">Scarborough et al., 2020</xref>). Indeed, the <italic>Lachnospiraceae</italic> MAGs are the most abundant across the largest number of reactor experiments, suggesting they are key players in MCFA synthesis from carbohydrate (<xref ref-type="fig" rid="F9">Figure 9</xref>). Interestingly, for two of these MAGs we were not able to identify homologs to three of the four enzymes involved in chain elongation (<xref ref-type="sec" rid="s10">Supplementary Figure S1C</xref>). While this may indicate mis-classification, it also raises the possibility that other enzymes may perform these processes in these organisms or that the enzymes have diverged enough in these MAGs so the homologs were below our thresholds. Additional research into these MAGs will be required to examine these hypotheses.</p>
<p>Most of the MAGs in this group contain homologs for the chain elongation genes, although many of them outside the <italic>Lachnospiraceae</italic> family also contain at least one homolog of the lactic acid utilization genes (<xref ref-type="sec" rid="s10">Supplementary Figure S1C</xref>). These results suggest that these MAGs may be able to convert both carbohydrates as well as lactic acid into MCFAs. This has been observed in other microbes including <italic>Caproicibacterium lactatifermentans</italic> (family <italic>Acutalibacteraceae</italic>) (<xref ref-type="bibr" rid="B72">Wang et al., 2022</xref>) and <italic>Megasphaera hexanoica</italic> (family <italic>Megasphaeraceae</italic>) (<xref ref-type="bibr" rid="B34">Jeon et al., 2017</xref>; <xref ref-type="bibr" rid="B36">Kang et al., 2022</xref>). Interestingly, MAGs within the same family (<italic>Acutalibacteraceae</italic>) differ in the presence of lactic acid utilization homologs (<xref ref-type="sec" rid="s10">Supplementary Figure S1C</xref>), suggesting this difference may be on the genus or species level. Recent results suggest members of this family can produce MCFAs from lactic acid (<xref ref-type="bibr" rid="B72">Wang et al., 2022</xref>) as well as carbohydrates (<xref ref-type="bibr" rid="B68">Van Nguyen et al., 2023</xref>). Further research into these MAGs and related isolated organisms will be valuable to evaluate this new hypothesis.</p>
<p>Of the two MAGs in the class <italic>Bacilli</italic> that are classified as Carbohydrate Chain Elongators, UW_MP_SPOR1_1 (family <italic>Sporolactobacillaceae</italic>) lacked homologs to the electron bifurcating acyl-CoA dehydrogenase and the acetyl-CoA C-acetyltransfase enzymes while UW_TS_BAC2_1 (family <italic>Bacillaceae</italic>) contained homologs for all examined enzymes (<xref ref-type="sec" rid="s10">Supplementary Figure S1C</xref>). Members of the family <italic>Sporolactobacillaceae</italic> are known to produce lactic acid (<xref ref-type="bibr" rid="B10">Chang et al., 2008</xref>; <xref ref-type="bibr" rid="B67">Tolieng et al., 2017</xref>), so our findings raise the possibility that some members of class <italic>Bacilli</italic> may be able to produce MCFAs as well. Similarly, the MAG in the family <italic>Clostridiaceae</italic> contained homologs for all enzymes examined, including the lactic acid utilization proteins, suggesting that this MAG may produce MCFAs from lactic acid as well as carbohydrates. Members of the phyla <italic>Spirochaetota</italic> and <italic>Proteobacteria</italic> are not known to perform chain elongation, but the MAGs contain at least some of the genes encoding enzymes important for chain elongation, raising the possibility of an expanded functional role of MAGs from these taxonomic groups (<xref ref-type="sec" rid="s10">Supplementary Figure S1C</xref>). Taken together, the results from the machine learning analysis both support previous research and suggest potential new groups of organisms that may be able to perform the specific biological function.</p>
</sec>
<sec id="s4-4">
<title>4.4 Phylogenetic analysis of EtfB homologs can differentiate between lactic acid utilization and chain elongation</title>
<p>The electron flavoprotein (EtfAB) can form a complex with both electron confurcating lactate dehydrogenase (ecLDH, involved in lactic acid utilization) and acyl-CoA dehydrogenase (ACD, involved in chain elongation) (<xref ref-type="bibr" rid="B23">Garcia Costas et al., 2017</xref>; <xref ref-type="bibr" rid="B14">Detman et al., 2019</xref>) and phylogenetic analysis of the beta subunit (EtfB) can be used to differentiate between the ability to use lactic acid and to perform chain elongation (<xref ref-type="bibr" rid="B70">Walters et al., 2023</xref>). This analysis suggests that three MAGs in the Intermediate Chain Elongators group contain multiple copies of EtfB, one associated with ecLDH and one associated with ACD (<xref ref-type="fig" rid="F10">Figure 10</xref>; <xref ref-type="sec" rid="s10">Supplementary Figure S2</xref>), supporting the functional classification that these MAGs use lactic acid to perform chain elongation. Three MAGs in the Carbohydrate Chain Elongators group contain a single copy of EtfB associated with ACD (<xref ref-type="fig" rid="F10">Figure 10</xref>; <xref ref-type="sec" rid="s10">Supplementary Figure S2</xref>), supporting the classification that these MAGs can produce MCFAs but not utilize lactic acid. However, a majority of the MAGs in both functional groups contain EtfB homologs for which the phylogenetic analysis cannot predict a metabolic function. Additional research into the metabolism of microorganisms represented by these MAGs will be required to elucidate the function of these EtfB homologs.</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Association of EtfB homologs with lactic acid utilization, chain elongation, or other functions. Summary of the phylogenetic analysis (<xref ref-type="sec" rid="s10">Supplementary Figure S2</xref>) examining EtfB homologs in the MAGs from the Intermediate Chain Elongators group <bold>(A)</bold> and the Carbohydrate Chain Elongators group <bold>(B)</bold>. MAGs with an EtfB homolog that the phylogenetic analysis suggests is associated with lactic acid utilization have a blue box in the first column while MAGs with an EtfB homolog that the phylogenetic analysis suggests is associated with chain elongation have a blue box in the second column. A blue box in the Other column indicates that a MAG has an EtfB homolog for which the phylogenetic analysis cannot indicate a clear function.</p>
</caption>
<graphic xlink:href="fbioe-11-1197175-g010.tif"/>
</fig>
</sec>
<sec id="s4-5">
<title>4.5 Additional data needed to better understand and predict operation of these microbial communities</title>
<p>All of the analyses in this study were performed using metagenomic data for the MAGs across the 10 experiments. Importantly, metagenomics data can inform what genes are present in a microbial community, and thus we can use this presence to classify MAGs using machine learning. However, presence of a gene does not indicate how much that gene is expressed and thus how important the protein is to the microbial community. Previous work has shown a dramatic disconnect in MAG abundance when calculated using metagenomics (DNA) data or metatranscriptomics (RNA) data (<xref ref-type="bibr" rid="B35">Jewell et al., 2016</xref>; <xref ref-type="bibr" rid="B46">Lawson et al., 2017</xref>; <xref ref-type="bibr" rid="B3">Beach et al., 2021</xref>; <xref ref-type="bibr" rid="B12">Watanabe et al., 2021</xref>). The addition of metatranscriptomics to study this ecological microbial model would not only indicate the expression level of the genes in each MAG, but would also provide more information about the functional abundance of each MAG within each functional group.</p>
<p>For the machine learning analysis, we selected isolated bacteria that had been shown to perform the biological function for each group. This meant we were limited in how many organisms were available to use to build our training set. One key example is the lack of isolated organisms shown to convert ethanol to MCFAs. The only isolated organism we were able to find supported evidence for this biological process was the well-studied species <italic>Clostridium kluyveri</italic> (<xref ref-type="bibr" rid="B63">Seedorf et al., 2008</xref>; <xref ref-type="bibr" rid="B29">Han et al., 2018</xref>). Due to the limited available genomes that represent isolated organisms known to produce MCFA from ethanol by chain elongation, we did not attempt to predict this as a separate functional group. As more bacteria are isolated and studied for this biological process, it is likely the machine learning model can be updated to distinguish between MAGs that using ethanol and those that use lactic acid to produce MCFAs, adding more value to this type of classification procedure.</p>
<p>This study suggests that the ecological microbial model of different functional groups (Ferment to Intermediates, Intermediate Chain Elongators, and Carbohydrate Chain Elongators) is common among microbial communities enriched in carbohydrate-rich agroindustrial residues seeded with anaerobic digester sludge from the wastewater treatment plant. Examination of a microbial community enriched in food waste, a carbohydrate-rich liquid medium, and an inoculum of anaerobic digester sludge from a wastewater treatment plant suggested a similar ecological model (<xref ref-type="bibr" rid="B13">Crognale et al., 2021</xref>). A key question that remains is how widespread this ecological model is when applied to other microbial communities, especially in terms of different inocula and feedstock used. Additional research into the composition and genomic make up of other microbial communities would be fascinating and reveal how universal this model is among microbial communities performing chain elongation to produce MCFAs.</p>
</sec>
<sec id="s4-6">
<title>4.6 Concluding remarks</title>
<p>Examining the 240 MAGs across 10 experiments provided us an opportunity to develop new tools to better understand the microbial communities present across the bioreactors. Specifically, the large data set enabled the use of multiclass classification machine learning to categorize the MAGs into distinct functional groups in an unbiased manner. These tools can be adapted to evaluate other microbial ecology models by changing or expanding the functional groups included in the models. Thus, this analysis not only further explained the core functional groups for MCFA production in carbohydrate rich agroindustrial residues but also demonstrated a new way to quickly examine and explore microbial communities. Such knowledge will help generate hypotheses about microbial community members that could be experimentally tested, helping in the development of better strategies to manage microbiomes to produce desired products, as well as to better characterize microbial functions in a wide variety of microbiomes.</p>
</sec>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, PRJNA768492, <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, PRJNA418244, <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, PRJNA535528, <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, PRJNA518398, <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, PRJNA518399, <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, PRJNA518400.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>AI, KW, NF, MS, TD, and DN designed the bioreactor experiments. AI, KW, NF, and MS performed the bioreactor experiments. KM and AI performed all computational analyses. KM, TD, and DN wrote the manuscript. All authors listed have made a substantial, direct, and intellectual contribution to the work and approved it for publication.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This material is based upon work supported by the Great Lakes Bioenergy Research Center, U.S. Department of Energy, Office of Science, Office of Biological and Environmental Research under Award Number DE-SC0018409, the National Dairy Council under project MSN214606 (AAG8952 and AAK8347), and the National Science Foundation under project CBET-1803055.</p>
</sec>
<ack>
<p>We thank members of the TD and DN labs for helpful discussion in preparation of this manuscript.</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fbioe.2023.1197175/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fbioe.2023.1197175/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table2.XLSX" id="SM1" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table3.XLSX" id="SM2" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image1.eps" id="SM3" mimetype="application/eps" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table6.XLSX" id="SM4" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table4.XLSX" id="SM5" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table1.XLSX" id="SM6" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table5.XLSX" id="SM7" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image2.eps" id="SM8" mimetype="application/eps" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.docx" id="SM9" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Agler</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Spirito</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Usack</surname>
<given-names>J. G.</given-names>
</name>
<name>
<surname>Werner</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Angenent</surname>
<given-names>L. T.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Chain elongation with reactor microbiomes: Upgrading dilute ethanol to medium-chain carboxylates</article-title>. <source>Energy &#x26; Environ. Sci.</source> <volume>5</volume> (<issue>8</issue>), <fpage>8189</fpage>. <pub-id pub-id-type="doi">10.1039/c2ee22101b</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Anderson</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>2017</year>). <source>Wiley StatsRef: Statistics reference online</source>. <publisher-loc>New Jersey, United States</publisher-loc>: <publisher-name>Wiley</publisher-name>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>.</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beach</surname>
<given-names>N. K.</given-names>
</name>
<name>
<surname>Myers</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>Owen</surname>
<given-names>B. R.</given-names>
</name>
<name>
<surname>Seib</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Noguera</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Exploring the meta-regulon of the CRP/FNR family of global transcriptional regulators in a partial-nitritation anammox microbiome</article-title>. <source>mSystems</source> <volume>6</volume> (<issue>5</issue>), <fpage>e0090621</fpage>. <pub-id pub-id-type="doi">10.1128/msystems.00906-21</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Benjamini</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hochberg</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Controlling the false discovery rate: A practical and powerful approach to multiple testing</article-title>. <source>J. R. Stat. Soc. Ser. B Methodol.</source> <volume>57</volume> (<issue>1</issue>), <fpage>289</fpage>&#x2013;<lpage>300</lpage>. <pub-id pub-id-type="doi">10.1111/j.2517-6161.1995.tb02031.x</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Bian</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Tao</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2011</year>). in <source>Learning a distance metric by empirical loss minimization</source>. Editor <person-group person-group-type="editor">
<name>
<surname>Walsh</surname>
<given-names>T.</given-names>
</name>
</person-group> (<publisher-loc>Barcelona, Catalonia, Spain</publisher-loc>: <publisher-name>AAAI Press</publisher-name>), <fpage>1186</fpage>&#x2013;<lpage>1191</lpage>.</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boutet</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Lieberherr</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Tognolli</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Schneider</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bansal</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Bridge</surname>
<given-names>A. J.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>UniProtKB/Swiss-Prot, the manually annotated section of the UniProt KnowledgeBase: How to use the entry view</article-title>. <source>Methods Mol. Biol.</source> <volume>1374</volume>, <fpage>23</fpage>&#x2013;<lpage>54</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-4939-3167-5_2</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Camacho</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Coulouris</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Avagyan</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Papadopoulos</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bealer</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>BLAST&#x2b;: Architecture and applications</article-title>. <source>BMC Bioinforma.</source> <volume>10</volume> (<issue>1</issue>), <fpage>421</fpage>&#x2013;<lpage>429</lpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-10-421</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carvajal-Arroyo</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Candry</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Andersen</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Props</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Seviour</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ganigu&#xe9;</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Granular fermentation enables high rate caproic acid production from solid-free thin stillage</article-title>. <source>Green Chem.</source> <volume>21</volume> (<issue>6</issue>), <fpage>1330</fpage>&#x2013;<lpage>1339</lpage>. <pub-id pub-id-type="doi">10.1039/c8gc03648a</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Caspi</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Billington</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Keseler</surname>
<given-names>I. M.</given-names>
</name>
<name>
<surname>Kothari</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Krummenacker</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Midford</surname>
<given-names>P. E.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>The MetaCyc database of metabolic pathways and enzymes - a 2019 update</article-title>. <source>Nucleic Acids Res.</source> <volume>48</volume>, <fpage>D445</fpage>&#x2013;<lpage>D453</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz862</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chang</surname>
<given-names>Y. H.</given-names>
</name>
<name>
<surname>Jung</surname>
<given-names>M. Y.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>I. S.</given-names>
</name>
<name>
<surname>Oh</surname>
<given-names>H. M.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>
<italic>Sporolactobacillus vineae</italic> sp. nov., a spore-forming lactic acid bacterium isolated from vineyard soil</article-title>. <source>Int. J. Syst. Evol. Microbiol.</source> <volume>58</volume>, <fpage>2316</fpage>&#x2013;<lpage>2320</lpage>. <pub-id pub-id-type="doi">10.1099/ijs.0.65608-0</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chaumeil</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Mussig</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Hugenholtz</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Parks</surname>
<given-names>D. H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>GTDB-tk: A toolkit to classify genomes with the genome taxonomy database</article-title>. <source>Bioinformatics</source> <volume>36</volume> (<issue>6</issue>), <fpage>1925</fpage>&#x2013;<lpage>1927</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz848</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Crognale</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Braguglia</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Gallipoli</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gianico</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Rossetti</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Montecchio</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Direct conversion of food waste extract into caproate: Metagenomics assessment of chain elongation process</article-title>. <source>Microorganisms</source> <volume>9</volume> (<issue>2</issue>), <fpage>327</fpage>. <pub-id pub-id-type="doi">10.3390/microorganisms9020327</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Detman</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mielecki</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chojnacka</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Salamon</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Blaszczyk</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Sikora</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Cell factories converting lactate and acetate to butyrate: <italic>Clostridium butyricum</italic> and microbial communities from dark fermentation bioreactors</article-title>. <source>Microb. Cell Fact.</source> <volume>18</volume> (<issue>1</issue>), <fpage>36</fpage>. <pub-id pub-id-type="doi">10.1186/s12934-019-1085-1</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eckel</surname>
<given-names>V. P. L.</given-names>
</name>
<name>
<surname>Vogel</surname>
<given-names>R. F.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Genomic and physiological insights into the lifestyle of <italic>Bifidobacterium</italic> species from water kefir</article-title>. <source>Arch. Microbiol.</source> <volume>202</volume> (<issue>7</issue>), <fpage>1627</fpage>&#x2013;<lpage>1637</lpage>. <pub-id pub-id-type="doi">10.1007/s00203-020-01870-7</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ferrero</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Tabacco</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Borreani</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>
<italic>Lentilactobacillus hilgardii</italic> inoculum, dry matter contents at harvest and length of conservation affect fermentation characteristics and aerobic stability of corn silage</article-title>. <source>Front. Microbiol.</source> <volume>12</volume>, <fpage>675563</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2021.675563</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fitzgerald</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Camejo</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Oshlag</surname>
<given-names>J. Z.</given-names>
</name>
<name>
<surname>Noguera</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Ammonia-oxidizing microbial communities in reactors with efficient nitrification at low-dissolved oxygen</article-title>. <source>Water Res.</source> <volume>70</volume>, <fpage>38</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1016/j.watres.2014.11.041</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Flaiz</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Baur</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Brahner</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Poehlein</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Daniel</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bengelsdorf</surname>
<given-names>F. R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>
<italic>Caproicibacter fermentans</italic> gen. nov., sp. nov., a new caproate-producing bacterium and emended description of the genus <italic>Caproiciproducens</italic>
</article-title>. <source>Int. J. Syst. Evol. Microbiol.</source> <volume>70</volume> (<issue>7</issue>), <fpage>4269</fpage>&#x2013;<lpage>4279</lpage>. <pub-id pub-id-type="doi">10.1099/ijsem.0.004283</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fortney</surname>
<given-names>N. W.</given-names>
</name>
<name>
<surname>Hanson</surname>
<given-names>N. J.</given-names>
</name>
<name>
<surname>Rosa</surname>
<given-names>P. R. F.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Noguera</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Diverse profile of fermentation byproducts from thin stillage</article-title>. <source>Front. Bioeng. Biotechnol.</source> <volume>9</volume>, <fpage>695306</fpage>. <pub-id pub-id-type="doi">10.3389/fbioe.2021.695306</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fortney</surname>
<given-names>N. W.</given-names>
</name>
<name>
<surname>Myers</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>Ingle</surname>
<given-names>A. T.</given-names>
</name>
<name>
<surname>Walters</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Scarborough</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Metagenomes and metagenome-assembled genomes from microbiomes metabolizing thin stillage from an ethanol biorefinery</article-title>. <source>Microbiol. Resour. Announc</source> <volume>11</volume> (<issue>8</issue>), <fpage>e0029022</fpage>. <pub-id pub-id-type="doi">10.1128/mra.00290-22</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ganzle</surname>
<given-names>M. G.</given-names>
</name>
<name>
<surname>Follador</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Metabolism of oligosaccharides and starch in lactobacilli: A review</article-title>. <source>Front. Microbiol.</source> <volume>3</volume>, <fpage>340</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2012.00340</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>G&#xe4;nzle</surname>
<given-names>M. G.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Lactic metabolism revisited: Metabolism of lactic acid bacteria in food fermentations and food spoilage</article-title>. <source>Curr. Opin. Food Sci.</source> <volume>2</volume>, <fpage>106</fpage>&#x2013;<lpage>117</lpage>. <pub-id pub-id-type="doi">10.1016/j.cofs.2015.03.001</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garcia Costas</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Poudel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Miller</surname>
<given-names>A. F.</given-names>
</name>
<name>
<surname>Schut</surname>
<given-names>G. J.</given-names>
</name>
<name>
<surname>Ledbetter</surname>
<given-names>R. N.</given-names>
</name>
<name>
<surname>Fixen</surname>
<given-names>K. R.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Defining electron bifurcation in the electron-transferring flavoprotein family</article-title>. <source>J. Bacteriol.</source> <volume>199</volume> (<issue>21</issue>), <fpage>004400</fpage>&#x2013;<lpage>e517</lpage>. <pub-id pub-id-type="doi">10.1128/jb.00440-17</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garde</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Jonsson</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Ahring</surname>
<given-names>B. K.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Lactic acid production from wheat straw hemicellulose hydrolysate by <italic>Lactobacillus pentosus</italic> and <italic>Lactobacillus brevis</italic>
</article-title>. <source>Bioresour. Technol.</source> <volume>81</volume> (<issue>3</issue>), <fpage>217</fpage>&#x2013;<lpage>223</lpage>. <pub-id pub-id-type="doi">10.1016/s0960-8524(01)00135-3</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ge</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Usack</surname>
<given-names>J. G.</given-names>
</name>
<name>
<surname>Spirito</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Angenent</surname>
<given-names>L. T.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Long-term n-caproic acid production from yeast-fermentation beer in an anaerobic bioreactor with continuous product extraction</article-title>. <source>Environ. Sci. Technol.</source> <volume>49</volume> (<issue>13</issue>), <fpage>8012</fpage>&#x2013;<lpage>8021</lpage>. <pub-id pub-id-type="doi">10.1021/acs.est.5b00238</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grootscholten</surname>
<given-names>T. I. M.</given-names>
</name>
<name>
<surname>Kinsky Dal Borgo</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Hamelers</surname>
<given-names>H. V. M.</given-names>
</name>
<name>
<surname>Buisman</surname>
<given-names>C. J. N.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Promoting chain elongation in mixed culture acidification reactors by addition of ethanol</article-title>. <source>Biomass Bioenergy</source> <volume>48</volume>, <fpage>10</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1016/j.biombioe.2012.11.019</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grootscholten</surname>
<given-names>T. I. M.</given-names>
</name>
<name>
<surname>Strik</surname>
<given-names>D. P. B. T. B.</given-names>
</name>
<name>
<surname>Steinbusch</surname>
<given-names>K. J. J.</given-names>
</name>
<name>
<surname>Buisman</surname>
<given-names>C. J. N.</given-names>
</name>
<name>
<surname>Hamelers</surname>
<given-names>H. V. M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Two-stage medium chain fatty acid (MCFA) production from municipal solid waste and ethanol</article-title>. <source>Appl. Energy</source> <volume>116</volume>, <fpage>223</fpage>&#x2013;<lpage>229</lpage>. <pub-id pub-id-type="doi">10.1016/j.apenergy.2013.11.061</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Haibo</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Garcia</surname>
<given-names>E. A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Learning from imbalanced data</article-title>. <source>IEEE Trans. Knowl. Data Eng.</source> <volume>21</volume> (<issue>9</issue>), <fpage>1263</fpage>&#x2013;<lpage>1284</lpage>. <pub-id pub-id-type="doi">10.1109/tkde.2008.239</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Shao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Metabolic interactions of a chain elongation microbiome</article-title>. <source>Appl. Environ. Microbiol.</source> <volume>84</volume> (<issue>22</issue>), <fpage>e01614</fpage>&#x2013;<lpage>e01618</lpage>. <pub-id pub-id-type="doi">10.1128/aem.01614-18</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Harmsen</surname>
<given-names>P. F. H.</given-names>
</name>
<name>
<surname>Hackmann</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Bos</surname>
<given-names>H. L.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Green building blocks for bio-based plastics</article-title>. <source>Biofuels, Bioprod. Biorefining</source> <volume>8</volume> (<issue>3</issue>), <fpage>306</fpage>&#x2013;<lpage>324</lpage>. <pub-id pub-id-type="doi">10.1002/bbb.1468</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ho</surname>
<given-names>H. E.</given-names>
</name>
<name>
<surname>Chun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jeong</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jumreornvong</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Sicherer</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Bunyavanich</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Multidimensional study of the oral microbiome, metabolite, and immunologic environment in peanut allergy</article-title>. <source>J. Allergy Clin. Immunol.</source> <volume>148</volume> (<issue>2</issue>), <fpage>627</fpage>&#x2013;<lpage>632.e3</lpage>. <pub-id pub-id-type="doi">10.1016/j.jaci.2021.03.028</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ingle</surname>
<given-names>A. T.</given-names>
</name>
<name>
<surname>Fortney</surname>
<given-names>N. W.</given-names>
</name>
<name>
<surname>Myers</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>Walters</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Scarborough</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Metagenome-assembled genomes from a microbiome grown in dairy manure hydrolysate</article-title>. <source>Microbiol. Resour. Announc</source> <volume>11</volume> (<issue>8</issue>), <fpage>e0029222</fpage>. <pub-id pub-id-type="doi">10.1128/mra.00292-22</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ingle</surname>
<given-names>A. T.</given-names>
</name>
<name>
<surname>Fortney</surname>
<given-names>N. W.</given-names>
</name>
<name>
<surname>Walters</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Noguera</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Mixed acid fermentation of carbohydrate-rich dairy manure hydrolysate</article-title>. <source>Front. Bioeng. Biotechnol.</source> <volume>9</volume>, <fpage>724304</fpage>. <pub-id pub-id-type="doi">10.3389/fbioe.2021.724304</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jeon</surname>
<given-names>B. S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sang</surname>
<given-names>B. I.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>
<italic>Megasphaera hexanoica</italic> sp. nov., a medium-chain carboxylic acid-producing bacterium isolated from a cow rumen</article-title>. <source>Int. J. Syst. Evol. Microbiol.</source> <volume>67</volume> (<issue>7</issue>), <fpage>2114</fpage>&#x2013;<lpage>2120</lpage>. <pub-id pub-id-type="doi">10.1099/ijsem.0.001888</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jewell</surname>
<given-names>T. N.</given-names>
</name>
<name>
<surname>Karaoz</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Brodie</surname>
<given-names>E. L.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>K. H.</given-names>
</name>
<name>
<surname>Beller</surname>
<given-names>H. R.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Metatranscriptomic evidence of pervasive and diverse chemolithoautotrophy relevant to C, S, N and Fe cycling in a shallow alluvial aquifer</article-title>. <source>ISME J.</source> <volume>10</volume> (<issue>9</issue>), <fpage>2106</fpage>&#x2013;<lpage>2117</lpage>. <pub-id pub-id-type="doi">10.1038/ismej.2016.25</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jeon</surname>
<given-names>B. S.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Sang</surname>
<given-names>B. I.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Chain elongation process for caproate production using lactate as electron donor in <italic>Megasphaera hexanoica</italic>
</article-title>. <source>Bioresour. Technol.</source> <volume>346</volume>, <fpage>126660</fpage>. <pub-id pub-id-type="doi">10.1016/j.biortech.2021.126660</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kasmaei</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Kalyani</surname>
<given-names>D. C.</given-names>
</name>
<name>
<surname>Reichenbach</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Jimenez-Quero</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Vilaplana</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Divne</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Crystal structure of the feruloyl esterase from <italic>Lentilactobacillus buchneri</italic> reveals a novel homodimeric state</article-title>. <source>Front. Microbiol.</source> <volume>13</volume>, <fpage>1050160</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2022.1050160</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Keseler</surname>
<given-names>I. M.</given-names>
</name>
<name>
<surname>Collado-Vides</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Santos-Zavaleta</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Peralta-Gil</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gama-Castro</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Muniz-Rascado</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>EcoCyc: A comprehensive database of <italic>Escherichia coli</italic> biology</article-title>. <source>Nucleic Acids Res.</source> <volume>39</volume>, <fpage>D583</fpage>&#x2013;<lpage>D590</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkq1143</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>B. C.</given-names>
</name>
<name>
<surname>Seung Jeon</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Um</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sang</surname>
<given-names>B. I.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>
<italic>Caproiciproducens galactitolivorans</italic> gen. nov., sp. nov., a bacterium capable of producing caproic acid from galactitol, isolated from a wastewater treatment plant</article-title>. <source>Int. J. Syst. Evol. Microbiol.</source> <volume>65</volume> (<issue>12</issue>), <fpage>4902</fpage>&#x2013;<lpage>4908</lpage>. <pub-id pub-id-type="doi">10.1099/ijsem.0.000665</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kobayashi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Nakasato</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sakamoto</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ohtani</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Terada</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Sakai</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>
<italic>Clostridium pabulibutyricum</italic> sp. nov., a butyric-acid-producing organism isolated from high-moisture grass silage</article-title>. <source>Int. J. Syst. Evol. Microbiol.</source> <volume>67</volume> (<issue>12</issue>), <fpage>4974</fpage>&#x2013;<lpage>4978</lpage>. <pub-id pub-id-type="doi">10.1099/ijsem.0.002387</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kozlov</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Darriba</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Flouri</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Morel</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Stamatakis</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>RAxML-NG: A fast, scalable and user-friendly tool for maximum likelihood phylogenetic inference</article-title>. <source>Bioinformatics</source> <volume>35</volume> (<issue>21</issue>), <fpage>4453</fpage>&#x2013;<lpage>4455</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz305</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ksiezarek</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Grosso</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ribeiro</surname>
<given-names>T. G.</given-names>
</name>
<name>
<surname>Peixe</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Genomic diversity of genus <italic>Limosilactobacillus</italic>
</article-title>. <source>Microb. Genom</source> <volume>8</volume> (<issue>7</issue>), <fpage>mgen000847</fpage>. <pub-id pub-id-type="doi">10.1099/mgen.0.000847</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kucek</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>Spirito</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Angenent</surname>
<given-names>L. T.</given-names>
</name>
</person-group> (<year>2016a</year>). <article-title>High n-caprylate productivities and specificities from dilute ethanol and acetate: Chain elongation with microbiomes to upgrade products from syngas fermentation</article-title>. <source>Energy &#x26; Environ. Sci.</source> <volume>9</volume> (<issue>11</issue>), <fpage>3482</fpage>&#x2013;<lpage>3494</lpage>. <pub-id pub-id-type="doi">10.1039/c6ee01487a</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kucek</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Nguyen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Angenent</surname>
<given-names>L. T.</given-names>
</name>
</person-group> (<year>2016b</year>). <article-title>Waste conversion into n-caprylate and n-caproate: Resource recovery from wine lees using anaerobic reactor microbiomes and in-line extraction</article-title>. <source>Front. Microbiol.</source> <volume>7</volume>, <fpage>1892</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2016.01892</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Langmead</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Salzberg</surname>
<given-names>S. L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Fast gapped-read alignment with Bowtie 2</article-title>. <source>Nat. Methods</source> <volume>9</volume> (<issue>4</issue>), <fpage>357</fpage>&#x2013;<lpage>359</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.1923</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lawson</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bhattacharjee</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Hamilton</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Mcmahon</surname>
<given-names>K. D.</given-names>
</name>
<name>
<surname>Goel</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Metabolic network analysis reveals microbial community interactions in anammox granules</article-title>. <source>Nat. Commun.</source> <volume>8</volume> (<issue>1</issue>), <fpage>15416</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms15416</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Handsaker</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wysoker</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fennell</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ruan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Homer</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>The sequence alignment/map format and SAMtools</article-title>. <source>Bioinformatics</source>, <volume>25</volume>(<issue>16</issue>): <fpage>2078</fpage>&#x2013;<lpage>2079</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Litty</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Muller</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Butyrate production in the acetogen <italic>Eubacterium limosum</italic> is dependent on the carbon and energy source</article-title>. <source>Microb. Biotechnol.</source> <volume>14</volume> (<issue>6</issue>), <fpage>2686</fpage>&#x2013;<lpage>2692</lpage>. <pub-id pub-id-type="doi">10.1111/1751-7915.13779</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bai</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Kohn</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Tadesse</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Sarria</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Rumen microbial predictors for short-chain fatty acid levels and the grass-fed regimen in angus cattle</article-title>. <source>Anim. (Basel)</source> <volume>12</volume> (<issue>21</issue>), <fpage>2995</fpage>. <pub-id pub-id-type="doi">10.3390/ani12212995</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Okada</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Suzuki</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kozaki</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>1979</year>). <article-title>A new heterofermentative lactobacillus species with meso-diaminopimelic acid in peptidoglycan, <italic>Lactobacillus vaccinostercus</italic> kozaki and okada sp. Nov</article-title>. <source>J. General Appl. Microbiol.</source> <volume>25</volume> (<issue>4</issue>), <fpage>215</fpage>&#x2013;<lpage>221</lpage>. <pub-id pub-id-type="doi">10.2323/jgam.25.215</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Olm</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>C. T.</given-names>
</name>
<name>
<surname>Brooks</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Banfield</surname>
<given-names>J. F.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>dRep: a tool for fast and accurate genomic comparisons that enables improved genome recovery from metagenomes through de-replication</article-title>. <source>ISME J.</source> <volume>11</volume> (<issue>12</issue>), <fpage>2864</fpage>&#x2013;<lpage>2868</lpage>. <pub-id pub-id-type="doi">10.1038/ismej.2017.126</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parks</surname>
<given-names>D. H.</given-names>
</name>
<name>
<surname>Imelfort</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Skennerton</surname>
<given-names>C. T.</given-names>
</name>
<name>
<surname>Hugenholtz</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Tyson</surname>
<given-names>G. W.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>CheckM: Assessing the quality of microbial genomes recovered from isolates, single cells, and metagenomes</article-title>. <source>Genome Res.</source> <volume>25</volume> (<issue>7</issue>), <fpage>1043</fpage>&#x2013;<lpage>1055</lpage>. <pub-id pub-id-type="doi">10.1101/gr.186072.114</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pedregosa</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Varoquaux</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Gramfort</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Michel</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Thirion</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Grisel</surname>
<given-names>O.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Scikit-learn: Machine learning in Python</article-title>. <source>J. Mach. Learn. Res.</source> <volume>12</volume> (<issue>85</issue>), <fpage>2825</fpage>&#x2013;<lpage>2830</lpage>.</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pokusaeva</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Fitzgerald</surname>
<given-names>G. F.</given-names>
</name>
<name>
<surname>Van Sinderen</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Carbohydrate metabolism in <italic>bifidobacteria</italic>
</article-title>. <source>Genes Nutr.</source> <volume>6</volume> (<issue>3</issue>), <fpage>285</fpage>&#x2013;<lpage>306</lpage>. <pub-id pub-id-type="doi">10.1007/s12263-010-0206-6</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Prokhorenkova</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gusev</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Vorobev</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Dorogush</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Gulin</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). in <source>CatBoost: Unbiased boosting with categorical features</source>. Editors <person-group person-group-type="editor">
<name>
<surname>Bengio</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wallach</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Larochelle</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Grauman</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Cesa-Bianchi</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Garnett.</surname>
<given-names>R.</given-names>
</name>
</person-group>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pruckler</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lorenz</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Endo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kraler</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Durrschmid</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Hendriks</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Comparison of homo- and heterofermentative lactic acid bacteria for implementation of fermented wheat bran in bread</article-title>. <source>Food Microbiol.</source> <volume>49</volume>, <fpage>211</fpage>&#x2013;<lpage>219</lpage>. <pub-id pub-id-type="doi">10.1016/j.fm.2015.02.014</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sarria</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kruyer</surname>
<given-names>N. S.</given-names>
</name>
<name>
<surname>Peralta-Yahya</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Microbial synthesis of medium-chain chemicals from renewables</article-title>. <source>Nat. Biotechnol.</source> <volume>35</volume> (<issue>12</issue>), <fpage>1158</fpage>&#x2013;<lpage>1166</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.4022</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scarborough</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Lawson</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Hamilton</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Noguera</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2018a</year>). <article-title>Metatranscriptomic and thermodynamic insights into medium-chain fatty acid production using an anaerobic microbiome</article-title>. <source>mSystems</source> <volume>3</volume> (<issue>6</issue>), <fpage>002211</fpage>&#x2013;<lpage>e318</lpage>. <pub-id pub-id-type="doi">10.1128/msystems.00221-18</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scarborough</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Lynch</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Dickson</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mcgee</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Noguera</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2018b</year>). <article-title>Increasing the economic value of lignocellulosic stillage through medium-chain fatty acid production</article-title>. <source>Biotechnol. Biofuels</source> <volume>11</volume>, <fpage>200</fpage>. <pub-id pub-id-type="doi">10.1186/s13068-018-1193-x</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scarborough</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Myers</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Noguera</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Medium-chain fatty acid synthesis by "<italic>candidatus</italic> weimeria bifida" gen. Nov., sp. nov., and "<italic>candidatus</italic> pseudoramibacter fermentans" sp. nov</article-title>. <source>Appl. Environ. Microbiol.</source> <volume>86</volume> (<issue>3</issue>), <fpage>022422</fpage>&#x2013;<lpage>e2319</lpage>. <pub-id pub-id-type="doi">10.1128/aem.02242-19</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scarborough</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Myers</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>Fortney</surname>
<given-names>N. W.</given-names>
</name>
<name>
<surname>Ingle</surname>
<given-names>A. T.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Noguera</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Metagenome-assembled genomes from a microbiome converting xylose to medium-chain carboxylic acids</article-title>. <source>Microbiol. Resour. Announc</source> <volume>11</volume> (<issue>4</issue>), <fpage>e0115121</fpage>. <pub-id pub-id-type="doi">10.1128/mra.01151-21</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schoelmerich</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Katsyv</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Donig</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hackmann</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Muller</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Energy conservation involving 2 respiratory circuits</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>117</volume> (<issue>2</issue>), <fpage>1167</fpage>&#x2013;<lpage>1173</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1914939117</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seedorf</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fricke</surname>
<given-names>W. F.</given-names>
</name>
<name>
<surname>Veith</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Bruggemann</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liesegang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Strittmatter</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2008</year>). <article-title>The genome of <italic>Clostridium kluyveri</italic>, a strict anaerobe with unique metabolic features</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>105</volume> (<issue>6</issue>), <fpage>2128</fpage>&#x2013;<lpage>2133</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0711093105</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tamanai-Shacoori</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Smida</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Bousarghin</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Loreal</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Meuric</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Fong</surname>
<given-names>S. B.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>
<italic>Roseburia</italic> spp.: A marker of health?</article-title> <source>Future Microbiol.</source> <volume>12</volume> (<issue>2</issue>), <fpage>157</fpage>&#x2013;<lpage>170</lpage>. <pub-id pub-id-type="doi">10.2217/fmb-2016-0130</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tanner</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Chassard</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Rigozzi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Lacroix</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Stevens</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>
<italic>Bifidobacterium thermophilum</italic> RBL67 impacts on growth and virulence gene expression of <italic>Salmonella enterica</italic> subsp. enterica serovar Typhimurium</article-title>. <source>BMC Microbiol.</source> <volume>16</volume>, <fpage>46</fpage>. <pub-id pub-id-type="doi">10.1186/s12866-016-0659-x</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Complete genome sequence of <italic>Ruminococcaceae bacterium</italic> CPB6: A newly isolated culture for efficient n-caproic acid production from lactate</article-title>. <source>J. Biotechnol.</source> <volume>259</volume>, <fpage>91</fpage>&#x2013;<lpage>94</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbiotec.2017.07.036</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tolieng</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Prasirtsak</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Miyashita</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Shibata</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Tanaka</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Thongchul</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>
<italic>Sporolactobacillus shoreicorticis</italic> sp.nov., a lactic acid-producing bacterium isolated from tree bark</article-title>. <source>Int. J. Syst. Evol. Microbiol.</source> <volume>67</volume> (<issue>7</issue>), <fpage>2363</fpage>&#x2013;<lpage>2369</lpage>. <pub-id pub-id-type="doi">10.1099/ijsem.0.001959</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Nguyen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Viver</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Mortier</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Smets</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Bernaerts</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Isolation and characterization of a thermophilic chain elongating bacterium that produces the high commodity chemical n-caproate from polymeric carbohydrates</article-title>. <source>Bioresour. Technol.</source> <volume>367</volume>&#x2013;<lpage>128170</lpage>. <pub-id pub-id-type="doi">10.1016/j.biortech.2022.128170</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wallace</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Mckain</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Mcewan</surname>
<given-names>N. R.</given-names>
</name>
<name>
<surname>Miyagawa</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Chaudhary</surname>
<given-names>L. C.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>T. P.</given-names>
</name>
<etal/>
</person-group> (<year>2003</year>). <article-title>
<italic>Eubacterium pyruvativorans</italic> sp. nov., a novel non-saccharolytic anaerobe from the rumen that ferments pyruvate and amino acids, forms caproate and utilizes acetate and propionate</article-title>. <source>Int. J. Syst. Evol. Microbiol.</source> <volume>53</volume>, <fpage>965</fpage>&#x2013;<lpage>970</lpage>. <pub-id pub-id-type="doi">10.1099/ijs.0.02110-0</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walters</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Mohan</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Myers</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>Ingle</surname>
<given-names>A. T.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Noguera</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A metagenome-level analysis of a microbial community fermenting ultra-filtered milk permeate</article-title>. <source>Front. Bioeng. Biotechnol</source>. <volume>11</volume>. <pub-id pub-id-type="doi">10.3389/fbioe.2023.1173656</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walters</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Myers</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fortney</surname>
<given-names>N. W.</given-names>
</name>
<name>
<surname>Ingle</surname>
<given-names>A. T.</given-names>
</name>
<name>
<surname>Scarborough</surname>
<given-names>M. J.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Metagenomes and metagenome-assembled genomes from microbial communities fermenting ultrafiltered milk permeate</article-title>. <source>Microbiol. Resour. Announc</source> <volume>11</volume> (<issue>7</issue>), <fpage>e0029322</fpage>. <pub-id pub-id-type="doi">10.1128/mra.00293-22</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Revealing the characteristics of glucose- and lactate-based chain elongation for caproate production by <italic>Caproicibacterium lactatifermentans</italic> through transcriptomic, bioenergetic, and regulatory analyses</article-title>. <source>mSystems</source> <volume>7</volume> (<issue>5</issue>), <fpage>e0053422</fpage>. <pub-id pub-id-type="doi">10.1128/msystems.00534-22</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Watanabe</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Yamano</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Masujima</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ohue-Kitano</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kimura</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Curdlan intake changes gut microbial composition, short-chain fatty acid production, and bile acid transformation in mice</article-title>. <source>Biochem Biophys Rep</source> <volume>27</volume>, <fpage>101095</fpage>. <pub-id pub-id-type="doi">10.1016/j.bbrep.2021.101095</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Wickham</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2016</year>). <source>ggplot2: Elegant graphics for data analysis</source>. <publisher-loc>New York</publisher-loc>: <publisher-name>Springer-Verlag</publisher-name>.</citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Leng</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>G-Y. A.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Leu</surname>
<given-names>S-Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W-H.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Upgrading lignocellulosic ethanol for caproate production via chain elongation fermentation</article-title>. <source>Int. Biodeterior. Biodegrad.</source> <volume>135</volume>, <fpage>103</fpage>&#x2013;<lpage>109</lpage>. <pub-id pub-id-type="doi">10.1016/j.ibiod.2018.09.011</pub-id>
</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yoshikawa</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Araoka</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kajihara</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ito</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Miyamoto</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kodama</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Valerate production by <italic>Megasphaera elsdenii</italic> isolated from pig feces</article-title>. <source>J. Biosci. Bioeng.</source> <volume>125</volume> (<issue>5</issue>), <fpage>519</fpage>&#x2013;<lpage>524</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbiosc.2017.12.016</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Vadlani</surname>
<given-names>P. V.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Lactic acid production from biomass derived sugars via co-fermentation of Lactobacillus brevis and Lactobacillus plantarum</article-title>. <source>J. Biosci. Bioeng.</source> <volume>119</volume> (<issue>6</issue>), <fpage>694</fpage>&#x2013;<lpage>699</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbiosc.2014.10.027</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Si</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hsieh</surname>
<given-names>C-J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>GPU-acceleration for Large-scale Tree Boosting</article-title>. <source>Machine Learning (stat.ML)</source>. <comment>arXiv: 1706.08359</comment>. <pub-id pub-id-type="doi">10.48550/arXiv.1706.08359</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Tao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>The synthesis of n-caproate from lactate: A new efficient process for medium-chain carboxylates production</article-title>. <source>Sci. Rep.</source> <volume>5</volume>, <fpage>14360</fpage>. <pub-id pub-id-type="doi">10.1038/srep14360</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>