<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article article-type="methods-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">777877</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2022.777877</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Methods</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>ARZIMM: A Novel Analytic Platform for the Inference of Microbial Interactions and Community Stability from Longitudinal Microbiome Study</article-title>
<alt-title alt-title-type="left-running-head">He et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">Microbial Interactions and Community Stability</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>He</surname>
<given-names>Linchen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1621522/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Chan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hu</surname>
<given-names>Jiyuan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1671067/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gao</surname>
<given-names>Zhan</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1560870/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Falcone</surname>
<given-names>Emilia</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Holland</surname>
<given-names>Steven M.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/744872/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Blaser</surname>
<given-names>Martin J.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Huilin</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1086408/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Novartis Pharmaceuticals Corporation</institution>, <addr-line>East Hanover</addr-line>, <addr-line>NJ</addr-line>, <country>United&#x20;States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Division of Biostatistics</institution>, <institution>Department of Population Health</institution>, <institution>New York University School of Medicine</institution>, <addr-line>East Hanover</addr-line>, <addr-line>NY</addr-line>, <country>United&#x20;States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Center for Advanced Biotechnology and Medicine, Rutgers University</institution>, <addr-line>New Brunswick</addr-line>, <addr-line>NJ</addr-line>, <country>United&#x20;States</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Division of Intramural Research</institution>, <institution>Immunopathogenesis Section</institution>, <institution>NIAID</institution>, <institution>NIH</institution>, <addr-line>Bethesda</addr-line>, <addr-line>MD</addr-line>, <country>United&#x20;States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/258592/overview">Himel Mallick</ext-link>, Merck, United&#x20;States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/689126/overview">Boyu Ren</ext-link>, Dana&#x2013;Farber Cancer Institute, United&#x20;States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/687204/overview">Siyuan Ma</ext-link>, University of Pennsylvania, United&#x20;States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/895103/overview">Qiwei Li</ext-link>, The University of Texas at Dallas, United&#x20;States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Huilin Li, <email>huilin.li@nyulangone.org</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Computational Genomics, a section of the journal Frontiers in Genetics</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>25</day>
<month>02</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>13</volume>
<elocation-id>777877</elocation-id>
<history>
<date date-type="received">
<day>16</day>
<month>09</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>31</day>
<month>01</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 He, Wang, Hu, Gao, Falcone, Holland, Blaser and Li.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>He, Wang, Hu, Gao, Falcone, Holland, Blaser and Li</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>Dynamic changes of microbiome communities may play important roles in human health and diseases. The recent rise in longitudinal microbiome studies calls for statistical methods that can model the temporal dynamic patterns and simultaneously quantify the microbial interactions and community stability. Here, we propose a novel autoregressive zero-inflated mixed-effects model (ARZIMM) to capture the sparse microbial interactions and estimate the community stability. ARZIMM employs a zero-inflated Poisson autoregressive model to model the excessive zero abundances and the non-zero abundances separately, a random effect to investigate the underlining dynamic pattern shared within the group, and a Lasso-type penalty to capture and estimate the sparse microbial interactions. Based on the estimated microbial interaction matrix, we further derive the estimate of community stability, and identify the core dynamic patterns through network inference. Through extensive simulation studies and real data analyses we evaluate ARZIMM in comparison with the other methods.</p>
</abstract>
<kwd-group>
<kwd>autoregressive</kwd>
<kwd>longitudinal microbiome data</kwd>
<kwd>microbial community stability</kwd>
<kwd>mixed-effects model</kwd>
<kwd>zero-inflated</kwd>
<kwd>network analysis</kwd>
<kwd>microbial interaction</kwd>
<kwd>absolute abundance</kwd>
</kwd-group>
<contract-num rid="cn001">R01DK110014 P20CA252728 U01AI22285</contract-num>
<contract-sponsor id="cn001">National Institutes of Health<named-content content-type="fundref-id">10.13039/100000002</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>The human microbiota, a diverse array of microbial organisms living in and on human bodies, form a dynamic ecosystem that plays a critical role in human health. While temporally stable microbial communities are observed among healthy adults (<xref ref-type="bibr" rid="B13">Faith et&#x20;al., 2013</xref>), the fluctuation of microbiome has been linked to increasing frailty (<xref ref-type="bibr" rid="B23">Jackson et&#x20;al., 2016</xref>) and declining immune function of hosts (<xref ref-type="bibr" rid="B7">Claesson et&#x20;al., 2012</xref>), and diseases such as inflammatory bowel disease (<xref ref-type="bibr" rid="B29">Martinez et&#x20;al., 2008</xref>; <xref ref-type="bibr" rid="B53">Zuo and Ng, 2018</xref>), colorectal cancer (<xref ref-type="bibr" rid="B38">Scanlan et&#x20;al., 2008</xref>; <xref ref-type="bibr" rid="B46">Uronis et&#x20;al., 2009</xref>), and irritable bowel syndrome (<xref ref-type="bibr" rid="B30">Maukonen et&#x20;al., 2006</xref>; <xref ref-type="bibr" rid="B4">Carroll et&#x20;al., 2012</xref>). When a microbial community changes in response to an external perturbation, it undergoes a dynamic process and tends to evolve toward another stable state (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>). This dynamic process is stochastic and varies according to the type and strength of perturbation, the community stability prior to the perturbation, and other subject-level relevant features. The recent rise in longitudinal studies, in which microbial samples are collected repeatedly over time, offers unique insights into the responses of such communities to perturbations and the associated dynamic patterns. For example, in our ongoing microbiome study evaluating the effects of antibiotic exposure as a short-term perturbation on microbial, immune, and metabolic physiology (MIME study), we are interested in determining how differently the microbial community responds to the antibiotic treatment.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Schematic of the evolution of microbial community states in response to external perturbation. External perturbation (blue arrows) can affect microbial community composition (shown in a pie chart), defined as a community state. For each state, the ball-in-basin diagram portrays stability measured by the variance in the stationary distribution of the location of the ball. White arrows indicate the reaction of microbial community to the perturbation.</p>
</caption>
<graphic xlink:href="fgene-13-777877-g001.tif"/>
</fig>
<p>Human microbiota studies have been accelerated by the advent of next-generation sequencing technologies which enabled the quantification of the composition of microbiomes, often by two common sequencing approaches&#x2014;16S rRNA marker gene sequencing and shotgun metagenomics sequencing (<xref ref-type="bibr" rid="B50">Woo et&#x20;al., 2008</xref>). There are pros and cons to each of those techniques, which are discussed in recent reviews (<xref ref-type="bibr" rid="B40">Shankar, 2017</xref>; <xref ref-type="bibr" rid="B18">Gilbert et&#x20;al., 2018</xref>). But for both methods, because of the varying sequencing read counts obtained across samples, it is necessary to employ various normalization tools to convert raw counts data into relative abundances (<xref ref-type="bibr" rid="B25">Knight et&#x20;al., 2018</xref>). However, the dependency of the compositional components greatly hampers the interpretation of microbiota changes in longitudinal studies. There is reason to believe that the absolute abundances of bacteria are biologically meaningful measures, especially in the study of microbial interactions. Thus, in our MIME study, we use an independent quantitative polymerase chain reaction (qPCR) technology (<xref ref-type="bibr" rid="B33">Nadkarni et&#x20;al., 2002</xref>; <xref ref-type="bibr" rid="B34">Ott et&#x20;al., 2004</xref>; <xref ref-type="bibr" rid="B24">Kim et&#x20;al., 2013</xref>) to quantify total bacterial load per unit sample, and then use these data to estimate absolute bacterial abundance by combining them with the relative abundance values obtained from 16S rRNA or shotgun sequencing methods. This MIME study motivated us to develop analytical methods to investigate microbial interaction and community stability after a strong external perturbation, and identify core active microbial taxa by modeling the absolute abundances of bacteria.</p>
<p>Although many well-developed statistical tools are widely used for assessing the diversity of microbial communities and its composition, there are only a few methods available for inferring the ecological networks of microbial communities. Here we briefly review the well-developed statistical methods for studying the dynamic microbial systems and their limitations.</p>
<p>A Bayesian network contains a set of multivariate joint distributions that exhibit certain conditional independences and a directed and acyclic graph that encodes conditional independences among random variables. If the dependence relationships repeat and the signals at a certain time point only depend on the signals from previous time points, then the whole network can be formulated as a dynamic Bayesian network (DBN) (<xref ref-type="bibr" rid="B37">Russell and Norvig, 2002</xref>) representation. McGeachie et&#x20;al. (<xref ref-type="bibr" rid="B31">McGeachie, 2016</xref>) constructed a simplified two-stage DBN which uses a Markov assumption that the observed values at time <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> are independent of those at earlier time points (<inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and earlier) given the variable values at time <inline-formula id="inf3">
<mml:math id="m3">
<mml:mi>t</mml:mi>
</mml:math>
</inline-formula>. Lugo-Martinez et&#x20;al. presented a computational pipeline which first aligns the data collected from all individuals, and then learns a dynamic Bayesian network from the aligned profiles (<xref ref-type="bibr" rid="B27">Lugo-Martinez et&#x20;al., 2019</xref>). However, DBN has several limitations in analyzing the longitudinal microbial data. 1) It can only model the microbial community subject-by-subject. 2) DBN cannot handle the excess zeros in microbiome data. Most methods remove the taxa whose relative abundances exhibit zero entry (i.e.,&#x20;not present in a measurable amount at one or more of the measured time points) before the downstream analysis. 3) The assumed distributions are unrealistic. E.g. all continue variables are assumed to be normally distributed. 4) The computational cost is relatively high, since parent nodes are added sequentially for each bacterial node. Additionally, the maximum number of possible parents is imposed, which is not realistic. 5) Due to sampling and sequencing limitations, the compositionality bias in microbiome data may also cause inaccurate estimation of parameters. The existing methods ignore this compositionality bias, making parameter estimates difficult to interpret. 6) Irregular sampling time may also result in inaccurate parameter estimation. Therefore, it is advised to cautiously interpret the findings from DBN (<xref ref-type="bibr" rid="B14">Faust and Raes, 2012</xref>; <xref ref-type="bibr" rid="B17">Gerber, 2014</xref>).</p>
<p>The classical Lotka-Volterra equation has been used to model simple system such as two species in a predator-prey relationship, where the interactions are strictly assumed to be competitive. The generalized Lotka-Volterra (gLV) equations extend the classical predator-prey (Lotka-Volterra) equations, where the interacting species might have a wide range of relationships including competition, cooperation, or neutralism. Assuming that the interaction (or the effect) of one species with another can be modeled by the corresponding coefficient in the equation, gLV equations provide a framework to analyze and simulate microbial populations. Mounier et&#x20;al. used the gLV equations to model the interaction between bacteria and yeast in a cheese microbiome (<xref ref-type="bibr" rid="B32">Mounier et&#x20;al., 2009</xref>). Other microbiome studies further extended and implemented the gLV equations (<xref ref-type="bibr" rid="B28">Marino et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B9">Dam et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B11">de Vos et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B47">Venturelli et&#x20;al., 2018</xref>).</p>
<p>Many software are available for applying gLV modeling on microbial time series data, such as LIMITS (<xref ref-type="bibr" rid="B15">Fisher and Mehta, 2014</xref>), MetaMis (<xref ref-type="bibr" rid="B41">Shaw et&#x20;al., 2016</xref>), and MDSINE (<xref ref-type="bibr" rid="B1">Bucci et&#x20;al., 2016a</xref>). LIMITS and MetaMis can be implemented to construct microbial interactions using the longitudinal microbiome data from one subject. MDSINE can jointly analyze multiple time series, but requires Matlab programming. Web-gLV (<ext-link ext-link-type="uri" xlink:href="http://web.rniapps.net/webglv">http://web.rniapps.net/webglv</ext-link>) can be used for modeling, visualization, and analysis of microbial populations, but can only handle limited number of samples. In summary, there are several limitations of gLV in analyzing the longitudinal microbial data. 1) gLV based models capture the interactions using a single averaged effect, thus they are not well-suited for noisy data. 2) Some methods estimate almost all possible edges without incorporating variable selection techniques. 3) gLV estimates the growth rate of each taxon marginally, therefore, ignores the intrinsic dynamic correlations of the repeated measurements. 4) gLV does not account for random processes which form essential part of any biological system. 5) With the increased number of species and time span of prediction, the simulation output is prone to numerical errors. For example, Web-gLV can only simulate a maximum of 10 species at a time for at most 100&#x20;time points. 6) As DBN, gLV is not suitable for sparse, compositional, and irregular sampled microbiome&#x20;data.</p>
<p>In Ives et&#x20;al. (<xref ref-type="bibr" rid="B21">Ives et&#x20;al., 2003</xref>), the stability of a microbial community is determined by three key interrelated components of microbial community structure: diversity, species composition, and interaction pattern among species. They viewed the dynamics of a microbial community as a stochastic process and proposed to use a first-order multivariate autoregressive process [MAR (1)] time-series model to disentangle the effects of these three components on community stability and to estimate the stability properties of a community by estimating the strengths of interactions between species. This method is widely used to estimate the stability of ecosystems (e.g., lake, ocean) based on culture-dependent microbial data (<xref ref-type="bibr" rid="B3">Carpenter et&#x20;al., 2011</xref>; <xref ref-type="bibr" rid="B39">Shade et&#x20;al., 2013</xref>). Usually a few (four or five) key microbes are detected with high frequency in each ecosystem in time-series measurements over a long period, and their abundances are rarely zero. In contrast, our MIME study will yield microbiome data from approximately nine time points over half a year from 80 subjects in three groups in the complete study&#x2014;a relatively smaller number of repeated microbiome samples but from a relatively larger number of microbial communities (subjects) than what would be the case for an ecosystem study. Moreover, the 16S rRNA sequencing and qPCR methods used in this study provide absolute abundances for a staggering number of taxa, which include a large number of zero values. Because the MAR modeling methods require the normality assumption, they are not appropriate for analyzing data from sequence-based longitudinal microbiome studies. Therefore, we propose an autoregressive zero-inflated mixed effects model (ARZIMM) to address the special features of data instead. Its novelties are threefold. First, we propose to use a zero-inflated Poisson autoregressive model to model the excessive zero abundances and the non-zero abundances separately. Second, the random effects in the proposed model can investigate the underlining dynamic pattern shared within the group. Third, the employment of regularization techniques and network inference in our model enables the identification of the core dynamic patterns. The proposed ARZIMM estimates the strength of interactions between taxa, which is required to estimate the stability properties of a community, and identify key active taxa efficiently by using all of the longitudinal sequencing data. ARZIMM has been implemented in an open-source software package (<ext-link ext-link-type="uri" xlink:href="https://github.com/Hlch1992/ARZIMM">https://github.com/Hlch1992/ARZIMM</ext-link>), and provides a useful tool for formulating, understanding, and implementing longitudinal microbiome data analysis.</p>
<p>In the following Material and Method section, we introduce the ARZIMM framework, discuss the quantification of microbial stability based on the estimated microbial interaction matrix, and investigate the conditions under which there exist a strict-sense stationary distribution. Then in the Result section, we evaluate ARZIMM using extensive simulation studies to show that it outperforms the conventional methods, and apply ARZIMM to the MIME study to illustrate network visualization and inference. In the end, we conclude with Discussion section.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and Methods</title>
<sec id="s2-1">
<title>ARIZMM Model</title>
<p>As illustrated in <xref ref-type="fig" rid="F2">Figure&#x20;2</xref>, ARZIMM can be considered as a two-part model which comprises a logistic component and an autoregressive component. To address zero inflation, we consider the zero-inflated mixture model because it assumes both sampling zeros (due to the low sequencing depth) and structural zeros (being truly absent) exist in the data. Specifically, the logistic component models the structure zeros of taxa in the samples, and the autoregressive component models the non-structure-zero abundances of the taxa under the assumption that the changes in abundances from time <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> to time <inline-formula id="inf5">
<mml:math id="m5">
<mml:mi>t</mml:mi>
</mml:math>
</inline-formula> depend only on the observed abundances at time <inline-formula id="inf6">
<mml:math id="m6">
<mml:mrow>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and other time-independent covariates, and the observed abundances before time <inline-formula id="inf7">
<mml:math id="m7">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> have no direct effect. Since the goal of ARZIMM is to characterize microbial interactions and community stability during a short period after a strong external perturbation like the antibiotic usage in our MIME study, we assume there are no other time-dependent factors exist to affect the microbial stability.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Graphical representation of ARZIMM model and analytic techniques.</p>
</caption>
<graphic xlink:href="fgene-13-777877-g002.tif"/>
</fig>
</sec>
<sec id="s2-2">
<title>Notation and Model Specifications</title>
<p>Let <inline-formula id="inf8">
<mml:math id="m8">
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> denote the observed absolute abundance of bacterial taxon <inline-formula id="inf9">
<mml:math id="m9">
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>...</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>M</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> for subject <inline-formula id="inf10">
<mml:math id="m10">
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> at time <inline-formula id="inf11">
<mml:math id="m11">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>...</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>n</mml:mi>
<mml:mo>,</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mi>t</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>...</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, and we model <inline-formula id="inf12">
<mml:math id="m12">
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> with a conditional mixture distribution as follow:<disp-formula id="e1">
<mml:math id="m13">
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mi>&#x3bd;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
</mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:msub>
<mml:mo>&#x223c;</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mtable>
<mml:mtr>
<mml:mtd>
<mml:mn>0</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
</mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mi>&#x3bd;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mo>;</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>&#x3d5;</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mtd>
<mml:mtd>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>where <inline-formula id="inf13">
<mml:math id="m14">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3bd;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents all information that is known at time <inline-formula id="inf14">
<mml:math id="m15">
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> for individual <inline-formula id="inf15">
<mml:math id="m16">
<mml:mi>i</mml:mi>
</mml:math>
</inline-formula>, including the observed absolute abundance <inline-formula id="inf16">
<mml:math id="m17">
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and later defined coviariates <inline-formula id="inf17">
<mml:math id="m18">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">W</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf18">
<mml:math id="m19">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">Z</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. The parameter <inline-formula id="inf19">
<mml:math id="m20">
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the probability of the observation <inline-formula id="inf20">
<mml:math id="m21">
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> being structural zero and is assumed time independent. Furthermore, <inline-formula id="inf21">
<mml:math id="m22">
<mml:mi>F</mml:mi>
</mml:math>
</inline-formula> is assumed to be an exponential dispersion family distribution with the canonical parameter <inline-formula id="inf22">
<mml:math id="m23">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and the dispersion parameter <inline-formula id="inf23">
<mml:math id="m24">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3d5;</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. Both Poisson and negative binomial (NB) distributions can be used as to model absolute abundance. Below we illustrate the detailed modelling using Poisson&#x20;model.</p>
<p>The mixture probability parameters <inline-formula id="inf24">
<mml:math id="m25">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> ,&#x2026;, <inline-formula id="inf25">
<mml:math id="m26">
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>)</mml:mo>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> are modeled by the logistic regression:<disp-formula id="e2">
<mml:math id="m27">
<mml:mrow>
<mml:mi mathvariant="italic">log</mml:mi>
<mml:mo>&#x2061;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">W</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">a</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>where <inline-formula id="inf26">
<mml:math id="m28">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">W</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> consists of intercept and <inline-formula id="inf27">
<mml:math id="m29">
<mml:mi>l</mml:mi>
</mml:math>
</inline-formula> time independent covariates for individual <inline-formula id="inf28">
<mml:math id="m30">
<mml:mi>i</mml:mi>
</mml:math>
</inline-formula>, the parameter <inline-formula id="inf29">
<mml:math id="m31">
<mml:mrow>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mi mathvariant="bold">M</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is an <inline-formula id="inf30">
<mml:math id="m32">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> matrix whose elements <inline-formula id="inf31">
<mml:math id="m33">
<mml:mrow>
<mml:msub>
<mml:mi>A</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the effect of covariate <inline-formula id="inf32">
<mml:math id="m34">
<mml:mi>j</mml:mi>
</mml:math>
</inline-formula> on the zero proportion of taxon <inline-formula id="inf33">
<mml:math id="m35">
<mml:mi>m</mml:mi>
</mml:math>
</inline-formula>. <inline-formula id="inf34">
<mml:math id="m36">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">a</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is an <inline-formula id="inf35">
<mml:math id="m37">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> vector of random intercepts to model the within-subject heterogeneity of being zero for individual <inline-formula id="inf36">
<mml:math id="m38">
<mml:mi>i</mml:mi>
</mml:math>
</inline-formula> and has the joint multivariate normal distribution <inline-formula id="inf37">
<mml:math id="m39">
<mml:mrow>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">&#x3a3;</mml:mi>
<mml:mi mathvariant="bold">a</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<p>The canonical parameters for Poisson distribution is <inline-formula id="inf38">
<mml:math id="m40">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>log</mml:mtext>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>.</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> We introduce the auto-regressive model by relating <inline-formula id="inf39">
<mml:math id="m41">
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> to the <inline-formula id="inf40">
<mml:math id="m42">
<mml:mrow>
<mml:msup>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> individual&#x2019;s observed log-transformed absolute abundance vector at time <inline-formula id="inf41">
<mml:math id="m43">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>:</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>log</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mi>log</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> (where the pseudo count 1 is added to avoid the undefined logarithm when the absolute abudance is zero), and <inline-formula id="inf42">
<mml:math id="m44">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">Z</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>Z</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>Z</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>q</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> the intercept and <inline-formula id="inf43">
<mml:math id="m45">
<mml:mi>q</mml:mi>
</mml:math>
</inline-formula> time-independent covariates of individual <inline-formula id="inf44">
<mml:math id="m46">
<mml:mi>i</mml:mi>
</mml:math>
</inline-formula> by<disp-formula id="e3">
<mml:math id="m47">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="bold-italic">B</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="bold-italic">C</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">Z</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b7;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>where <inline-formula id="inf45">
<mml:math id="m48">
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:math>
</inline-formula> is an <inline-formula id="inf46">
<mml:math id="m49">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> matrix whose element <inline-formula id="inf47">
<mml:math id="m50">
<mml:mrow>
<mml:msub>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> gives the effect of the abundance of taxon <inline-formula id="inf48">
<mml:math id="m51">
<mml:mi>j</mml:mi>
</mml:math>
</inline-formula> on the growth rate of taxon <inline-formula id="inf49">
<mml:math id="m52">
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <inline-formula id="inf50">
<mml:math id="m53">
<mml:mi mathvariant="bold-italic">C</mml:mi>
</mml:math>
</inline-formula> is an <inline-formula id="inf51">
<mml:math id="m54">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>q</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> matrix whose element <inline-formula id="inf52">
<mml:math id="m55">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> gives the effect of covariate <inline-formula id="inf53">
<mml:math id="m56">
<mml:mi>j</mml:mi>
</mml:math>
</inline-formula> on taxon <inline-formula id="inf54">
<mml:math id="m57">
<mml:mi>m</mml:mi>
</mml:math>
</inline-formula>, and <inline-formula id="inf55">
<mml:math id="m58">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b7;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>&#x3b7;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mn>...</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3b7;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is time-independent random intercepts. Note that, as an autoregressive model, <inline-formula id="inf56">
<mml:math id="m59">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b7;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is correlated with the fixed effect <inline-formula id="inf57">
<mml:math id="m60">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and this dependency can be tracked all the way back to the initial observation <inline-formula id="inf58">
<mml:math id="m61">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. Because the standard random effects model has assumption that the random effects are independent to the other covariates in the model, in order to derive the random effect type maximum likelihood (ML) estimators, we use the Chamberlain type projections (<xref ref-type="bibr" rid="B6">Chamberlain, 1982</xref>) to get around this correlation. Specifically, we project <inline-formula id="inf59">
<mml:math id="m62">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b7;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> onto the time <inline-formula id="inf60">
<mml:math id="m63">
<mml:mn>0</mml:mn>
</mml:math>
</inline-formula> observations <inline-formula id="inf61">
<mml:math id="m64">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> by:<disp-formula id="e4">
<mml:math id="m65">
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b7;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3a0;</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>where <inline-formula id="inf62">
<mml:math id="m66">
<mml:mi mathvariant="bold-italic">&#x3a0;</mml:mi>
</mml:math>
</inline-formula> is an <inline-formula id="inf63">
<mml:math id="m67">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> matrix with diag(<inline-formula id="inf64">
<mml:math id="m68">
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#x3a0;</mml:mi>
<mml:mo>)</mml:mo>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>&#x3c0;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>&#x3c0;</mml:mi>
<mml:mi>M</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> and off-diagonal components being zero. The components of <inline-formula id="inf65">
<mml:math id="m69">
<mml:mi mathvariant="bold-italic">&#x3a0;</mml:mi>
</mml:math>
</inline-formula> represent how much variation in <inline-formula id="inf66">
<mml:math id="m70">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b7;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is due to the dependence on subject <inline-formula id="inf67">
<mml:math id="m71">
<mml:mi>i</mml:mi>
</mml:math>
</inline-formula>&#x2019;s initial value <inline-formula id="inf68">
<mml:math id="m72">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. <inline-formula id="inf69">
<mml:math id="m73">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mn>...</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> is an <inline-formula id="inf70">
<mml:math id="m74">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> vector, representing the independent subject-specific random effect and follows a joint multivariate normal distribution <inline-formula id="inf71">
<mml:math id="m75">
<mml:mrow>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">&#x3a3;</mml:mi>
<mml:mi mathvariant="bold">b</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<p>In the model, our primary interest is to estimate matrix <inline-formula id="inf72">
<mml:math id="m76">
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:math>
</inline-formula> , which measures the strengths of interactions between taxa. For a microbial community with a given number of species, its stability or dynamics status depends on the changes in the species&#x2019; population growth rates due to perturbation, which immediately cause the changes in the population growth rates of other species via species-species interactions (<xref ref-type="bibr" rid="B22">Ives et&#x20;al., 2000</xref>). Interaction between species can be viewed as a filter that amplifies the variability in species&#x2019; population growth rates caused by perturbation.</p>
<p>Note that we choose Poisson distribution because of its nice stationary distribution property in the autoregressive model which is crucial for our following stability investigation. To deal with the over-dispersion of microbiome data, we implemented the quasi-Poisson model (<xref ref-type="bibr" rid="B48">Ver Hoef and Boveng, 2007</xref>) in the simulation and real data analysis.</p>
</sec>
<sec id="s2-3">
<title>Penalized ML Estimation and Variable Selection</title>
<p>To define the joint likelihood of the longitudinal microbial absolute abundance data <inline-formula id="inf73">
<mml:math id="m77">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> <italic>,</italic> we assume that the vector of time independent random effects <inline-formula id="inf74">
<mml:math id="m78">
<mml:mrow>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msubsup>
<mml:mi>a</mml:mi>
<mml:mi>i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mi>b</mml:mi>
<mml:mi>i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> underlies both the zero and autoregressive generative processes and these random effects account for the within-subject group heterogeneity in the multivariate logistic component and the multivariate autoregressive component. Denote <inline-formula id="inf75">
<mml:math id="m79">
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="bold-italic">D</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="bold-italic">B</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">C</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">D</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mn>...</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">D</mml:mi>
<mml:mi>M</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> <italic>,</italic> <inline-formula id="inf76">
<mml:math id="m80">
<mml:mrow>
<mml:mi>&#x3d5;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>&#x3d5;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mn>...</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3d5;</mml:mi>
<mml:mi>M</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> , and <inline-formula id="inf77">
<mml:math id="m81">
<mml:mrow>
<mml:msub>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mo>&#x22c5;</mml:mo>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> as the indication function that when <inline-formula id="inf78">
<mml:math id="m82">
<mml:mrow>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mo>&#xb7;</mml:mo>
<mml:mo>]</mml:mo>
</mml:mrow>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> meets, <inline-formula id="inf79">
<mml:math id="m83">
<mml:mrow>
<mml:msub>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mo>&#x22c5;</mml:mo>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:msub>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, otherwise, <inline-formula id="inf80">
<mml:math id="m84">
<mml:mrow>
<mml:msub>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mo>&#x22c5;</mml:mo>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:msub>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. Formally, we have the joint likelihood function as:<disp-formula id="e5">
<mml:math id="m85">
<mml:mrow>
<mml:mi mathvariant="normal">&#x2112;</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">D</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3a0;</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3d5;</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:munderover>
<mml:mstyle displaystyle="true">
<mml:mo>&#x220f;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
<mml:mstyle displaystyle="true">
<mml:mrow>
<mml:mo>&#x222b;</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:munderover>
<mml:mstyle displaystyle="true">
<mml:mo>&#x220f;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:munderover>
<mml:munderover>
<mml:mstyle displaystyle="true">
<mml:mo>&#x220f;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>M</mml:mi>
</mml:munderover>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>y</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3d5;</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">c</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
<mml:mi>d</mml:mi>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>where <inline-formula id="inf81">
<mml:math id="m86">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>y</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the conditional probability density function and given as<disp-formula id="e6">
<mml:math id="m87">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>y</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3d5;</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3d5;</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msup>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3d5;</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2260;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
<label>(6)</label>
</disp-formula>
</p>
<p>The function <inline-formula id="inf82">
<mml:math id="m88">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">c</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the joint distribution of <inline-formula id="inf83">
<mml:math id="m89">
<mml:mrow>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf84">
<mml:math id="m90">
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:mtable>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mi mathvariant="bold-italic">a</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mtd>
<mml:mtd>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">a</mml:mi>
<mml:mi mathvariant="bold-italic">b</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">a</mml:mi>
<mml:mi mathvariant="bold-italic">b</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mtd>
<mml:mtd>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mi mathvariant="bold-italic">b</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> represents the corresponding <inline-formula id="inf85">
<mml:math id="m91">
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mi>M</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> covariance matrix, where <inline-formula id="inf86">
<mml:math id="m92">
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
</mml:math>
</inline-formula> accounts for all unique non-zero elements of <inline-formula id="inf87">
<mml:math id="m93">
<mml:mi>&#x3a3;</mml:mi>
</mml:math>
</inline-formula>. For the model and computational simplicity, we assume <inline-formula id="inf88">
<mml:math id="m94">
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>v</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">a</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mi>&#x3a3;</mml:mi>
<mml:mrow>
<mml:mi>a</mml:mi>
<mml:mi>b</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, i.e. <inline-formula id="inf89">
<mml:math id="m95">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">a</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf90">
<mml:math id="m96">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are independent.</p>
<p>Assuming that the true underlying fixed effects <inline-formula id="inf91">
<mml:math id="m97">
<mml:mi mathvariant="bold-italic">A</mml:mi>
</mml:math>
</inline-formula> and <inline-formula id="inf92">
<mml:math id="m98">
<mml:mi mathvariant="bold-italic">D</mml:mi>
</mml:math>
</inline-formula> are sparse, we advocate a Lasso-type approach, which adds an <inline-formula id="inf93">
<mml:math id="m99">
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> -penalty for the fixed-effects to the likelihood function. Thus, we consider the following objective function:<disp-formula id="e7">
<mml:math id="m100">
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>Q</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#x2061;</mml:mo>
<mml:mi>log</mml:mi>
<mml:mi mathvariant="normal">&#x2112;</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:munderover>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>M</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">D</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>.</mml:mo>
</mml:math>
<label>(7)</label>
</disp-formula>
</p>
<p>Maximization of the penalized log-likelihood function corresponding to <xref ref-type="disp-formula" rid="e7">Eq. 7</xref> with respect to <inline-formula id="inf94">
<mml:math id="m101">
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="bold-italic">D</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3a0;</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3d5;</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is a computationally challenging task. This is mainly because both integrals with respect to the random effects and the zero-inflated structure do not have analytical solutions. Following the conventional methods, we propose to implement a Laplace approximation on the integral of random effects in <xref ref-type="disp-formula" rid="e7">Eq. 7</xref> and use the Expectation-Maximization (EM) algorithm to calculate the expectation and compute parameters iteratively, in which the label of zero is treated as &#x201c;missing data&#x201d;. The tuning parameters are selected using Bayesian information criterion (BIC).</p>
</sec>
<sec id="s2-4">
<title>Stability Properties</title>
<p>The existence of a stationary distribution has been investigated for the log-linear Poisson auto-regression model based on the perturbation technique (<xref ref-type="bibr" rid="B16">Fokianos and Tj&#xf8;stheim, 2011</xref>). Here, we prove the existence of a stationary distribution of a zero-inflated Poisson mixed-effect auto-regression model in Theorem 1 utilizing the theory of Markov chains which has been proposed to prove the existence of a stationary distribution of a general class of time series count models (<xref ref-type="bibr" rid="B12">Douc et&#x20;al., 2013</xref>). The detailed proof is provided in the <xref ref-type="sec" rid="s10">Supplementary Material Section S3</xref>.</p>
<p>
<statement content-type="theorem" id="Theorem_1">
<label>Theorem 1</label>
<p>Assuming that time-independent parameters <inline-formula id="inf95">
<mml:math id="m102">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b7;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf96">
<mml:math id="m103">
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are known, if all eigenvalues of matrix <inline-formula id="inf97">
<mml:math id="m104">
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:math>
</inline-formula> lie inside the unit circle, a strict-sense stationary ergodic process <inline-formula id="inf98">
<mml:math id="m105">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>}</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> will exist, where <inline-formula id="inf99">
<mml:math id="m106">
<mml:mi mathvariant="bold-italic">N</mml:mi>
</mml:math>
</inline-formula> denotes the set of natural numbers.</p>
<p>With this Theorem, we can first show that for a microbial community, its dynamic process <inline-formula id="inf100">
<mml:math id="m107">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>}</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mi mathvariant="bold-italic">N</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> has a stationary distribution by proving that all eigenvalues of matrix <inline-formula id="inf101">
<mml:math id="m108">
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:math>
</inline-formula> lie inside the unit circle. Then, following Ives et&#x20;al. (<xref ref-type="bibr" rid="B21">Ives et&#x20;al., 2003</xref>), we consider the return rate and reactivity as two stability measures based on the variability of the stationary distribution for MAR (1) model. Specifically, return rate depends on the rate at which the perturbed microbial community approaches the stationary distribution and reactivity, and assesses how strongly population-level microbiome abundances are pulled towards the mean of the stationary distribution. Both are bounded by the largest eigenvalue of <inline-formula id="inf102">
<mml:math id="m109">
<mml:mi>B</mml:mi>
</mml:math>
</inline-formula>, denoted by <inline-formula id="inf103">
<mml:math id="m110">
<mml:mrow>
<mml:mtext>max</mml:mtext>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3bb;</mml:mi>
<mml:mi>B</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. In general, a smaller <inline-formula id="inf104">
<mml:math id="m111">
<mml:mrow>
<mml:mtext>max</mml:mtext>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3bb;</mml:mi>
<mml:mi>B</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> indicates the perturbed microbial community approaches its stationary distribution faster, or a system is less reactive, then the microbial community is more stable. The detailed proof is deferred in the <xref ref-type="sec" rid="s10">Supplementary Material Section S3.2</xref>.</p>
<p>Based on the theory in Ives et&#x20;al. (<xref ref-type="bibr" rid="B21">Ives et&#x20;al., 2003</xref>), for a community with multiple species, the covariance matrix of the stationary distribution depends on the covariance matrix of the process error and the interactions between species captured in the matrix <inline-formula id="inf105">
<mml:math id="m112">
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:math>
</inline-formula>. As illustrated in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>, when the external perturbation(blue arrow) acts on the community, the ball(microbial community) sitting in a deep bowl in state 2 which represents a relatively stable system, will return to its stationary state faster than the ball sitting in a shallow bowl in state 1 which represents a less stable system. In a stable system, the variance of stationary distribution is only slightly greater than the variance of process error and the variance of species interaction is small. In contrast, in a less stable system, the species interaction will amplify the environmental variance and create large variance in the stationary distribution, therefore the variance of species interaction is large, assuming the process errors are similar in the compared two states. Thus, the difference between the variances of stationary distribution of different communities can be attributed to species interactions. The smaller of the variance of matrix <inline-formula id="inf106">
<mml:math id="m113">
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> the more stable of the study microbial community.</p>
</statement>
</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>Simulation Study</title>
<p>We have conducted extensive simulation studies to evaluate the performance of ARZIMM in both model fitting and variable selection by comparing it with the competing methods: penalized Poisson auto-regression (Poisson), penalized log-normal multivariate auto-regression (MAR), and extended generalized Lotka-Volterra (gLV) equations using Bayesian algorithm (MDSINE) (<xref ref-type="bibr" rid="B2">Bucci et&#x20;al., 2016b</xref>). The brief descriptions of these methods are provided in the <xref ref-type="sec" rid="s10">Supplementary Material Section S2</xref>.</p>
<sec id="s3-1-1">
<title>Simulation Design</title>
<p>We generated the longitudinal absolute abundances from zero-inflated Poisson distribution with parameters <inline-formula id="inf107">
<mml:math id="m114">
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf108">
<mml:math id="m115">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> for each taxon. Since our focus is on the estimation of the interaction matrix <inline-formula id="inf109">
<mml:math id="m116">
<mml:mrow>
<mml:mi mathvariant="bold-italic">B</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">&#xa0;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> which depends on the non-zero part, we adopted a simple simulation design for the zero inflation proportions <inline-formula id="inf110">
<mml:math id="m117">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mn>...</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
<mml:mo>.</mml:mo>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> We ignored the individual variations in <inline-formula id="inf111">
<mml:math id="m118">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> by dropping the random effect term <inline-formula id="inf112">
<mml:math id="m119">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">a</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> in <xref ref-type="disp-formula" rid="e2">Eq. 2</xref>. With model <inline-formula id="inf113">
<mml:math id="m120">
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">W</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and by controlling the values of <inline-formula id="inf114">
<mml:math id="m121">
<mml:mi mathvariant="bold-italic">W</mml:mi>
</mml:math>
</inline-formula> and <inline-formula id="inf115">
<mml:math id="m122">
<mml:mi mathvariant="bold-italic">A</mml:mi>
</mml:math>
</inline-formula> respectively, we set the zero inflation proportions <inline-formula id="inf116">
<mml:math id="m123">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> for 20 taxa to mimic the observed sparsity in real data as<disp-formula id="e8">
<mml:math id="m124">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mn>0.72</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>1.00</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.96</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.34</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.50</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.56</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.94</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.84</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.98</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>1.00</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.78</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.68</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.96</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>1.00</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.38</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.56</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.82</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>1.00</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.28</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>1.00</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
<label>(8)</label>
</disp-formula>
</p>
<p>The detailed values of <inline-formula id="inf117">
<mml:math id="m125">
<mml:mi mathvariant="bold-italic">W</mml:mi>
</mml:math>
</inline-formula> and <inline-formula id="inf118">
<mml:math id="m126">
<mml:mi mathvariant="bold-italic">A</mml:mi>
</mml:math>
</inline-formula> are provided in the <xref ref-type="sec" rid="s10">Supplementary Material Section S4</xref>. We generated the non-zero absolute abundances from Poisson distribution with their <inline-formula id="inf119">
<mml:math id="m127">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mn>...</mml:mn>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mi>&#x0027;</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> defined as <inline-formula id="inf120">
<mml:math id="m128">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="bold-italic">B</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">Y</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, where the intercept <inline-formula id="inf121">
<mml:math id="m129">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> was set to be the mean log-transformed non-zero absolute abundances of taxa in MIME real data, and the random effects <inline-formula id="inf122">
<mml:math id="m130">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x223c;</mml:mo>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mi>b</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> with <inline-formula id="inf123">
<mml:math id="m131">
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mi>b</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x223c;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.5</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>0.5</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>. We assumed that the interaction matrix <inline-formula id="inf124">
<mml:math id="m132">
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:math>
</inline-formula> was sparse by randomly selecting 5% of its elements to be non-zero. Three interaction matrices were considered with varied informative absolute effect strengths: high (<inline-formula id="inf125">
<mml:math id="m133">
<mml:mrow>
<mml:msubsup>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mi>H</mml:mi>
</mml:msubsup>
<mml:mo>&#x223c;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.5.0.5</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>), medium (<inline-formula id="inf126">
<mml:math id="m134">
<mml:mrow>
<mml:msubsup>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mi>M</mml:mi>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mn>0.1</mml:mn>
</mml:mrow>
</mml:msqrt>
<mml:msubsup>
<mml:mi>&#x3b2;</mml:mi>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mi>H</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>), and low (<inline-formula id="inf127">
<mml:math id="m135">
<mml:mrow>
<mml:msubsup>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mi>L</mml:mi>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0.1</mml:mn>
<mml:msubsup>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mi>H</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>), for the non-zero elements <inline-formula id="inf128">
<mml:math id="m136">
<mml:mrow>
<mml:msub>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. In addition, we designed four simulation scenarios: Scenario 1 with <inline-formula id="inf129">
<mml:math id="m137">
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mi>b</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf130">
<mml:math id="m138">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, considered as the benchmark situation where subjects are homogeneous and taxa are all presented; Scenario 2 with <inline-formula id="inf131">
<mml:math id="m139">
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#xa0;</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mi>b</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x223c;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.5.0.5</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:mi mathvariant="bold-italic">&#xa0;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf132">
<mml:math id="m140">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, where subjects are heterogeneous and taxa are all presented; Scenario 3 with <inline-formula id="inf133">
<mml:math id="m141">
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mi>b</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf134">
<mml:math id="m142">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> as in <xref ref-type="disp-formula" rid="e8">(8)</xref>, where subjects are homogeneous and taxa have zero inflated structure; and Scenario 4 with <inline-formula id="inf135">
<mml:math id="m143">
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3a3;</mml:mi>
<mml:mi>b</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x223c;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="script">N</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.5.0.5</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf136">
<mml:math id="m144">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> as in <xref ref-type="disp-formula" rid="e8">(8)</xref>, where subjects are heterogeneous and taxa have zero inflated structure.</p>
<p>In each scenario, we generated 500 independent repetitions for <inline-formula id="inf137">
<mml:math id="m145">
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>20</mml:mn>
<mml:mo>&#xa0;</mml:mo>
<mml:mtext>or</mml:mtext>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>50</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> subjects, <inline-formula id="inf138">
<mml:math id="m146">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>10</mml:mn>
<mml:mo>&#xa0;</mml:mo>
<mml:mtext>or</mml:mtext>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>20</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> time points, and <inline-formula id="inf139">
<mml:math id="m147">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>20</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> taxa for each sample to evaluate the performance of ARZIMM.</p>
</sec>
<sec id="s3-1-2">
<title>Simulation Results</title>
<p>We first compared the model fittings of ARZIMM, Poisson, and MAR methods using mean normalized squared error score (MNSES), as suggested in the prior studies (<xref ref-type="bibr" rid="B5">Carroll and Cressie, 1997</xref>; <xref ref-type="bibr" rid="B26">Liesenfeld et&#x20;al., 2006</xref>; <xref ref-type="bibr" rid="B8">Czado et&#x20;al., 2009</xref>; <xref ref-type="bibr" rid="B45">Tkacz et&#x20;al., 2018a</xref>). MNSES is defined as <inline-formula id="inf140">
<mml:math id="m148">
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>T</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>&#x3c3;</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> with <inline-formula id="inf141">
<mml:math id="m149">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> being the estimated <inline-formula id="inf142">
<mml:math id="m150">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf143">
<mml:math id="m151">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>&#x3c3;</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> being the estimated standard error of <inline-formula id="inf144">
<mml:math id="m152">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. The closer the MNSES is to 1, the better model fitting the method has. Since MDSINE only provides the estimates of interactions among species without their variance estimates, it was excluded from this comparison. <xref ref-type="table" rid="T1">Table&#x20;1</xref> and <xref ref-type="sec" rid="s10">Supplementary Table S1</xref> summarize the median and interquartile range (IQR) of MNSES over 500 replications for these three methods. Overall, the medians of MNSES for ARZIMM are all around the expected value of 1 in various settings across four scenarios, which indicates the good fitness and robustness of ARZIMM in dealing with excess zeros and the correlation among repeated measures at the same time, as well as its satisfying estimation accuracy on the microbial interaction parameters. However, the other two methods: Poisson and MAR, both exhibit inferior performance. The Poisson model is only competent in Scenario 1, when subjects are homogeneous and no excess zeros are present. In Scenarios 2-4, when any factor, excess zero or subject heterogeneity, presents, the predicted values based on the Poisson model deviate greatly from the observed values. Comparing the considered two factors, Poisson model is more sensitive to the subject heterogeneity and presents larger deviations with it. Due to the invalid normality assumption and lack of consideration of the correlation among the longitudinal measurements, the MAR model exhibits the worst performance among three methods with enormous deviation especially in Scenarios 3 and 4, which confirms the inappropriateness of using conventional statistical methods which require the normality assumption to analyze the microbiome&#x20;data.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Simulation results for all settings under scenario 1 and 4. Poisson refers to the penalized Poisson autoregression model and MAR refers to penalized log-normal multivariate autoregression model. The reported value is median (IQR) of mean normalized squared error score (MNSES) calculated over 500 simulations for each setting. <inline-formula id="inf145">
<mml:math id="m153">
<mml:mi>n</mml:mi>
</mml:math>
</inline-formula> refers to the number of subjects, and <inline-formula id="inf146">
<mml:math id="m154">
<mml:mi>T</mml:mi>
</mml:math>
</inline-formula> refers to the number of time points. Scenarios 2 and 3 are deferred to Supplementary Material.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="2" align="left">Methods</th>
<th colspan="3" align="center">ARZIMM</th>
<th colspan="3" align="center">Poisson</th>
<th colspan="3" align="center">MAR</th>
</tr>
<tr>
<th colspan="2" align="left">Effect size</th>
<th align="center">High</th>
<th align="center">Median</th>
<th align="center">Low</th>
<th align="center">High</th>
<th align="center">Median</th>
<th align="center">Low</th>
<th align="center">High</th>
<th align="center">Median</th>
<th align="center">Low</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td colspan="11" align="left">Scenario 1</td>
</tr>
<tr>
<td align="left">&#x2003;n</td>
<td align="left">T</td>
<td colspan="9" align="center">Median (IQR)</td>
</tr>
<tr>
<td rowspan="2" align="left">&#x2003;20</td>
<td rowspan="2" align="left">10</td>
<td align="center">0.98</td>
<td align="center">0.98</td>
<td align="center">0.98</td>
<td align="center">1.00</td>
<td align="center">0.99</td>
<td align="center">1.00</td>
<td align="center">47</td>
<td align="center">50</td>
<td align="center">52</td>
</tr>
<tr>
<td align="center">(0.97&#x2013;0.99)</td>
<td align="center">(0.97&#x2013;0.99)</td>
<td align="center">(0.97&#x2013;0.99)</td>
<td align="center">(0.99&#x2013;1.01)</td>
<td align="center">(0.984&#x2013;1.00)</td>
<td align="center">(0.99&#x2013;1.00)</td>
<td align="center">(33&#x2013;77)</td>
<td align="center">(35&#x2013;80)</td>
<td align="center">(37&#x2013;80)</td>
</tr>
<tr>
<td rowspan="2" align="left">&#x2003;50</td>
<td rowspan="2" align="left">20</td>
<td align="center">0.99</td>
<td align="center">0.99</td>
<td align="center">0.99</td>
<td align="center">1.00</td>
<td align="center">1.00</td>
<td align="center">1.00</td>
<td align="center">123</td>
<td align="center">115</td>
<td align="center">114</td>
</tr>
<tr>
<td align="center">(0.99&#x2013;1.00)</td>
<td align="center">(0.99&#x2013;1.00)</td>
<td align="center">(0.99&#x2013;1.00)</td>
<td align="center">(1.00&#x2013;1.01)</td>
<td align="center">(1.00&#x2013;1.00)</td>
<td align="center">(1.00&#x2013;1.00)</td>
<td align="center">(86&#x2013;192)</td>
<td align="center">(78&#x2013;187)</td>
<td align="center">(80&#x2013;177)</td>
</tr>
<tr>
<td colspan="11" align="left">Scenario 4</td>
</tr>
<tr>
<td align="left">&#x2003;n</td>
<td align="left">T</td>
<td colspan="9" align="center">Median (IQR)</td>
</tr>
<tr>
<td rowspan="2" align="left">&#x2003;20</td>
<td rowspan="2" align="left">10</td>
<td align="center">0.95</td>
<td align="center">0.92</td>
<td align="center">0.91</td>
<td align="center">30.59</td>
<td align="center">18.87</td>
<td align="center">18.46</td>
<td align="center">30071.82</td>
<td align="center">29390</td>
<td align="center">22435</td>
</tr>
<tr>
<td align="center">(0.87&#x2013;2.30)</td>
<td align="center">(0.86&#x2013;1.10)</td>
<td align="center">(0.86&#x2013;1.02)</td>
<td align="center">(21.90&#x2013;41.51)</td>
<td align="center">(15.26&#x2013;21.95)</td>
<td align="center">(14.77&#x2013;21.80)</td>
<td align="center">(8984&#x2013;133153)</td>
<td align="center">(13929&#x2013;77371)</td>
<td align="center">(10251&#x2013;50171)</td>
</tr>
<tr>
<td rowspan="2" align="left">&#x2003;50</td>
<td rowspan="2" align="left">20</td>
<td align="center">1.09</td>
<td align="center">0.92</td>
<td align="center">0.85</td>
<td align="center">40.31</td>
<td align="center">31.08</td>
<td align="center">30.30</td>
<td align="center">211141</td>
<td align="center">110656</td>
<td align="center">93579</td>
</tr>
<tr>
<td align="center">(1.05&#x2013;1.20)</td>
<td align="center">(0.90&#x2013;0.93)</td>
<td align="center">(0.85&#x2013;0.86)</td>
<td align="center">(36.80&#x2013;43.63)</td>
<td align="center">(30.25&#x2013;31.76)</td>
<td align="center">(29.65&#x2013;30.95)</td>
<td align="center">(118860&#x2013;473551)</td>
<td align="center">(80809&#x2013;202068)</td>
<td align="center">(66942&#x2013;167227)</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Next, we evaluated the variable selection performance for ARZIMM, Poisson, MAR, and MDSINE in terms of true positive rate (TPR; mathematically equals to the power) and false positive rate (FPR; mathematically equals to the type I error). Specifically, TPR quantifies the probability of a significant interaction identified by one method given that the interaction effect is truly nonzero; and FPR quantifies the probability of a significant interaction identified by one method given that the interaction effect is truly zero. The simulation results for 50 subjects with 20&#x20;time points are summarized in <xref ref-type="fig" rid="F3">Figure&#x20;3</xref> and all the other simulation results with different subject numbers and time points are deferred to <xref ref-type="sec" rid="s10">Supplementary Figure S1</xref>, because they have a similar pattern as seen in <xref ref-type="fig" rid="F3">Figure&#x20;3</xref>. <xref ref-type="fig" rid="F3">Figure&#x20;3</xref> shows that the FPRs of ARZIMM are all at or below the nominal level (5%) across different simulation regimes and effect sizes, and its TPR estimates exhibit a sensible and consistent pattern as they increase as the interaction effect gets stronger across four scenarios. As expected, the FPR and TRP estimates of Poisson and ARZIMM models are coincident under Scenario 1, because when subjects are homogeneous and taxa don&#x2019;t have excess zeros, ARZIMM model is reduced to Poisson model. However, in Scenarios 2-4, because simple Poisson model fails to take care of the excess zeros or subject heterogeneity, it suffers from the inflated false positives, while ARZIMM does not. For the other two methods, both MAR and MDSINE perform poorly on controlling false positive rates for all simulation scenarios, because MAR fails to fit the skewed and highly sparse microbiome data, while MDSINE captures the interactions based on the averaged effect over subjects in a group but completely ignores the randomness at the subject level process which is the essential characteristic of any biological system. In summary, ARZIMM outperforms the other competitors in handling the excess zeros and subject heterogeneity well with controlled FPR and satisfactory&#x20;TPR.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Simulation results of variable selection performance. Poisson refers to the penalized Poisson auto-regression model and MAR refers to penalized log-normal multivariate auto-regression model. MDSINE refers to the method with extended generalized Lotka-Volterra (gLV) equations using a Bayesian algorithm. Mean (and 95% confidence interval) of false positive and true positive rates are reported for 500 simulations with 50 subjects and 20&#x20;time points in four scenario: <bold>(A)</bold> no zero-inflated structure and no heterogeneity, <bold>(B)</bold> heterogeneity but no zero-inflated structure, <bold>(C)</bold> zero-inflated structure but no heterogeneity, and <bold>(D)</bold> both zero-inflated structure and heterogeneity.</p>
</caption>
<graphic xlink:href="fgene-13-777877-g003.tif"/>
</fig>
<p>To further investigate the performance of informative interaction selection, we calculate Matthew correlation coefficient (MCC), defined as <inline-formula id="inf147">
<mml:math id="m155">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula>, and F-score, defined as <inline-formula id="inf148">
<mml:math id="m156">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>/</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula>, where TP gives the number of selected interactions being true positive, FP gives the number of selected interactions being false positive, TN gives the number of unselected interactions being true negative, and FN gives the number of selected interactions being false negative. MCC ranges from <inline-formula id="inf149">
<mml:math id="m157">
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> to <inline-formula id="inf150">
<mml:math id="m158">
<mml:mn>1</mml:mn>
</mml:math>
</inline-formula>, where value <inline-formula id="inf151">
<mml:math id="m159">
<mml:mn>1</mml:mn>
</mml:math>
</inline-formula> indicates perfect agreement between truth and selection, value <inline-formula id="inf152">
<mml:math id="m160">
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> indicates perfect disagreement, and value 0 indicates that the selection is random with respect to the truth. F-score ranges from <inline-formula id="inf153">
<mml:math id="m161">
<mml:mn>0</mml:mn>
</mml:math>
</inline-formula> to <inline-formula id="inf154">
<mml:math id="m162">
<mml:mn>1</mml:mn>
</mml:math>
</inline-formula>, where value <inline-formula id="inf155">
<mml:math id="m163">
<mml:mn>1</mml:mn>
</mml:math>
</inline-formula> indicates that there are neither false negatives nor false positives and value 0 only indicates no true positives are reported. As expected, MCC and F score are comparable to each other and increase as effect size increases (<xref ref-type="sec" rid="s10">Supplementary Figure S2</xref>). This consistent pattern is observed across four scenarios for ARZIMM but not for Poisson nor MAR models. Similar to TPR and FPR estimates, the MCC and F score values of Poisson and ARZIMM models are coincident under Scenario 1. However, in other situations, both Poisson and MAR perform poorly with low MCC and F score values.</p>
<p>As for the computational cost, ARIZMM took about 2.4&#xa0;h to complete the estimation and bootstrap inference for a simulated dataset with 50 subjects, 20 timepoints, and 20&#x20;taxa.</p>
</sec>
</sec>
<sec id="s3-2">
<title>Real Data Application</title>
<p>We applied ARZIMM methods to the MIME study. The MIME study is an ongoing randomized trial on 80 healthy volunteers with one control group (ctrl) and two antibiotic groups (amoxicillin, amx, and azithromycin, azm); antibiotics are provided for a 1-week period at the start of the trial. The main microbiome research goal of the MIME study is to evaluate the effects of antibiotics on microbial profiles at both the community and taxonomical levels. With ARIZMM, we propose a different perspective to evaluate the effect of antibiotics through the investigation of microbial interaction and community stability across groups. Because the clinical trial is still ongoing and only partial data are available, the following data analysis is done on a subset of MIME data including only 11 subjects who were randomized to two groups: 4 ctrls and 7 azms. The main purpose of this analysis is to illustrate how to use ARIZMM, not for the scientific conclusion. For each subject, we collected two baseline microbiome samples, three samples during the course of antibiotics, and five post-antibiotic samples. The gut microbiota of these individuals were profiled using 16S rRNA gene targeted sequencing on the Illumina MiSeq platform. To obtain the microbial absolute abundances, we multiplied the relative abundances of OTUs by the sample density 1.1&#xa0;g/cm<sup>3</sup> and the number of universal 16S rRNA per gram measured using qPCR (<xref ref-type="bibr" rid="B42">Stein et&#x20;al., 2013a</xref>). In our analysis, samples that collected before treatment in both antibiotic groups were excluded. The abundances of taxa were agglomerated at the genus level and taxa were further filtered if 1) the average relative abundances over all samples are less than 0.1%, and 2) the taxa are presented in less than 5 samples within each&#x20;group.</p>
<p>First, <xref ref-type="fig" rid="F4">Figure&#x20;4A</xref> shows a comparison of the relative abundance (top panel) and the absolute abundances determined by quantitative sequencing (bottom panel) of the dominant bacterial genera in 99 fecal samples from 11 subjects (blocks) across seven to nine time points (shown from left to right within each block) of this preliminary dataset. It is evident that the relative abundance and absolute abundance data present different information about the microbial profiles, and that the total bacterial load changes over time for each subject (i.e.,&#x20;within each block). Thus it is essential to study the microbial interactions using the absolute abundance&#x20;data.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>MIME study microbiome data. <bold>(A)</bold> Difference between relative abundances (top panel) and absolute abundances based on qPCR (bottom panel) of dominant genera in XX fecal samples obtained from 21 subjects (block) at 7&#x2013;9&#x20;time points (<italic>x</italic>-axis) each. <bold>(B)</bold> Distribution of absolute abundances of two representative genera from the MIME study, shown in the left and right panels, respectively. For each genus, the absolute abundance is fitted with a log-normal distribution (red line) or a two-part distribution: a zero part (dark green line shown in right panel) and a non-zero part fitted with an over-dispersion Poisson distribution (blue line).</p>
</caption>
<graphic xlink:href="fgene-13-777877-g004.tif"/>
</fig>
<p>Then, we evaluate the model fitting of the log-normal distribution [used in MAR(1)] and zero-inflated over-dispersed Poisson distribution (used in ARZIMM) on the available subset of MIME data using chi-square goodness of fit test at 5% significance level taxon by taxon. Out of 45 taxa in the control group, 1 and 44 of their absolute abundances were fitted well (<italic>p</italic>&#x20;&#x3e; 0.05) by log-normal distribution and zero-inflated over-dispersed Poisson distribution respectively. The log-normal distribution fails to fit the data well when microbial taxa&#x2019;s absolute abundance data are left-skewed and sparse (two examples are illustrated in <xref ref-type="fig" rid="F4">Figure&#x20;4B</xref>).</p>
<p>Next we demonstrate how to conduct inference for microbial interactions and community stability with ARZIMM on MIME data. First, we fit ARZIMM to ctrl and azm groups separately, adjusting for age, gender, and BMI, to get their estimated interaction matrix <inline-formula id="inf156">
<mml:math id="m164">
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> s. <xref ref-type="table" rid="T2">Table&#x20;2</xref> reports the characteristics of microbial interaction matrix estimates <inline-formula id="inf157">
<mml:math id="m165">
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> s. Defining the interaction effect as informative if its <inline-formula id="inf158">
<mml:math id="m166">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> &#x2019;s 95% bootstrap confidence interval (based on 100 bootstrap samples) does not contain zero, we identified 125 and 105 informative interactions, respectively, in azm and ctrl groups. Their interaction effects are illustrated using networks in <xref ref-type="fig" rid="F5">Figure&#x20;5</xref>. With more informative interactions, the azm groups have bigger and more complex networks than the ctrl group (first row of <xref ref-type="fig" rid="F5">Figure&#x20;5</xref>), while the control group has more large estimated interaction effects than those in azm group as showed in <xref ref-type="table" rid="T2">Table&#x20;2</xref> and the last three rows of <xref ref-type="fig" rid="F5">Figure&#x20;5</xref>. This observation indicates that the antibiotic treatment reduce the strength of the interactions among the taxa and create more variations with more weak interactions among taxa, thus reduce its stability. In the last row of <xref ref-type="table" rid="T2">Table&#x20;2</xref>, based on our stability theory we report the stability properties of the studied microbial communities. The ctrl group has the lower estimates of maximum eigenvalue squared 0.11 comparing to the azm group&#x2019;s maximum eigenvalue squared 0.32, which indicates that the control microbial community is more stable than the antibiotic communities.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>The characteristics of networks.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Group description</th>
<th align="center">Azithromycin</th>
<th align="center">Control</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Sample size</td>
<td align="center">7</td>
<td align="center">4</td>
</tr>
<tr>
<td align="left">Number of time points</td>
<td align="center">9</td>
<td align="center">9</td>
</tr>
<tr>
<td align="left">Number of taxa</td>
<td align="center">49</td>
<td align="center">45</td>
</tr>
<tr>
<td align="left">Number of informative interactions</td>
<td align="center">125</td>
<td align="center">105</td>
</tr>
<tr>
<td align="left">Number of <inline-formula id="inf159">
<mml:math id="m167">
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>0.1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">73</td>
<td align="center">45</td>
</tr>
<tr>
<td align="left">Number of <inline-formula id="inf160">
<mml:math id="m168">
<mml:mrow>
<mml:mn>0.1</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mo>&#x3c;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.25</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">30</td>
<td align="center">29</td>
</tr>
<tr>
<td align="left">Number of <inline-formula id="inf161">
<mml:math id="m169">
<mml:mrow>
<mml:mn>0.25</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mo>&#x3c;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.5</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">17</td>
<td align="center">14</td>
</tr>
<tr>
<td align="left">Number of <inline-formula id="inf162">
<mml:math id="m170">
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mo>&#x2265;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mn>0.5</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">5</td>
<td align="center">17</td>
</tr>
<tr>
<td align="left">Informative interaction percentage (<inline-formula id="inf163">
<mml:math id="m171">
<mml:mo>%</mml:mo>
</mml:math>
</inline-formula>)</td>
<td align="center">5.21</td>
<td align="center">5.19</td>
</tr>
<tr>
<td align="left">Maximum eigenvalue squared</td>
<td align="center">0.32</td>
<td align="center">0.11</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Interaction network. Estimated interaction network for: <bold>(A)</bold> azithromycin (azm), and <bold>(B)</bold> control groups, displaying <bold>(1)</bold> all selected interactions, <bold>(2)</bold> interactions with <inline-formula id="inf164">
<mml:math id="m172">
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>0.1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, <bold>(3)</bold> interactions with <inline-formula id="inf165">
<mml:math id="m173">
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>0.25</mml:mn>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> and <bold>(4)</bold> interactions with <inline-formula id="inf166">
<mml:math id="m174">
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>B</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x7c;</mml:mo>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>0.5</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. Each node represents a taxon at the genus level, the size of which shows the degree of that taxa and the color of which shows the phylogenetic Order level for each taxon. Each edge with arrow represents an interaction effect, the width of which represents the absolute effect size on a log<sub>10</sub> scale, with the color showing a positive (orange) or negative (blue) effect.</p>
</caption>
<graphic xlink:href="fgene-13-777877-g005.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="F6">Figure&#x20;6</xref> provides additional information on the network feature comparison between ctrl and azm groups. <xref ref-type="fig" rid="F6">Figure&#x20;6A</xref> displays the distribution of the positive and negative informative interaction estimates separately. The ratios between the numbers of positive and negative interactions are both around 1:1 in two groups. <xref ref-type="fig" rid="F6">Figure&#x20;6B</xref> presents the frequency distribution of vertex degree of all the taxa in each group and they are all skew to the right. In the figure, a vertex represents a taxon in a community and its vertex degree is the number of informative interaction effect it has with the other taxa. By defining average neighbor degree as the average number of a given taxon&#x2019;s neighbor vertices&#x2019; degrees, <xref ref-type="fig" rid="F6">Figure&#x20;6C</xref> shows that the average neighbor degree is negatively correlated with the vertex degree in azm antibiotic treated group, but not in the control group. This indicates that there may be a group of taxa interacting with each other actively in the antibiotic group. It would be interesting to identify such sub-community with additional effort.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Characteristics of estimated interactions. <bold>(A)</bold> The effect size of estimated informative interactions, wherein the <italic>x</italic>-axis represents the log<sub>10</sub> scaled absolute effect size, the <italic>y</italic>-axis represents the count of informative interactions, and the colors represent the positive or negative effects. <bold>(B)</bold> Histogram of vertex degree, wherein given a vertex, vertex degree is defined as the counts of edges upon the vertex. <bold>(C)</bold> The average neighbor degree (<italic>y</italic>-axis) versus vertex degree on a log-log scale (<italic>x</italic>-axis). The average neighbor degree is the average number of a given taxon&#x2019;s neighbor vertices&#x2019; degrees. Dotted lines represent 95% confidence limits.</p>
</caption>
<graphic xlink:href="fgene-13-777877-g006.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>In this paper, we propose ARZIMM, an analytic platform which estimates the microbial interactions and community stability using longitudinal microbiome data. ARZIMM tackles the zero-inflated absolute abundance with a mixture distribution of zero and exponential dispersion distribution family, and enhances statistical efficiency by utilizing a random-effects term to account for the correlations among repeated measurements.</p>
<p>It is well-known that microbial correlations calculated from relative abundances are distorted by the compositional nature of microbiome data, and are insufficient in tracking microbial dynamics(<xref ref-type="bibr" rid="B19">Gloor et&#x20;al., 2017</xref>). We advocate to investigate the microbial correlations using longitudinal absolute abundances which can be determined by combining gene amplicon sequencing with auxiliary total DNA quantitation data. qPCR is one of the most commonly used strategies to quantify total DNA (<xref ref-type="bibr" rid="B10">Dannemiller et&#x20;al., 2014</xref>) and has been implemented in various statistical analyses (<xref ref-type="bibr" rid="B43">Stein et&#x20;al., 2013b</xref>). Other alternative methods to quantify the absolute abundances include the combination of the sequencing approach (16S rRNA gene) with robust single-cell enumeration technologies (flow cytometry) (<xref ref-type="bibr" rid="B35">Props et&#x20;al., 2017</xref>) and the usage of synthetic chimeric DNA spikes (<xref ref-type="bibr" rid="B44">Tkacz et&#x20;al., 2018b</xref>).</p>
<p>Plenty of zero-inflated mixed effects models have been recently proposed to handle the excess zeros in microbiome abundance data such as zero-inflated Poisson, negative binomial and quasi-Poisson models(<xref ref-type="bibr" rid="B51">Xia et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B52">Zhang et&#x20;al., 2018</xref>). However, none of the existing methods estimates the microbial interactions and community stability. To fill this gap, we extended a zero-inflated Poisson model with auto-regression and random effects modeling, which plays crucial role in efficiently handling the individual heterogeneity and enable the investigation of microbial interactions.</p>
<p>We investigated two community stability measurements derived from ARZIMM: the return rate and reactivity, to further understand ecological dynamics. The estimated interaction matrix <inline-formula id="inf167">
<mml:math id="m175">
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:math>
</inline-formula> from the ARZIMM model serves the basis to calculate the largest eigenvalue of <inline-formula id="inf168">
<mml:math id="m176">
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:math>
</inline-formula>: <inline-formula id="inf169">
<mml:math id="m177">
<mml:mrow>
<mml:mtext>max</mml:mtext>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>&#x3bb;</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, which determines the return rate of the mean of the transition distribution from the departure to the mean of the stationary distribution. We proposed to measure the reactivity of a microbial community by the expected change of the stationary distribution&#x2019;s mean in distance from one time point to the next time point. In ARZIMM, higher reactivity coincides with larger eigenvalues of <inline-formula id="inf170">
<mml:math id="m178">
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:math>
</inline-formula>, thus governed again by <inline-formula id="inf171">
<mml:math id="m179">
<mml:mrow>
<mml:mtext>max</mml:mtext>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>&#x3bb;</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. Other measures of community stability, such as variance of the stationary distribution (<xref ref-type="bibr" rid="B21">Ives et&#x20;al., 2003</xref>), warrant further investigations.</p>
<p>It is worth noting that by utilizing the ARZIMM model framework, the time-dependent perturbation (for instance, diet) can also be assessed flexibly in both the autoregressive part and the logistic part in the model. However, the stability based on the microbial interactions has to be interpreted with caution, since the mean of stationary distribution changes along with the time-dependent covariates.</p>
<p>We have demonstrated that ARZIMM outperforms the competing methods and exhibits its feasibility for examining microbial interactions and stability based on longitudinal microbial data. We applied our method to a real human microbiome study of antibiotic treatment and elucidated the microbial interaction network of bacteria from antibiotic and non-antibiotic groups separately. The application of ARZIMM to temporal microbiome data shows great promise. Still, the development of accurate predictive models will require further developments. For example, the method used here to infer microbial interactions may be expanded by adding functional information as well as phylogenetic information. Although this method is primarily developed for the gut microbiota, it may be potentially applied to longitudinal data from any ecological systems. Since interactions between members of microbial communities are primary driving forces for the long-term stability(<xref ref-type="bibr" rid="B36">Ratzke et&#x20;al., 2020</xref>), the corresponding stability properties will provide useful principles for community dynamics.</p>
<p>Note that the proposed ARIZMM assumes the probability of observing a zero count for a taxon is constant over time. The reason is two-fold. 1) One major goal of ARIZMM is to derive the inference on the stability of the microbial community over a certain period. With the constant probability of observing a zero count assumption, the stability inference will solely depend on the estimation of the taxon-by-taxon interaction matrix <bold>
<italic>B</italic>
</bold>. Otherwise, a stationary distribution will not exit. 2) Using the MIME data, we estimated the proportions of zeros (denoted as <inline-formula id="inf172">
<mml:math id="m180">
<mml:mrow>
<mml:msub>
<mml:mi>q</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> for all taxa by group at all time points, then calculated the mean(<inline-formula id="inf173">
<mml:math id="m181">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>q</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo stretchy="true">&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> and standard deviation (<inline-formula id="inf174">
<mml:math id="m182">
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>q</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> over all the time points and the coefficient of variation ( <inline-formula id="inf175">
<mml:math id="m183">
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>q</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>/</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>q</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo stretchy="true">&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mi>M</mml:mi>
<mml:mo>)</mml:mo>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> to evaluate their temporal variations. The median of <inline-formula id="inf176">
<mml:math id="m184">
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> over all taxa in the control, Amoxicillin and Azithromycin groups are 0.16, 0.12, and 0.34 respectively. This results reveal two observations: 1) the temporal variations of <inline-formula id="inf177">
<mml:math id="m185">
<mml:mrow>
<mml:msub>
<mml:mi>q</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> in most taxa are relative weak; and 2) the temporal variation of the proportions of zero is heterogeneous and there may be no one perfect model fitting all the taxa well. Thus, we believe our assumption that <inline-formula id="inf178">
<mml:math id="m186">
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is constant over time is valid and pragmatic. To further check the robustness of our proposed model, we conducted additional simulation by introducing extra randomness when we generate the probability of observing a zero count across the time points, while analyze the data using our proposed model. Our results show that the moderate temporal variation in probability of zero count does not affect ARIZMM&#x2019;s performance much in capturing the informative interactions by estimating <bold>
<italic>B</italic>
</bold> when the absolute effect strengths of interaction matrices is high or medium. The detailed simulation design and results are reported in the <xref ref-type="sec" rid="s10">Supplementary Material Section S4.2</xref> and <xref ref-type="sec" rid="s10">Supplementary Figure&#x20;S3</xref>.</p>
<p>The proposed method, ARZIMM has a few limitations and future works are needed to improve it. ARZIMM adopts a simple correlation structure that the random effects in the multivariate logistic component and the multivariate autoregressive component <inline-formula id="inf179">
<mml:math id="m187">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">a</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf180">
<mml:math id="m188">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> are assumed independent. We took this parsimonious model based on our experience(<xref ref-type="bibr" rid="B20">Hu, 2021</xref>; <xref ref-type="bibr" rid="B49">Wang, 2021</xref>) in modeling the longitudinal microbiome data to ease the computational burden. The more general random effects structure with cross-part correlations can provide more robust modeling, however, can suffer from model convergence as well. Further investigation is warranted.</p>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The data analyzed in this study is subject to the following licenses/restrictions: The motivating study is still ongoing. After it is closed, it will be uploaded to the public repository. Requests to access these datasets should be directed to <email>martin.blaser@cabm.rutgers.edu</email>.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>LH and HL developed the methodological ideas. LH implemented the methods, performed the simulations and real data analysis, and developed the software package. CW and JH contributed to the simulation design and real data analysis. ZG, EF, SH, and MB contributed to the acquisition of utilized real microbiome data. MB provided biological insights and interpretation of the real data analysis. LH and HL wrote the manuscript. All authors read, edited, and approved the final manuscript.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This work was supported in part by National Institutes of Health grants R01DK110014, P20CA252728, and U01AI22285.</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>LH was employed by the company Novartis Pharmaceuticals Corporation.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2022.777877/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2022.777877/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bucci</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Tzen</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Simmons</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tanoue</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Bogart</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>MDSINE: Microbial Dynamical Systems INference Engine for Microbiome Time-Series Analyses</article-title>. <source>Genome Biol.</source> <volume>17</volume> (<issue>1</issue>), <fpage>121</fpage>&#x2013;<lpage>217</lpage>. <pub-id pub-id-type="doi">10.1186/s13059-016-0980-6</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bucci</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Tzen</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Simmons</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tanoue</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Bogart</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>MDSINE: Microbial Dynamical Systems INference Engine for Microbiome Time-Series Analyses</article-title>. <source>Genome Biol.</source> <volume>17</volume> (<issue>1</issue>), <fpage>121</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-016-0980-6</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carpenter</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Cole</surname>
<given-names>J.&#x20;J.</given-names>
</name>
<name>
<surname>Pace</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Batt</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Brock</surname>
<given-names>W. A.</given-names>
</name>
<name>
<surname>Cline</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Early Warnings of Regime Shifts: a Whole-Ecosystem experiment</article-title>. <source>Science</source> <volume>332</volume> (<issue>6033</issue>), <fpage>1079</fpage>&#x2013;<lpage>1082</lpage>. <pub-id pub-id-type="doi">10.1126/science.1203672</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carroll</surname>
<given-names>I. M.</given-names>
</name>
<name>
<surname>Ringel-Kulka</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Siddle</surname>
<given-names>J.&#x20;P.</given-names>
</name>
<name>
<surname>Ringel</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Alterations in Composition and Diversity of the Intestinal Microbiota in Patients with Diarrhea-Predominant Irritable Bowel Syndrome</article-title>. <source>Neurogastroenterology Motil.</source> <volume>24</volume> (<issue>6</issue>), <fpage>521</fpage>&#x2013;<lpage>e248</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2982.2012.01891.x</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carroll</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Cressie</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>Spatial Modeling of Snow Water Equivalent Using Covariances Estimated from Spatial and Geomorphic Attributes</article-title>. <source>J.&#x20;Hydrol.</source> <volume>190</volume> (<issue>1-2</issue>), <fpage>42</fpage>&#x2013;<lpage>59</lpage>. <pub-id pub-id-type="doi">10.1016/s0022-1694(96)03062-4</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chamberlain</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>1982</year>). <article-title>Multivariate Regression Models for Panel Data</article-title>. <source>J.&#x20;Econom.</source> <volume>18</volume> (<issue>1</issue>), <fpage>5</fpage>&#x2013;<lpage>46</lpage>. <pub-id pub-id-type="doi">10.1016/0304-4076(82)90094-x</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Claesson</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Jeffery</surname>
<given-names>I. B.</given-names>
</name>
<name>
<surname>Conde</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Power</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>O&#x2019;Connor</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Cusack</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Gut Microbiota Composition Correlates with Diet and Health in the Elderly</article-title>. <source>Nature</source> <volume>488</volume> (<issue>7410</issue>), <fpage>178</fpage>&#x2013;<lpage>184</lpage>. <pub-id pub-id-type="doi">10.1038/nature11319</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Czado</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Gneiting</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Held</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Predictive Model Assessment for Count Data</article-title>. <source>Biometrics</source> <volume>65</volume> (<issue>4</issue>), <fpage>1254</fpage>&#x2013;<lpage>1261</lpage>. <pub-id pub-id-type="doi">10.1111/j.1541-0420.2009.01191.x</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dam</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Fonseca</surname>
<given-names>L. L.</given-names>
</name>
<name>
<surname>Konstantinidis</surname>
<given-names>K. T.</given-names>
</name>
<name>
<surname>Voit</surname>
<given-names>E. O.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Dynamic Models of the Complex Microbial Metapopulation of lake mendota</article-title>. <source>NPJ&#x20;Syst. Biol. Appl.</source> <volume>2</volume> (<issue>1</issue>), <fpage>16007</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1038/npjsba.2016.7</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dannemiller</surname>
<given-names>K. C.</given-names>
</name>
<name>
<surname>Lang-Yona</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Yamamoto</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Rudich</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Peccia</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Combining Real-Time PCR and Next-Generation DNA Sequencing to Provide Quantitative Comparisons of Fungal Aerosol Populations</article-title>. <source>Atmos. Environ.</source> <volume>84</volume>, <fpage>113</fpage>&#x2013;<lpage>121</lpage>. <pub-id pub-id-type="doi">10.1016/j.atmosenv.2013.11.036</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>de Vos</surname>
<given-names>M. G. J.</given-names>
</name>
<name>
<surname>Zagorski</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>McNally</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bollenbach</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Interaction Networks, Ecological Stability, and Collective Antibiotic Tolerance in Polymicrobial Infections</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>114</volume> (<issue>40</issue>), <fpage>10666</fpage>&#x2013;<lpage>10671</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1713372114</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Douc</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Doukhan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Moulines</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Ergodicity of Observation-Driven Time Series Models and Consistency of the Maximum Likelihood Estimator</article-title>. <source>Stochastic Process. their Appl.</source> <volume>123</volume> (<issue>7</issue>), <fpage>2620</fpage>&#x2013;<lpage>2647</lpage>. <pub-id pub-id-type="doi">10.1016/j.spa.2013.04.010</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Faith</surname>
<given-names>J.&#x20;J.</given-names>
</name>
<name>
<surname>Guruge</surname>
<given-names>J.&#x20;L.</given-names>
</name>
<name>
<surname>Charbonneau</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Subramanian</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Seedorf</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Goodman</surname>
<given-names>A. L.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>The Long-Term Stability of the Human Gut Microbiota</article-title>. <source>Science</source> <volume>341</volume> (<issue>6141</issue>), <fpage>1237439</fpage>. <pub-id pub-id-type="doi">10.1126/science.1237439</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Faust</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Raes</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Microbial Interactions: from Networks to Models</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>10</volume> (<issue>8</issue>), <fpage>538</fpage>&#x2013;<lpage>550</lpage>. <pub-id pub-id-type="doi">10.1038/nrmicro2832</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fisher</surname>
<given-names>C. K.</given-names>
</name>
<name>
<surname>Mehta</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Identifying keystone Species in the Human Gut Microbiome from Metagenomic Timeseries Using Sparse Linear Regression</article-title>. <source>PloS one</source> <volume>9</volume> (<issue>7</issue>), <fpage>e102451</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0102451</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fokianos</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Tj&#xf8;stheim</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Log-linear Poisson Autoregression</article-title>. <source>J.&#x20;Multivariate Anal.</source> <volume>102</volume> (<issue>3</issue>), <fpage>563</fpage>&#x2013;<lpage>578</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmva.2010.11.002</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gerber</surname>
<given-names>G. K.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>The Dynamic Microbiome</article-title>. <source>FEBS Lett.</source> <volume>588</volume> (<issue>22</issue>), <fpage>4131</fpage>&#x2013;<lpage>4139</lpage>. <pub-id pub-id-type="doi">10.1016/j.febslet.2014.02.037</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gilbert</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Blaser</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Caporaso</surname>
<given-names>J.&#x20;G.</given-names>
</name>
<name>
<surname>Jansson</surname>
<given-names>J.&#x20;K.</given-names>
</name>
<name>
<surname>Lynch</surname>
<given-names>S. V.</given-names>
</name>
<name>
<surname>Knight</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Current Understanding of the Human Microbiome</article-title>. <source>Nat. Med.</source> <volume>24</volume> (<issue>4</issue>), <fpage>392</fpage>&#x2013;<lpage>400</lpage>. <pub-id pub-id-type="doi">10.1038/nm.4517</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gloor</surname>
<given-names>G. B.</given-names>
</name>
<name>
<surname>Macklaim</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Pawlowsky-Glahn</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Egozcue</surname>
<given-names>J.&#x20;J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Microbiome Datasets Are Compositional: And This Is Not Optional</article-title>. <source>Front. Microbiol.</source> <volume>8</volume>, <fpage>2224</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2017.02224</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Joint Modeling of Zero-Inflated Longitudinal Proportions and Time-To-Event Data with Application to a Gut Microbiome Study</article-title>. <source>Biometrics</source> <volume>2</volume>, <fpage>2020</fpage>. <pub-id pub-id-type="doi">10.1111/biom.13515</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ives</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Dennis</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Cottingham</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>Carpenter</surname>
<given-names>S. R.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Estimating Community Stability and Ecological Interactions from Time-Series Data</article-title>. <source>Ecol. Monogr.</source> <volume>73</volume> (<issue>2</issue>), <fpage>301</fpage>&#x2013;<lpage>330</lpage>. <pub-id pub-id-type="doi">10.1890/0012-9615(2003)073[0301:ecsaei]2.0.co;2</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ives</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Klug</surname>
<given-names>J.&#x20;L.</given-names>
</name>
<name>
<surname>Gross</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Stability and Species Richness in Complex Communities</article-title>. <source>Ecol. Lett.</source> <volume>3</volume> (<issue>5</issue>), <fpage>399</fpage>&#x2013;<lpage>411</lpage>. <pub-id pub-id-type="doi">10.1046/j.1461-0248.2000.00144.x</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jackson</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Jeffery</surname>
<given-names>I. B.</given-names>
</name>
<name>
<surname>Beaumont</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bell</surname>
<given-names>J.&#x20;T.</given-names>
</name>
<name>
<surname>Clark</surname>
<given-names>A. G.</given-names>
</name>
<name>
<surname>Ley</surname>
<given-names>R. E.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Signatures of Early Frailty in the Gut Microbiota</article-title>. <source>Genome Med.</source> <volume>8</volume> (<issue>1</issue>), <fpage>8</fpage>. <pub-id pub-id-type="doi">10.1186/s13073-016-0262-7</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lim</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Quantitative Real-Time PCR Approaches for Microbial Community Studies in Wastewater Treatment Systems: Applications and Considerations</article-title>. <source>Biotechnol. Adv.</source> <volume>31</volume> (<issue>8</issue>), <fpage>1358</fpage>&#x2013;<lpage>1373</lpage>. <pub-id pub-id-type="doi">10.1016/j.biotechadv.2013.05.010</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Knight</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Vrbanac</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Taylor</surname>
<given-names>B. C.</given-names>
</name>
<name>
<surname>Aksenov</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Callewaert</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Debelius</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Best Practices for Analysing Microbiomes</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>16</volume> (<issue>7</issue>), <fpage>410</fpage>&#x2013;<lpage>422</lpage>. <pub-id pub-id-type="doi">10.1038/s41579-018-0029-9</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liesenfeld</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Nolte</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Pohlmeier</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Modelling Financial Transaction price Movements: a Dynamic Integer Count Data Model</article-title>. <source>Empirical Econ.</source> <volume>30</volume> (<issue>4</issue>), <fpage>795</fpage>&#x2013;<lpage>825</lpage>. <pub-id pub-id-type="doi">10.1007/s00181-005-0001-1</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lugo-Martinez</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ruiz-Perez</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Narasimhan</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Bar-Joseph</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Dynamic Interaction Network Inference from Longitudinal Microbiome Data</article-title>. <source>Microbiome</source> <volume>7</volume> (<issue>1</issue>), <fpage>54</fpage>&#x2013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1186/s40168-019-0660-3</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marino</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Baxter</surname>
<given-names>N. T.</given-names>
</name>
<name>
<surname>Huffnagle</surname>
<given-names>G. B.</given-names>
</name>
<name>
<surname>Petrosino</surname>
<given-names>J.&#x20;F.</given-names>
</name>
<name>
<surname>Schloss</surname>
<given-names>P. D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Mathematical Modeling of Primary Succession of Murine Intestinal Microbiota</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>111</volume> (<issue>1</issue>), <fpage>439</fpage>&#x2013;<lpage>444</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1311322111</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martinez</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Antolin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Santos</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Torrejon</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Casellas</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Borruel</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2008</year>). <article-title>Unstable Composition of the Fecal Microbiota in Ulcerative Colitis during Clinical Remission</article-title>. <source>Am. J.&#x20;Gastroenterol.</source> <volume>103</volume> (<issue>3</issue>), <fpage>643</fpage>&#x2013;<lpage>648</lpage>. <pub-id pub-id-type="doi">10.1111/j.1572-0241.2007.01592.x</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maukonen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Satokari</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>M&#xe4;tt&#xf6;</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>S&#xf6;derlund</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Mattila-Sandholm</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Saarela</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Prevalence and Temporal Stability of Selected Clostridial Groups in Irritable Bowel Syndrome in Relation to Predominant Faecal Bacteria</article-title>. <source>J.&#x20;Med. Microbiol.</source> <volume>55</volume> (<issue>5</issue>), <fpage>625</fpage>&#x2013;<lpage>633</lpage>. <pub-id pub-id-type="doi">10.1099/jmm.0.46134-0</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McGeachie</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Longitudinal Prediction of the Infant Gut Microbiome with Dynamic Bayesian Networks</article-title>. <source>Scientific Rep.</source> <volume>6</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1038/srep20359</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mounier</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Monnet</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Jacques</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Antoinette</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Irlinger</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Assessment of the Microbial Diversity at the Surface of Livarot Cheese Using Culture-dependent and Independent Approaches</article-title>. <source>Int. J.&#x20;Food Microbiol.</source> <volume>133</volume> (<issue>1-2</issue>), <fpage>31</fpage>&#x2013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijfoodmicro.2009.04.020</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nadkarni</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Martin</surname>
<given-names>F. E.</given-names>
</name>
<name>
<surname>Jacques</surname>
<given-names>N. A.</given-names>
</name>
<name>
<surname>Hunter</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Determination of Bacterial Load by Real-Time PCR Using a Broad-Range (Universal) Probe and Primers Set</article-title>. <source>Microbiology (Reading)</source> <volume>148</volume> (<issue>Pt 1</issue>), <fpage>257</fpage>&#x2013;<lpage>266</lpage>. <pub-id pub-id-type="doi">10.1099/00221287-148-1-257</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ott</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Musfeldt</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ullmann</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Hampe</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Schreiber</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Quantification of Intestinal Bacterial Populations by Real-Time PCR with a Universal Primer Set and Minor Groove Binder Probes: a Global Approach to the Enteric flora</article-title>. <source>J.&#x20;Clin. Microbiol.</source> <volume>42</volume> (<issue>6</issue>), <fpage>2566</fpage>&#x2013;<lpage>2572</lpage>. <pub-id pub-id-type="doi">10.1128/jcm.42.6.2566-2572.2004</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Props</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kerckhof</surname>
<given-names>F.-M.</given-names>
</name>
<name>
<surname>Rubbens</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>De Vrieze</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hernandez Sanabria</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Waegeman</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Absolute Quantification of Microbial Taxon Abundances</article-title>. <source>Isme J.</source> <volume>11</volume> (<issue>2</issue>), <fpage>584</fpage>&#x2013;<lpage>587</lpage>. <pub-id pub-id-type="doi">10.1038/ismej.2016.117</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ratzke</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Barrere</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gore</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>) <article-title>Strength of Species Interactions Determines Biodiversity and Stability in Microbial Communities</article-title>
<italic>.</italic> <source>Nat. Ecol. Evol.</source> <volume>4</volume>, <fpage>376</fpage>&#x2013;<lpage>383</lpage>. <pub-id pub-id-type="doi">10.1038/s41559-020-1099-4</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Russell</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Norvig</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2002</year>). <source>Artificial Intelligence: A Modern Approach</source>. <publisher-loc>Englewood Cliffs, NJ</publisher-loc>: <publisher-name>University of California at Berkeley</publisher-name>. </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scanlan</surname>
<given-names>P. D.</given-names>
</name>
<name>
<surname>Shanahan</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Clune</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Collins</surname>
<given-names>J.&#x20;K.</given-names>
</name>
<name>
<surname>O&#x27;Sullivan</surname>
<given-names>G. C.</given-names>
</name>
<name>
<surname>O&#x27;Riordan</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2008</year>). <article-title>Culture-independent Analysis of the Gut Microbiota in Colorectal Cancer and Polyposis</article-title>. <source>Environ. Microbiol.</source> <volume>10</volume> (<issue>3</issue>), <fpage>789</fpage>&#x2013;<lpage>798</lpage>. <pub-id pub-id-type="doi">10.1111/j.1462-2920.2007.01503.x</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shade</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gregory Caporaso</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Handelsman</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Knight</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Fierer</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>A Meta-Analysis of Changes in Bacterial and Archaeal Communities with Time</article-title>. <source>Isme J.</source> <volume>7</volume> (<issue>8</issue>), <fpage>1493</fpage>&#x2013;<lpage>1506</lpage>. <pub-id pub-id-type="doi">10.1038/ismej.2013.54</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shankar</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Insights into Study Design and Statistical Analyses in Translational Microbiome Studies</article-title>. <source>Ann. Transl. Med.</source> <volume>5</volume> (<issue>12</issue>), <fpage>249</fpage>. <pub-id pub-id-type="doi">10.21037/atm.2017.01.13</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shaw</surname>
<given-names>G. T.</given-names>
</name>
<name>
<surname>Pao</surname>
<given-names>Y. Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>MetaMIS: a Metagenomic Microbial Interaction Simulator Based on Microbial Community Profiles</article-title>. <source>BMC bioinformatics</source> <volume>17</volume> (<issue>1</issue>), <fpage>488</fpage>&#x2013;<lpage>512</lpage>. <pub-id pub-id-type="doi">10.1186/s12859-016-1359-0</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stein</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Bucci</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Toussaint</surname>
<given-names>N. C.</given-names>
</name>
<name>
<surname>Buffie</surname>
<given-names>C. G.</given-names>
</name>
<name>
<surname>R&#xe4;tsch</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Pamer</surname>
<given-names>E. G.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Ecological Modeling from Time-Series Inference: Insight into Dynamics and Stability of Intestinal Microbiota</article-title>. <source>Plos Comput. Biol.</source> <volume>9</volume> (<issue>12</issue>), <fpage>e1003388</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1003388</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stein</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Bucci</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Toussaint</surname>
<given-names>N. C.</given-names>
</name>
<name>
<surname>Buffie</surname>
<given-names>C. G.</given-names>
</name>
<name>
<surname>R&#xe4;tsch</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Pamer</surname>
<given-names>E. G.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Ecological Modeling from Time-Series Inference: Insight into Dynamics and Stability of Intestinal Microbiota</article-title>. <source>Plos Comput. Biol.</source> <volume>9</volume> (<issue>12</issue>), <fpage>e1003388</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1003388</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tkacz</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hortala</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Poole</surname>
<given-names>P. S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Absolute Quantitation of Microbiota Abundance in Environmental Samples</article-title>. <source>Microbiome</source> <volume>6</volume> (<issue>1</issue>), <fpage>110</fpage>&#x2013;<lpage>113</lpage>. <pub-id pub-id-type="doi">10.1186/s40168-018-0491-7</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tkacz</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hortala</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Poole</surname>
<given-names>P. S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Absolute Quantitation of Microbiota Abundance in Environmental Samples</article-title>. <source>Microbiome</source> <volume>6</volume> (<issue>1</issue>), <fpage>110</fpage>. <pub-id pub-id-type="doi">10.1186/s40168-018-0491-7</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Uronis</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>M&#xfc;hlbauer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Herfarth</surname>
<given-names>H. H.</given-names>
</name>
<name>
<surname>Rubinas</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Jones</surname>
<given-names>G. S.</given-names>
</name>
<name>
<surname>Jobin</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Modulation of the Intestinal Microbiota Alters Colitis-Associated Colorectal Cancer Susceptibility</article-title>. <source>PloS one</source> <volume>4</volume> (<issue>6</issue>), <fpage>e6026</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0006026</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Venturelli</surname>
<given-names>O. S.</given-names>
</name>
<name>
<surname>Carr</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Fisher</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Hsu</surname>
<given-names>R. H.</given-names>
</name>
<name>
<surname>Lau</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bowen</surname>
<given-names>B. P.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Deciphering Microbial Interactions in Synthetic Human Gut Microbiome Communities</article-title>. <source>Mol. Syst. Biol.</source> <volume>14</volume> (<issue>6</issue>), <fpage>e8157</fpage>. <pub-id pub-id-type="doi">10.15252/msb.20178157</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ver Hoef</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Boveng</surname>
<given-names>P. L.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Quasi-Poisson vs. Negative Binomial Regression: How Should We Model Overdispersed Count Data</article-title>. <source>Ecology</source> <volume>88</volume> (<issue>11</issue>), <fpage>2766</fpage>&#x2013;<lpage>2772</lpage>. <pub-id pub-id-type="doi">10.1890/07-0043.1</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Microbial Trend Analysis for Common Dynamic Trend, Group Comparison and Classification in Longitudinal Microbiome Study</article-title>. <source>BMC Genomics</source> <volume>15</volume>, <fpage>667</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-021-07948-w</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Woo</surname>
<given-names>P. C. Y.</given-names>
</name>
<name>
<surname>Lau</surname>
<given-names>S. K. P.</given-names>
</name>
<name>
<surname>Teng</surname>
<given-names>J.&#x20;L. L.</given-names>
</name>
<name>
<surname>Tse</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yuen</surname>
<given-names>K.-Y.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Then and Now: Use of 16S rDNA Gene Sequencing for Bacterial Identification and Discovery of Novel Bacteria in Clinical Microbiology Laboratories</article-title>. <source>Clin. Microbiol. Infect.</source> <volume>14</volume> (<issue>10</issue>), <fpage>908</fpage>&#x2013;<lpage>934</lpage>. <pub-id pub-id-type="doi">10.1111/j.1469-0691.2008.02070.x</pub-id> </citation>
</ref>
<ref id="B51">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Xia</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>D.-G.</given-names>
</name>
</person-group> (<year>2018</year>). <source>Statistical Analysis of Microbiome Data with R</source>, <volume>847</volume>. <publisher-name>Springer</publisher-name>. </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pei</surname>
<given-names>Y.-F.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Pendegraft</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Zhuang</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Negative Binomial Mixed Models for Analyzing Longitudinal Microbiome Data</article-title>. <source>Front. Microbiol.</source> <volume>9</volume>, <fpage>1683</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2018.01683</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zuo</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>S. C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>The Gut Microbiota in the Pathogenesis and Therapeutics of Inflammatory Bowel Disease</article-title>. <source>Front. Microbiol.</source> <volume>9</volume>, <fpage>2247</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2018.02247</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>
